proc: consolidate per-net single_open callers
[linux-2.6] / net / ipv6 / tcp_ipv6.c
1 /*
2  *      TCP over IPv6
3  *      Linux INET6 implementation
4  *
5  *      Authors:
6  *      Pedro Roque             <roque@di.fc.ul.pt>
7  *
8  *      Based on:
9  *      linux/net/ipv4/tcp.c
10  *      linux/net/ipv4/tcp_input.c
11  *      linux/net/ipv4/tcp_output.c
12  *
13  *      Fixes:
14  *      Hideaki YOSHIFUJI       :       sin6_scope_id support
15  *      YOSHIFUJI Hideaki @USAGI and:   Support IPV6_V6ONLY socket option, which
16  *      Alexey Kuznetsov                allow both IPv4 and IPv6 sockets to bind
17  *                                      a single port at the same time.
18  *      YOSHIFUJI Hideaki @USAGI:       convert /proc/net/tcp6 to seq_file.
19  *
20  *      This program is free software; you can redistribute it and/or
21  *      modify it under the terms of the GNU General Public License
22  *      as published by the Free Software Foundation; either version
23  *      2 of the License, or (at your option) any later version.
24  */
25
26 #include <linux/module.h>
27 #include <linux/errno.h>
28 #include <linux/types.h>
29 #include <linux/socket.h>
30 #include <linux/sockios.h>
31 #include <linux/net.h>
32 #include <linux/jiffies.h>
33 #include <linux/in.h>
34 #include <linux/in6.h>
35 #include <linux/netdevice.h>
36 #include <linux/init.h>
37 #include <linux/jhash.h>
38 #include <linux/ipsec.h>
39 #include <linux/times.h>
40
41 #include <linux/ipv6.h>
42 #include <linux/icmpv6.h>
43 #include <linux/random.h>
44
45 #include <net/tcp.h>
46 #include <net/ndisc.h>
47 #include <net/inet6_hashtables.h>
48 #include <net/inet6_connection_sock.h>
49 #include <net/ipv6.h>
50 #include <net/transp_v6.h>
51 #include <net/addrconf.h>
52 #include <net/ip6_route.h>
53 #include <net/ip6_checksum.h>
54 #include <net/inet_ecn.h>
55 #include <net/protocol.h>
56 #include <net/xfrm.h>
57 #include <net/snmp.h>
58 #include <net/dsfield.h>
59 #include <net/timewait_sock.h>
60 #include <net/netdma.h>
61 #include <net/inet_common.h>
62
63 #include <asm/uaccess.h>
64
65 #include <linux/proc_fs.h>
66 #include <linux/seq_file.h>
67
68 #include <linux/crypto.h>
69 #include <linux/scatterlist.h>
70
71 static void     tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
72 static void     tcp_v6_reqsk_send_ack(struct sk_buff *skb, struct request_sock *req);
73
74 static int      tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
75
76 static struct inet_connection_sock_af_ops ipv6_mapped;
77 static struct inet_connection_sock_af_ops ipv6_specific;
78 #ifdef CONFIG_TCP_MD5SIG
79 static struct tcp_sock_af_ops tcp_sock_ipv6_specific;
80 static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
81 #else
82 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
83                                                    struct in6_addr *addr)
84 {
85         return NULL;
86 }
87 #endif
88
89 static void tcp_v6_hash(struct sock *sk)
90 {
91         if (sk->sk_state != TCP_CLOSE) {
92                 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
93                         tcp_prot.hash(sk);
94                         return;
95                 }
96                 local_bh_disable();
97                 __inet6_hash(sk);
98                 local_bh_enable();
99         }
100 }
101
102 static __inline__ __sum16 tcp_v6_check(struct tcphdr *th, int len,
103                                    struct in6_addr *saddr,
104                                    struct in6_addr *daddr,
105                                    __wsum base)
106 {
107         return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
108 }
109
110 static __u32 tcp_v6_init_sequence(struct sk_buff *skb)
111 {
112         return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
113                                             ipv6_hdr(skb)->saddr.s6_addr32,
114                                             tcp_hdr(skb)->dest,
115                                             tcp_hdr(skb)->source);
116 }
117
118 static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
119                           int addr_len)
120 {
121         struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
122         struct inet_sock *inet = inet_sk(sk);
123         struct inet_connection_sock *icsk = inet_csk(sk);
124         struct ipv6_pinfo *np = inet6_sk(sk);
125         struct tcp_sock *tp = tcp_sk(sk);
126         struct in6_addr *saddr = NULL, *final_p = NULL, final;
127         struct flowi fl;
128         struct dst_entry *dst;
129         int addr_type;
130         int err;
131
132         if (addr_len < SIN6_LEN_RFC2133)
133                 return -EINVAL;
134
135         if (usin->sin6_family != AF_INET6)
136                 return(-EAFNOSUPPORT);
137
138         memset(&fl, 0, sizeof(fl));
139
140         if (np->sndflow) {
141                 fl.fl6_flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
142                 IP6_ECN_flow_init(fl.fl6_flowlabel);
143                 if (fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) {
144                         struct ip6_flowlabel *flowlabel;
145                         flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
146                         if (flowlabel == NULL)
147                                 return -EINVAL;
148                         ipv6_addr_copy(&usin->sin6_addr, &flowlabel->dst);
149                         fl6_sock_release(flowlabel);
150                 }
151         }
152
153         /*
154          *      connect() to INADDR_ANY means loopback (BSD'ism).
155          */
156
157         if(ipv6_addr_any(&usin->sin6_addr))
158                 usin->sin6_addr.s6_addr[15] = 0x1;
159
160         addr_type = ipv6_addr_type(&usin->sin6_addr);
161
162         if(addr_type & IPV6_ADDR_MULTICAST)
163                 return -ENETUNREACH;
164
165         if (addr_type&IPV6_ADDR_LINKLOCAL) {
166                 if (addr_len >= sizeof(struct sockaddr_in6) &&
167                     usin->sin6_scope_id) {
168                         /* If interface is set while binding, indices
169                          * must coincide.
170                          */
171                         if (sk->sk_bound_dev_if &&
172                             sk->sk_bound_dev_if != usin->sin6_scope_id)
173                                 return -EINVAL;
174
175                         sk->sk_bound_dev_if = usin->sin6_scope_id;
176                 }
177
178                 /* Connect to link-local address requires an interface */
179                 if (!sk->sk_bound_dev_if)
180                         return -EINVAL;
181         }
182
183         if (tp->rx_opt.ts_recent_stamp &&
184             !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
185                 tp->rx_opt.ts_recent = 0;
186                 tp->rx_opt.ts_recent_stamp = 0;
187                 tp->write_seq = 0;
188         }
189
190         ipv6_addr_copy(&np->daddr, &usin->sin6_addr);
191         np->flow_label = fl.fl6_flowlabel;
192
193         /*
194          *      TCP over IPv4
195          */
196
197         if (addr_type == IPV6_ADDR_MAPPED) {
198                 u32 exthdrlen = icsk->icsk_ext_hdr_len;
199                 struct sockaddr_in sin;
200
201                 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
202
203                 if (__ipv6_only_sock(sk))
204                         return -ENETUNREACH;
205
206                 sin.sin_family = AF_INET;
207                 sin.sin_port = usin->sin6_port;
208                 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
209
210                 icsk->icsk_af_ops = &ipv6_mapped;
211                 sk->sk_backlog_rcv = tcp_v4_do_rcv;
212 #ifdef CONFIG_TCP_MD5SIG
213                 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
214 #endif
215
216                 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
217
218                 if (err) {
219                         icsk->icsk_ext_hdr_len = exthdrlen;
220                         icsk->icsk_af_ops = &ipv6_specific;
221                         sk->sk_backlog_rcv = tcp_v6_do_rcv;
222 #ifdef CONFIG_TCP_MD5SIG
223                         tp->af_specific = &tcp_sock_ipv6_specific;
224 #endif
225                         goto failure;
226                 } else {
227                         ipv6_addr_set(&np->saddr, 0, 0, htonl(0x0000FFFF),
228                                       inet->saddr);
229                         ipv6_addr_set(&np->rcv_saddr, 0, 0, htonl(0x0000FFFF),
230                                       inet->rcv_saddr);
231                 }
232
233                 return err;
234         }
235
236         if (!ipv6_addr_any(&np->rcv_saddr))
237                 saddr = &np->rcv_saddr;
238
239         fl.proto = IPPROTO_TCP;
240         ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
241         ipv6_addr_copy(&fl.fl6_src,
242                        (saddr ? saddr : &np->saddr));
243         fl.oif = sk->sk_bound_dev_if;
244         fl.fl_ip_dport = usin->sin6_port;
245         fl.fl_ip_sport = inet->sport;
246
247         if (np->opt && np->opt->srcrt) {
248                 struct rt0_hdr *rt0 = (struct rt0_hdr *)np->opt->srcrt;
249                 ipv6_addr_copy(&final, &fl.fl6_dst);
250                 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
251                 final_p = &final;
252         }
253
254         security_sk_classify_flow(sk, &fl);
255
256         err = ip6_dst_lookup(sk, &dst, &fl);
257         if (err)
258                 goto failure;
259         if (final_p)
260                 ipv6_addr_copy(&fl.fl6_dst, final_p);
261
262         if ((err = __xfrm_lookup(&dst, &fl, sk, XFRM_LOOKUP_WAIT)) < 0) {
263                 if (err == -EREMOTE)
264                         err = ip6_dst_blackhole(sk, &dst, &fl);
265                 if (err < 0)
266                         goto failure;
267         }
268
269         if (saddr == NULL) {
270                 saddr = &fl.fl6_src;
271                 ipv6_addr_copy(&np->rcv_saddr, saddr);
272         }
273
274         /* set the source address */
275         ipv6_addr_copy(&np->saddr, saddr);
276         inet->rcv_saddr = LOOPBACK4_IPV6;
277
278         sk->sk_gso_type = SKB_GSO_TCPV6;
279         __ip6_dst_store(sk, dst, NULL, NULL);
280
281         icsk->icsk_ext_hdr_len = 0;
282         if (np->opt)
283                 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
284                                           np->opt->opt_nflen);
285
286         tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
287
288         inet->dport = usin->sin6_port;
289
290         tcp_set_state(sk, TCP_SYN_SENT);
291         err = inet6_hash_connect(&tcp_death_row, sk);
292         if (err)
293                 goto late_failure;
294
295         if (!tp->write_seq)
296                 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
297                                                              np->daddr.s6_addr32,
298                                                              inet->sport,
299                                                              inet->dport);
300
301         err = tcp_connect(sk);
302         if (err)
303                 goto late_failure;
304
305         return 0;
306
307 late_failure:
308         tcp_set_state(sk, TCP_CLOSE);
309         __sk_dst_reset(sk);
310 failure:
311         inet->dport = 0;
312         sk->sk_route_caps = 0;
313         return err;
314 }
315
316 static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
317                 int type, int code, int offset, __be32 info)
318 {
319         struct ipv6hdr *hdr = (struct ipv6hdr*)skb->data;
320         const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
321         struct ipv6_pinfo *np;
322         struct sock *sk;
323         int err;
324         struct tcp_sock *tp;
325         __u32 seq;
326         struct net *net = dev_net(skb->dev);
327
328         sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
329                         th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
330
331         if (sk == NULL) {
332                 ICMP6_INC_STATS_BH(__in6_dev_get(skb->dev), ICMP6_MIB_INERRORS);
333                 return;
334         }
335
336         if (sk->sk_state == TCP_TIME_WAIT) {
337                 inet_twsk_put(inet_twsk(sk));
338                 return;
339         }
340
341         bh_lock_sock(sk);
342         if (sock_owned_by_user(sk))
343                 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
344
345         if (sk->sk_state == TCP_CLOSE)
346                 goto out;
347
348         tp = tcp_sk(sk);
349         seq = ntohl(th->seq);
350         if (sk->sk_state != TCP_LISTEN &&
351             !between(seq, tp->snd_una, tp->snd_nxt)) {
352                 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
353                 goto out;
354         }
355
356         np = inet6_sk(sk);
357
358         if (type == ICMPV6_PKT_TOOBIG) {
359                 struct dst_entry *dst = NULL;
360
361                 if (sock_owned_by_user(sk))
362                         goto out;
363                 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
364                         goto out;
365
366                 /* icmp should have updated the destination cache entry */
367                 dst = __sk_dst_check(sk, np->dst_cookie);
368
369                 if (dst == NULL) {
370                         struct inet_sock *inet = inet_sk(sk);
371                         struct flowi fl;
372
373                         /* BUGGG_FUTURE: Again, it is not clear how
374                            to handle rthdr case. Ignore this complexity
375                            for now.
376                          */
377                         memset(&fl, 0, sizeof(fl));
378                         fl.proto = IPPROTO_TCP;
379                         ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
380                         ipv6_addr_copy(&fl.fl6_src, &np->saddr);
381                         fl.oif = sk->sk_bound_dev_if;
382                         fl.fl_ip_dport = inet->dport;
383                         fl.fl_ip_sport = inet->sport;
384                         security_skb_classify_flow(skb, &fl);
385
386                         if ((err = ip6_dst_lookup(sk, &dst, &fl))) {
387                                 sk->sk_err_soft = -err;
388                                 goto out;
389                         }
390
391                         if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0) {
392                                 sk->sk_err_soft = -err;
393                                 goto out;
394                         }
395
396                 } else
397                         dst_hold(dst);
398
399                 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
400                         tcp_sync_mss(sk, dst_mtu(dst));
401                         tcp_simple_retransmit(sk);
402                 } /* else let the usual retransmit timer handle it */
403                 dst_release(dst);
404                 goto out;
405         }
406
407         icmpv6_err_convert(type, code, &err);
408
409         /* Might be for an request_sock */
410         switch (sk->sk_state) {
411                 struct request_sock *req, **prev;
412         case TCP_LISTEN:
413                 if (sock_owned_by_user(sk))
414                         goto out;
415
416                 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
417                                            &hdr->saddr, inet6_iif(skb));
418                 if (!req)
419                         goto out;
420
421                 /* ICMPs are not backlogged, hence we cannot get
422                  * an established socket here.
423                  */
424                 BUG_TRAP(req->sk == NULL);
425
426                 if (seq != tcp_rsk(req)->snt_isn) {
427                         NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
428                         goto out;
429                 }
430
431                 inet_csk_reqsk_queue_drop(sk, req, prev);
432                 goto out;
433
434         case TCP_SYN_SENT:
435         case TCP_SYN_RECV:  /* Cannot happen.
436                                It can, it SYNs are crossed. --ANK */
437                 if (!sock_owned_by_user(sk)) {
438                         sk->sk_err = err;
439                         sk->sk_error_report(sk);                /* Wake people up to see the error (see connect in sock.c) */
440
441                         tcp_done(sk);
442                 } else
443                         sk->sk_err_soft = err;
444                 goto out;
445         }
446
447         if (!sock_owned_by_user(sk) && np->recverr) {
448                 sk->sk_err = err;
449                 sk->sk_error_report(sk);
450         } else
451                 sk->sk_err_soft = err;
452
453 out:
454         bh_unlock_sock(sk);
455         sock_put(sk);
456 }
457
458
459 static int tcp_v6_send_synack(struct sock *sk, struct request_sock *req)
460 {
461         struct inet6_request_sock *treq = inet6_rsk(req);
462         struct ipv6_pinfo *np = inet6_sk(sk);
463         struct sk_buff * skb;
464         struct ipv6_txoptions *opt = NULL;
465         struct in6_addr * final_p = NULL, final;
466         struct flowi fl;
467         struct dst_entry *dst;
468         int err = -1;
469
470         memset(&fl, 0, sizeof(fl));
471         fl.proto = IPPROTO_TCP;
472         ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
473         ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
474         fl.fl6_flowlabel = 0;
475         fl.oif = treq->iif;
476         fl.fl_ip_dport = inet_rsk(req)->rmt_port;
477         fl.fl_ip_sport = inet_sk(sk)->sport;
478         security_req_classify_flow(req, &fl);
479
480         opt = np->opt;
481         if (opt && opt->srcrt) {
482                 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
483                 ipv6_addr_copy(&final, &fl.fl6_dst);
484                 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
485                 final_p = &final;
486         }
487
488         err = ip6_dst_lookup(sk, &dst, &fl);
489         if (err)
490                 goto done;
491         if (final_p)
492                 ipv6_addr_copy(&fl.fl6_dst, final_p);
493         if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
494                 goto done;
495
496         skb = tcp_make_synack(sk, dst, req);
497         if (skb) {
498                 struct tcphdr *th = tcp_hdr(skb);
499
500                 th->check = tcp_v6_check(th, skb->len,
501                                          &treq->loc_addr, &treq->rmt_addr,
502                                          csum_partial((char *)th, skb->len, skb->csum));
503
504                 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
505                 err = ip6_xmit(sk, skb, &fl, opt, 0);
506                 err = net_xmit_eval(err);
507         }
508
509 done:
510         if (opt && opt != np->opt)
511                 sock_kfree_s(sk, opt, opt->tot_len);
512         dst_release(dst);
513         return err;
514 }
515
516 static inline void syn_flood_warning(struct sk_buff *skb)
517 {
518 #ifdef CONFIG_SYN_COOKIES
519         if (sysctl_tcp_syncookies)
520                 printk(KERN_INFO
521                        "TCPv6: Possible SYN flooding on port %d. "
522                        "Sending cookies.\n", ntohs(tcp_hdr(skb)->dest));
523         else
524 #endif
525                 printk(KERN_INFO
526                        "TCPv6: Possible SYN flooding on port %d. "
527                        "Dropping request.\n", ntohs(tcp_hdr(skb)->dest));
528 }
529
530 static void tcp_v6_reqsk_destructor(struct request_sock *req)
531 {
532         if (inet6_rsk(req)->pktopts)
533                 kfree_skb(inet6_rsk(req)->pktopts);
534 }
535
536 #ifdef CONFIG_TCP_MD5SIG
537 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
538                                                    struct in6_addr *addr)
539 {
540         struct tcp_sock *tp = tcp_sk(sk);
541         int i;
542
543         BUG_ON(tp == NULL);
544
545         if (!tp->md5sig_info || !tp->md5sig_info->entries6)
546                 return NULL;
547
548         for (i = 0; i < tp->md5sig_info->entries6; i++) {
549                 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, addr))
550                         return &tp->md5sig_info->keys6[i].base;
551         }
552         return NULL;
553 }
554
555 static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
556                                                 struct sock *addr_sk)
557 {
558         return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
559 }
560
561 static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
562                                                       struct request_sock *req)
563 {
564         return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
565 }
566
567 static int tcp_v6_md5_do_add(struct sock *sk, struct in6_addr *peer,
568                              char *newkey, u8 newkeylen)
569 {
570         /* Add key to the list */
571         struct tcp_md5sig_key *key;
572         struct tcp_sock *tp = tcp_sk(sk);
573         struct tcp6_md5sig_key *keys;
574
575         key = tcp_v6_md5_do_lookup(sk, peer);
576         if (key) {
577                 /* modify existing entry - just update that one */
578                 kfree(key->key);
579                 key->key = newkey;
580                 key->keylen = newkeylen;
581         } else {
582                 /* reallocate new list if current one is full. */
583                 if (!tp->md5sig_info) {
584                         tp->md5sig_info = kzalloc(sizeof(*tp->md5sig_info), GFP_ATOMIC);
585                         if (!tp->md5sig_info) {
586                                 kfree(newkey);
587                                 return -ENOMEM;
588                         }
589                         sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
590                 }
591                 if (tcp_alloc_md5sig_pool() == NULL) {
592                         kfree(newkey);
593                         return -ENOMEM;
594                 }
595                 if (tp->md5sig_info->alloced6 == tp->md5sig_info->entries6) {
596                         keys = kmalloc((sizeof (tp->md5sig_info->keys6[0]) *
597                                        (tp->md5sig_info->entries6 + 1)), GFP_ATOMIC);
598
599                         if (!keys) {
600                                 tcp_free_md5sig_pool();
601                                 kfree(newkey);
602                                 return -ENOMEM;
603                         }
604
605                         if (tp->md5sig_info->entries6)
606                                 memmove(keys, tp->md5sig_info->keys6,
607                                         (sizeof (tp->md5sig_info->keys6[0]) *
608                                          tp->md5sig_info->entries6));
609
610                         kfree(tp->md5sig_info->keys6);
611                         tp->md5sig_info->keys6 = keys;
612                         tp->md5sig_info->alloced6++;
613                 }
614
615                 ipv6_addr_copy(&tp->md5sig_info->keys6[tp->md5sig_info->entries6].addr,
616                                peer);
617                 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.key = newkey;
618                 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.keylen = newkeylen;
619
620                 tp->md5sig_info->entries6++;
621         }
622         return 0;
623 }
624
625 static int tcp_v6_md5_add_func(struct sock *sk, struct sock *addr_sk,
626                                u8 *newkey, __u8 newkeylen)
627 {
628         return tcp_v6_md5_do_add(sk, &inet6_sk(addr_sk)->daddr,
629                                  newkey, newkeylen);
630 }
631
632 static int tcp_v6_md5_do_del(struct sock *sk, struct in6_addr *peer)
633 {
634         struct tcp_sock *tp = tcp_sk(sk);
635         int i;
636
637         for (i = 0; i < tp->md5sig_info->entries6; i++) {
638                 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, peer)) {
639                         /* Free the key */
640                         kfree(tp->md5sig_info->keys6[i].base.key);
641                         tp->md5sig_info->entries6--;
642
643                         if (tp->md5sig_info->entries6 == 0) {
644                                 kfree(tp->md5sig_info->keys6);
645                                 tp->md5sig_info->keys6 = NULL;
646                                 tp->md5sig_info->alloced6 = 0;
647                         } else {
648                                 /* shrink the database */
649                                 if (tp->md5sig_info->entries6 != i)
650                                         memmove(&tp->md5sig_info->keys6[i],
651                                                 &tp->md5sig_info->keys6[i+1],
652                                                 (tp->md5sig_info->entries6 - i)
653                                                 * sizeof (tp->md5sig_info->keys6[0]));
654                         }
655                         tcp_free_md5sig_pool();
656                         return 0;
657                 }
658         }
659         return -ENOENT;
660 }
661
662 static void tcp_v6_clear_md5_list (struct sock *sk)
663 {
664         struct tcp_sock *tp = tcp_sk(sk);
665         int i;
666
667         if (tp->md5sig_info->entries6) {
668                 for (i = 0; i < tp->md5sig_info->entries6; i++)
669                         kfree(tp->md5sig_info->keys6[i].base.key);
670                 tp->md5sig_info->entries6 = 0;
671                 tcp_free_md5sig_pool();
672         }
673
674         kfree(tp->md5sig_info->keys6);
675         tp->md5sig_info->keys6 = NULL;
676         tp->md5sig_info->alloced6 = 0;
677
678         if (tp->md5sig_info->entries4) {
679                 for (i = 0; i < tp->md5sig_info->entries4; i++)
680                         kfree(tp->md5sig_info->keys4[i].base.key);
681                 tp->md5sig_info->entries4 = 0;
682                 tcp_free_md5sig_pool();
683         }
684
685         kfree(tp->md5sig_info->keys4);
686         tp->md5sig_info->keys4 = NULL;
687         tp->md5sig_info->alloced4 = 0;
688 }
689
690 static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
691                                   int optlen)
692 {
693         struct tcp_md5sig cmd;
694         struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
695         u8 *newkey;
696
697         if (optlen < sizeof(cmd))
698                 return -EINVAL;
699
700         if (copy_from_user(&cmd, optval, sizeof(cmd)))
701                 return -EFAULT;
702
703         if (sin6->sin6_family != AF_INET6)
704                 return -EINVAL;
705
706         if (!cmd.tcpm_keylen) {
707                 if (!tcp_sk(sk)->md5sig_info)
708                         return -ENOENT;
709                 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
710                         return tcp_v4_md5_do_del(sk, sin6->sin6_addr.s6_addr32[3]);
711                 return tcp_v6_md5_do_del(sk, &sin6->sin6_addr);
712         }
713
714         if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
715                 return -EINVAL;
716
717         if (!tcp_sk(sk)->md5sig_info) {
718                 struct tcp_sock *tp = tcp_sk(sk);
719                 struct tcp_md5sig_info *p;
720
721                 p = kzalloc(sizeof(struct tcp_md5sig_info), GFP_KERNEL);
722                 if (!p)
723                         return -ENOMEM;
724
725                 tp->md5sig_info = p;
726                 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
727         }
728
729         newkey = kmemdup(cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
730         if (!newkey)
731                 return -ENOMEM;
732         if (ipv6_addr_v4mapped(&sin6->sin6_addr)) {
733                 return tcp_v4_md5_do_add(sk, sin6->sin6_addr.s6_addr32[3],
734                                          newkey, cmd.tcpm_keylen);
735         }
736         return tcp_v6_md5_do_add(sk, &sin6->sin6_addr, newkey, cmd.tcpm_keylen);
737 }
738
739 static int tcp_v6_do_calc_md5_hash(char *md5_hash, struct tcp_md5sig_key *key,
740                                    struct in6_addr *saddr,
741                                    struct in6_addr *daddr,
742                                    struct tcphdr *th, unsigned int tcplen)
743 {
744         struct tcp_md5sig_pool *hp;
745         struct tcp6_pseudohdr *bp;
746         int err;
747
748         hp = tcp_get_md5sig_pool();
749         if (!hp) {
750                 printk(KERN_WARNING "%s(): hash pool not found...\n", __func__);
751                 goto clear_hash_noput;
752         }
753
754         bp = &hp->md5_blk.ip6;
755
756         /* 1. TCP pseudo-header (RFC2460) */
757         ipv6_addr_copy(&bp->saddr, saddr);
758         ipv6_addr_copy(&bp->daddr, daddr);
759         bp->len = htonl(tcplen);
760         bp->protocol = htonl(IPPROTO_TCP);
761
762         err = tcp_calc_md5_hash(md5_hash, key, sizeof(*bp),
763                                 th, tcplen, hp);
764
765         if (err)
766                 goto clear_hash;
767
768         /* Free up the crypto pool */
769         tcp_put_md5sig_pool();
770 out:
771         return 0;
772 clear_hash:
773         tcp_put_md5sig_pool();
774 clear_hash_noput:
775         memset(md5_hash, 0, 16);
776         goto out;
777 }
778
779 static int tcp_v6_calc_md5_hash(char *md5_hash, struct tcp_md5sig_key *key,
780                                 struct sock *sk,
781                                 struct dst_entry *dst,
782                                 struct request_sock *req,
783                                 struct tcphdr *th, unsigned int tcplen)
784 {
785         struct in6_addr *saddr, *daddr;
786
787         if (sk) {
788                 saddr = &inet6_sk(sk)->saddr;
789                 daddr = &inet6_sk(sk)->daddr;
790         } else {
791                 saddr = &inet6_rsk(req)->loc_addr;
792                 daddr = &inet6_rsk(req)->rmt_addr;
793         }
794         return tcp_v6_do_calc_md5_hash(md5_hash, key,
795                                        saddr, daddr,
796                                        th, tcplen);
797 }
798
799 static int tcp_v6_inbound_md5_hash (struct sock *sk, struct sk_buff *skb)
800 {
801         __u8 *hash_location = NULL;
802         struct tcp_md5sig_key *hash_expected;
803         struct ipv6hdr *ip6h = ipv6_hdr(skb);
804         struct tcphdr *th = tcp_hdr(skb);
805         int genhash;
806         u8 newhash[16];
807
808         hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
809         hash_location = tcp_parse_md5sig_option(th);
810
811         /* do we have a hash as expected? */
812         if (!hash_expected) {
813                 if (!hash_location)
814                         return 0;
815                 if (net_ratelimit()) {
816                         printk(KERN_INFO "MD5 Hash NOT expected but found "
817                                "(" NIP6_FMT ", %u)->"
818                                "(" NIP6_FMT ", %u)\n",
819                                NIP6(ip6h->saddr), ntohs(th->source),
820                                NIP6(ip6h->daddr), ntohs(th->dest));
821                 }
822                 return 1;
823         }
824
825         if (!hash_location) {
826                 if (net_ratelimit()) {
827                         printk(KERN_INFO "MD5 Hash expected but NOT found "
828                                "(" NIP6_FMT ", %u)->"
829                                "(" NIP6_FMT ", %u)\n",
830                                NIP6(ip6h->saddr), ntohs(th->source),
831                                NIP6(ip6h->daddr), ntohs(th->dest));
832                 }
833                 return 1;
834         }
835
836         /* check the signature */
837         genhash = tcp_v6_do_calc_md5_hash(newhash,
838                                           hash_expected,
839                                           &ip6h->saddr, &ip6h->daddr,
840                                           th, skb->len);
841         if (genhash || memcmp(hash_location, newhash, 16) != 0) {
842                 if (net_ratelimit()) {
843                         printk(KERN_INFO "MD5 Hash %s for "
844                                "(" NIP6_FMT ", %u)->"
845                                "(" NIP6_FMT ", %u)\n",
846                                genhash ? "failed" : "mismatch",
847                                NIP6(ip6h->saddr), ntohs(th->source),
848                                NIP6(ip6h->daddr), ntohs(th->dest));
849                 }
850                 return 1;
851         }
852         return 0;
853 }
854 #endif
855
856 struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
857         .family         =       AF_INET6,
858         .obj_size       =       sizeof(struct tcp6_request_sock),
859         .rtx_syn_ack    =       tcp_v6_send_synack,
860         .send_ack       =       tcp_v6_reqsk_send_ack,
861         .destructor     =       tcp_v6_reqsk_destructor,
862         .send_reset     =       tcp_v6_send_reset
863 };
864
865 #ifdef CONFIG_TCP_MD5SIG
866 static struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
867         .md5_lookup     =       tcp_v6_reqsk_md5_lookup,
868 };
869 #endif
870
871 static struct timewait_sock_ops tcp6_timewait_sock_ops = {
872         .twsk_obj_size  = sizeof(struct tcp6_timewait_sock),
873         .twsk_unique    = tcp_twsk_unique,
874         .twsk_destructor= tcp_twsk_destructor,
875 };
876
877 static void tcp_v6_send_check(struct sock *sk, int len, struct sk_buff *skb)
878 {
879         struct ipv6_pinfo *np = inet6_sk(sk);
880         struct tcphdr *th = tcp_hdr(skb);
881
882         if (skb->ip_summed == CHECKSUM_PARTIAL) {
883                 th->check = ~csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP,  0);
884                 skb->csum_start = skb_transport_header(skb) - skb->head;
885                 skb->csum_offset = offsetof(struct tcphdr, check);
886         } else {
887                 th->check = csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP,
888                                             csum_partial((char *)th, th->doff<<2,
889                                                          skb->csum));
890         }
891 }
892
893 static int tcp_v6_gso_send_check(struct sk_buff *skb)
894 {
895         struct ipv6hdr *ipv6h;
896         struct tcphdr *th;
897
898         if (!pskb_may_pull(skb, sizeof(*th)))
899                 return -EINVAL;
900
901         ipv6h = ipv6_hdr(skb);
902         th = tcp_hdr(skb);
903
904         th->check = 0;
905         th->check = ~csum_ipv6_magic(&ipv6h->saddr, &ipv6h->daddr, skb->len,
906                                      IPPROTO_TCP, 0);
907         skb->csum_start = skb_transport_header(skb) - skb->head;
908         skb->csum_offset = offsetof(struct tcphdr, check);
909         skb->ip_summed = CHECKSUM_PARTIAL;
910         return 0;
911 }
912
913 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
914 {
915         struct tcphdr *th = tcp_hdr(skb), *t1;
916         struct sk_buff *buff;
917         struct flowi fl;
918         struct net *net = dev_net(skb->dst->dev);
919         struct sock *ctl_sk = net->ipv6.tcp_sk;
920         unsigned int tot_len = sizeof(*th);
921 #ifdef CONFIG_TCP_MD5SIG
922         struct tcp_md5sig_key *key;
923 #endif
924
925         if (th->rst)
926                 return;
927
928         if (!ipv6_unicast_destination(skb))
929                 return;
930
931 #ifdef CONFIG_TCP_MD5SIG
932         if (sk)
933                 key = tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr);
934         else
935                 key = NULL;
936
937         if (key)
938                 tot_len += TCPOLEN_MD5SIG_ALIGNED;
939 #endif
940
941         /*
942          * We need to grab some memory, and put together an RST,
943          * and then put it into the queue to be sent.
944          */
945
946         buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
947                          GFP_ATOMIC);
948         if (buff == NULL)
949                 return;
950
951         skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
952
953         t1 = (struct tcphdr *) skb_push(buff, tot_len);
954
955         /* Swap the send and the receive. */
956         memset(t1, 0, sizeof(*t1));
957         t1->dest = th->source;
958         t1->source = th->dest;
959         t1->doff = tot_len / 4;
960         t1->rst = 1;
961
962         if(th->ack) {
963                 t1->seq = th->ack_seq;
964         } else {
965                 t1->ack = 1;
966                 t1->ack_seq = htonl(ntohl(th->seq) + th->syn + th->fin
967                                     + skb->len - (th->doff<<2));
968         }
969
970 #ifdef CONFIG_TCP_MD5SIG
971         if (key) {
972                 __be32 *opt = (__be32*)(t1 + 1);
973                 opt[0] = htonl((TCPOPT_NOP << 24) |
974                                (TCPOPT_NOP << 16) |
975                                (TCPOPT_MD5SIG << 8) |
976                                TCPOLEN_MD5SIG);
977                 tcp_v6_do_calc_md5_hash((__u8 *)&opt[1], key,
978                                         &ipv6_hdr(skb)->daddr,
979                                         &ipv6_hdr(skb)->saddr,
980                                         t1, tot_len);
981         }
982 #endif
983
984         buff->csum = csum_partial((char *)t1, sizeof(*t1), 0);
985
986         memset(&fl, 0, sizeof(fl));
987         ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
988         ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
989
990         t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
991                                     sizeof(*t1), IPPROTO_TCP,
992                                     buff->csum);
993
994         fl.proto = IPPROTO_TCP;
995         fl.oif = inet6_iif(skb);
996         fl.fl_ip_dport = t1->dest;
997         fl.fl_ip_sport = t1->source;
998         security_skb_classify_flow(skb, &fl);
999
1000         /* Pass a socket to ip6_dst_lookup either it is for RST
1001          * Underlying function will use this to retrieve the network
1002          * namespace
1003          */
1004         if (!ip6_dst_lookup(ctl_sk, &buff->dst, &fl)) {
1005
1006                 if (xfrm_lookup(&buff->dst, &fl, NULL, 0) >= 0) {
1007                         ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
1008                         TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
1009                         TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
1010                         return;
1011                 }
1012         }
1013
1014         kfree_skb(buff);
1015 }
1016
1017 static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
1018                             struct tcp_md5sig_key *key)
1019 {
1020         struct tcphdr *th = tcp_hdr(skb), *t1;
1021         struct sk_buff *buff;
1022         struct flowi fl;
1023         struct net *net = dev_net(skb->dev);
1024         struct sock *ctl_sk = net->ipv6.tcp_sk;
1025         unsigned int tot_len = sizeof(struct tcphdr);
1026         __be32 *topt;
1027
1028         if (ts)
1029                 tot_len += TCPOLEN_TSTAMP_ALIGNED;
1030 #ifdef CONFIG_TCP_MD5SIG
1031         if (key)
1032                 tot_len += TCPOLEN_MD5SIG_ALIGNED;
1033 #endif
1034
1035         buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1036                          GFP_ATOMIC);
1037         if (buff == NULL)
1038                 return;
1039
1040         skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1041
1042         t1 = (struct tcphdr *) skb_push(buff,tot_len);
1043
1044         /* Swap the send and the receive. */
1045         memset(t1, 0, sizeof(*t1));
1046         t1->dest = th->source;
1047         t1->source = th->dest;
1048         t1->doff = tot_len/4;
1049         t1->seq = htonl(seq);
1050         t1->ack_seq = htonl(ack);
1051         t1->ack = 1;
1052         t1->window = htons(win);
1053
1054         topt = (__be32 *)(t1 + 1);
1055
1056         if (ts) {
1057                 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1058                                 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
1059                 *topt++ = htonl(tcp_time_stamp);
1060                 *topt = htonl(ts);
1061         }
1062
1063 #ifdef CONFIG_TCP_MD5SIG
1064         if (key) {
1065                 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1066                                 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
1067                 tcp_v6_do_calc_md5_hash((__u8 *)topt, key,
1068                                         &ipv6_hdr(skb)->daddr,
1069                                         &ipv6_hdr(skb)->saddr,
1070                                         t1, tot_len);
1071         }
1072 #endif
1073
1074         buff->csum = csum_partial((char *)t1, tot_len, 0);
1075
1076         memset(&fl, 0, sizeof(fl));
1077         ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
1078         ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
1079
1080         t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
1081                                     tot_len, IPPROTO_TCP,
1082                                     buff->csum);
1083
1084         fl.proto = IPPROTO_TCP;
1085         fl.oif = inet6_iif(skb);
1086         fl.fl_ip_dport = t1->dest;
1087         fl.fl_ip_sport = t1->source;
1088         security_skb_classify_flow(skb, &fl);
1089
1090         if (!ip6_dst_lookup(ctl_sk, &buff->dst, &fl)) {
1091                 if (xfrm_lookup(&buff->dst, &fl, NULL, 0) >= 0) {
1092                         ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
1093                         TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
1094                         return;
1095                 }
1096         }
1097
1098         kfree_skb(buff);
1099 }
1100
1101 static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
1102 {
1103         struct inet_timewait_sock *tw = inet_twsk(sk);
1104         struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1105
1106         tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
1107                         tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
1108                         tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw));
1109
1110         inet_twsk_put(tw);
1111 }
1112
1113 static void tcp_v6_reqsk_send_ack(struct sk_buff *skb, struct request_sock *req)
1114 {
1115         tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
1116                         tcp_v6_md5_do_lookup(skb->sk, &ipv6_hdr(skb)->daddr));
1117 }
1118
1119
1120 static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
1121 {
1122         struct request_sock *req, **prev;
1123         const struct tcphdr *th = tcp_hdr(skb);
1124         struct sock *nsk;
1125
1126         /* Find possible connection requests. */
1127         req = inet6_csk_search_req(sk, &prev, th->source,
1128                                    &ipv6_hdr(skb)->saddr,
1129                                    &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1130         if (req)
1131                 return tcp_check_req(sk, skb, req, prev);
1132
1133         nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
1134                         &ipv6_hdr(skb)->saddr, th->source,
1135                         &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1136
1137         if (nsk) {
1138                 if (nsk->sk_state != TCP_TIME_WAIT) {
1139                         bh_lock_sock(nsk);
1140                         return nsk;
1141                 }
1142                 inet_twsk_put(inet_twsk(nsk));
1143                 return NULL;
1144         }
1145
1146 #ifdef CONFIG_SYN_COOKIES
1147         if (!th->rst && !th->syn && th->ack)
1148                 sk = cookie_v6_check(sk, skb);
1149 #endif
1150         return sk;
1151 }
1152
1153 /* FIXME: this is substantially similar to the ipv4 code.
1154  * Can some kind of merge be done? -- erics
1155  */
1156 static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1157 {
1158         struct inet6_request_sock *treq;
1159         struct ipv6_pinfo *np = inet6_sk(sk);
1160         struct tcp_options_received tmp_opt;
1161         struct tcp_sock *tp = tcp_sk(sk);
1162         struct request_sock *req = NULL;
1163         __u32 isn = TCP_SKB_CB(skb)->when;
1164 #ifdef CONFIG_SYN_COOKIES
1165         int want_cookie = 0;
1166 #else
1167 #define want_cookie 0
1168 #endif
1169
1170         if (skb->protocol == htons(ETH_P_IP))
1171                 return tcp_v4_conn_request(sk, skb);
1172
1173         if (!ipv6_unicast_destination(skb))
1174                 goto drop;
1175
1176         if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
1177                 if (net_ratelimit())
1178                         syn_flood_warning(skb);
1179 #ifdef CONFIG_SYN_COOKIES
1180                 if (sysctl_tcp_syncookies)
1181                         want_cookie = 1;
1182                 else
1183 #endif
1184                 goto drop;
1185         }
1186
1187         if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
1188                 goto drop;
1189
1190         req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1191         if (req == NULL)
1192                 goto drop;
1193
1194 #ifdef CONFIG_TCP_MD5SIG
1195         tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1196 #endif
1197
1198         tcp_clear_options(&tmp_opt);
1199         tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1200         tmp_opt.user_mss = tp->rx_opt.user_mss;
1201
1202         tcp_parse_options(skb, &tmp_opt, 0);
1203
1204         if (want_cookie && !tmp_opt.saw_tstamp)
1205                 tcp_clear_options(&tmp_opt);
1206
1207         tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1208         tcp_openreq_init(req, &tmp_opt, skb);
1209
1210         treq = inet6_rsk(req);
1211         ipv6_addr_copy(&treq->rmt_addr, &ipv6_hdr(skb)->saddr);
1212         ipv6_addr_copy(&treq->loc_addr, &ipv6_hdr(skb)->daddr);
1213         if (!want_cookie)
1214                 TCP_ECN_create_request(req, tcp_hdr(skb));
1215
1216         if (want_cookie) {
1217                 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1218                 req->cookie_ts = tmp_opt.tstamp_ok;
1219         } else if (!isn) {
1220                 if (ipv6_opt_accepted(sk, skb) ||
1221                     np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1222                     np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1223                         atomic_inc(&skb->users);
1224                         treq->pktopts = skb;
1225                 }
1226                 treq->iif = sk->sk_bound_dev_if;
1227
1228                 /* So that link locals have meaning */
1229                 if (!sk->sk_bound_dev_if &&
1230                     ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1231                         treq->iif = inet6_iif(skb);
1232
1233                 isn = tcp_v6_init_sequence(skb);
1234         }
1235
1236         tcp_rsk(req)->snt_isn = isn;
1237
1238         security_inet_conn_request(sk, skb, req);
1239
1240         if (tcp_v6_send_synack(sk, req))
1241                 goto drop;
1242
1243         if (!want_cookie) {
1244                 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1245                 return 0;
1246         }
1247
1248 drop:
1249         if (req)
1250                 reqsk_free(req);
1251
1252         return 0; /* don't send reset */
1253 }
1254
1255 static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1256                                           struct request_sock *req,
1257                                           struct dst_entry *dst)
1258 {
1259         struct inet6_request_sock *treq = inet6_rsk(req);
1260         struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1261         struct tcp6_sock *newtcp6sk;
1262         struct inet_sock *newinet;
1263         struct tcp_sock *newtp;
1264         struct sock *newsk;
1265         struct ipv6_txoptions *opt;
1266 #ifdef CONFIG_TCP_MD5SIG
1267         struct tcp_md5sig_key *key;
1268 #endif
1269
1270         if (skb->protocol == htons(ETH_P_IP)) {
1271                 /*
1272                  *      v6 mapped
1273                  */
1274
1275                 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1276
1277                 if (newsk == NULL)
1278                         return NULL;
1279
1280                 newtcp6sk = (struct tcp6_sock *)newsk;
1281                 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1282
1283                 newinet = inet_sk(newsk);
1284                 newnp = inet6_sk(newsk);
1285                 newtp = tcp_sk(newsk);
1286
1287                 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1288
1289                 ipv6_addr_set(&newnp->daddr, 0, 0, htonl(0x0000FFFF),
1290                               newinet->daddr);
1291
1292                 ipv6_addr_set(&newnp->saddr, 0, 0, htonl(0x0000FFFF),
1293                               newinet->saddr);
1294
1295                 ipv6_addr_copy(&newnp->rcv_saddr, &newnp->saddr);
1296
1297                 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1298                 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
1299 #ifdef CONFIG_TCP_MD5SIG
1300                 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1301 #endif
1302
1303                 newnp->pktoptions  = NULL;
1304                 newnp->opt         = NULL;
1305                 newnp->mcast_oif   = inet6_iif(skb);
1306                 newnp->mcast_hops  = ipv6_hdr(skb)->hop_limit;
1307
1308                 /*
1309                  * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1310                  * here, tcp_create_openreq_child now does this for us, see the comment in
1311                  * that function for the gory details. -acme
1312                  */
1313
1314                 /* It is tricky place. Until this moment IPv4 tcp
1315                    worked with IPv6 icsk.icsk_af_ops.
1316                    Sync it now.
1317                  */
1318                 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1319
1320                 return newsk;
1321         }
1322
1323         opt = np->opt;
1324
1325         if (sk_acceptq_is_full(sk))
1326                 goto out_overflow;
1327
1328         if (dst == NULL) {
1329                 struct in6_addr *final_p = NULL, final;
1330                 struct flowi fl;
1331
1332                 memset(&fl, 0, sizeof(fl));
1333                 fl.proto = IPPROTO_TCP;
1334                 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
1335                 if (opt && opt->srcrt) {
1336                         struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
1337                         ipv6_addr_copy(&final, &fl.fl6_dst);
1338                         ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
1339                         final_p = &final;
1340                 }
1341                 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
1342                 fl.oif = sk->sk_bound_dev_if;
1343                 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
1344                 fl.fl_ip_sport = inet_sk(sk)->sport;
1345                 security_req_classify_flow(req, &fl);
1346
1347                 if (ip6_dst_lookup(sk, &dst, &fl))
1348                         goto out;
1349
1350                 if (final_p)
1351                         ipv6_addr_copy(&fl.fl6_dst, final_p);
1352
1353                 if ((xfrm_lookup(&dst, &fl, sk, 0)) < 0)
1354                         goto out;
1355         }
1356
1357         newsk = tcp_create_openreq_child(sk, req, skb);
1358         if (newsk == NULL)
1359                 goto out;
1360
1361         /*
1362          * No need to charge this sock to the relevant IPv6 refcnt debug socks
1363          * count here, tcp_create_openreq_child now does this for us, see the
1364          * comment in that function for the gory details. -acme
1365          */
1366
1367         newsk->sk_gso_type = SKB_GSO_TCPV6;
1368         __ip6_dst_store(newsk, dst, NULL, NULL);
1369
1370         newtcp6sk = (struct tcp6_sock *)newsk;
1371         inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1372
1373         newtp = tcp_sk(newsk);
1374         newinet = inet_sk(newsk);
1375         newnp = inet6_sk(newsk);
1376
1377         memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1378
1379         ipv6_addr_copy(&newnp->daddr, &treq->rmt_addr);
1380         ipv6_addr_copy(&newnp->saddr, &treq->loc_addr);
1381         ipv6_addr_copy(&newnp->rcv_saddr, &treq->loc_addr);
1382         newsk->sk_bound_dev_if = treq->iif;
1383
1384         /* Now IPv6 options...
1385
1386            First: no IPv4 options.
1387          */
1388         newinet->opt = NULL;
1389         newnp->ipv6_fl_list = NULL;
1390
1391         /* Clone RX bits */
1392         newnp->rxopt.all = np->rxopt.all;
1393
1394         /* Clone pktoptions received with SYN */
1395         newnp->pktoptions = NULL;
1396         if (treq->pktopts != NULL) {
1397                 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
1398                 kfree_skb(treq->pktopts);
1399                 treq->pktopts = NULL;
1400                 if (newnp->pktoptions)
1401                         skb_set_owner_r(newnp->pktoptions, newsk);
1402         }
1403         newnp->opt        = NULL;
1404         newnp->mcast_oif  = inet6_iif(skb);
1405         newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1406
1407         /* Clone native IPv6 options from listening socket (if any)
1408
1409            Yes, keeping reference count would be much more clever,
1410            but we make one more one thing there: reattach optmem
1411            to newsk.
1412          */
1413         if (opt) {
1414                 newnp->opt = ipv6_dup_options(newsk, opt);
1415                 if (opt != np->opt)
1416                         sock_kfree_s(sk, opt, opt->tot_len);
1417         }
1418
1419         inet_csk(newsk)->icsk_ext_hdr_len = 0;
1420         if (newnp->opt)
1421                 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1422                                                      newnp->opt->opt_flen);
1423
1424         tcp_mtup_init(newsk);
1425         tcp_sync_mss(newsk, dst_mtu(dst));
1426         newtp->advmss = dst_metric(dst, RTAX_ADVMSS);
1427         tcp_initialize_rcv_mss(newsk);
1428
1429         newinet->daddr = newinet->saddr = newinet->rcv_saddr = LOOPBACK4_IPV6;
1430
1431 #ifdef CONFIG_TCP_MD5SIG
1432         /* Copy over the MD5 key from the original socket */
1433         if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1434                 /* We're using one, so create a matching key
1435                  * on the newsk structure. If we fail to get
1436                  * memory, then we end up not copying the key
1437                  * across. Shucks.
1438                  */
1439                 char *newkey = kmemdup(key->key, key->keylen, GFP_ATOMIC);
1440                 if (newkey != NULL)
1441                         tcp_v6_md5_do_add(newsk, &inet6_sk(sk)->daddr,
1442                                           newkey, key->keylen);
1443         }
1444 #endif
1445
1446         __inet6_hash(newsk);
1447         __inet_inherit_port(sk, newsk);
1448
1449         return newsk;
1450
1451 out_overflow:
1452         NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1453 out:
1454         NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1455         if (opt && opt != np->opt)
1456                 sock_kfree_s(sk, opt, opt->tot_len);
1457         dst_release(dst);
1458         return NULL;
1459 }
1460
1461 static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1462 {
1463         if (skb->ip_summed == CHECKSUM_COMPLETE) {
1464                 if (!tcp_v6_check(tcp_hdr(skb), skb->len, &ipv6_hdr(skb)->saddr,
1465                                   &ipv6_hdr(skb)->daddr, skb->csum)) {
1466                         skb->ip_summed = CHECKSUM_UNNECESSARY;
1467                         return 0;
1468                 }
1469         }
1470
1471         skb->csum = ~csum_unfold(tcp_v6_check(tcp_hdr(skb), skb->len,
1472                                               &ipv6_hdr(skb)->saddr,
1473                                               &ipv6_hdr(skb)->daddr, 0));
1474
1475         if (skb->len <= 76) {
1476                 return __skb_checksum_complete(skb);
1477         }
1478         return 0;
1479 }
1480
1481 /* The socket must have it's spinlock held when we get
1482  * here.
1483  *
1484  * We have a potential double-lock case here, so even when
1485  * doing backlog processing we use the BH locking scheme.
1486  * This is because we cannot sleep with the original spinlock
1487  * held.
1488  */
1489 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1490 {
1491         struct ipv6_pinfo *np = inet6_sk(sk);
1492         struct tcp_sock *tp;
1493         struct sk_buff *opt_skb = NULL;
1494
1495         /* Imagine: socket is IPv6. IPv4 packet arrives,
1496            goes to IPv4 receive handler and backlogged.
1497            From backlog it always goes here. Kerboom...
1498            Fortunately, tcp_rcv_established and rcv_established
1499            handle them correctly, but it is not case with
1500            tcp_v6_hnd_req and tcp_v6_send_reset().   --ANK
1501          */
1502
1503         if (skb->protocol == htons(ETH_P_IP))
1504                 return tcp_v4_do_rcv(sk, skb);
1505
1506 #ifdef CONFIG_TCP_MD5SIG
1507         if (tcp_v6_inbound_md5_hash (sk, skb))
1508                 goto discard;
1509 #endif
1510
1511         if (sk_filter(sk, skb))
1512                 goto discard;
1513
1514         /*
1515          *      socket locking is here for SMP purposes as backlog rcv
1516          *      is currently called with bh processing disabled.
1517          */
1518
1519         /* Do Stevens' IPV6_PKTOPTIONS.
1520
1521            Yes, guys, it is the only place in our code, where we
1522            may make it not affecting IPv4.
1523            The rest of code is protocol independent,
1524            and I do not like idea to uglify IPv4.
1525
1526            Actually, all the idea behind IPV6_PKTOPTIONS
1527            looks not very well thought. For now we latch
1528            options, received in the last packet, enqueued
1529            by tcp. Feel free to propose better solution.
1530                                                --ANK (980728)
1531          */
1532         if (np->rxopt.all)
1533                 opt_skb = skb_clone(skb, GFP_ATOMIC);
1534
1535         if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1536                 TCP_CHECK_TIMER(sk);
1537                 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1538                         goto reset;
1539                 TCP_CHECK_TIMER(sk);
1540                 if (opt_skb)
1541                         goto ipv6_pktoptions;
1542                 return 0;
1543         }
1544
1545         if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1546                 goto csum_err;
1547
1548         if (sk->sk_state == TCP_LISTEN) {
1549                 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1550                 if (!nsk)
1551                         goto discard;
1552
1553                 /*
1554                  * Queue it on the new socket if the new socket is active,
1555                  * otherwise we just shortcircuit this and continue with
1556                  * the new socket..
1557                  */
1558                 if(nsk != sk) {
1559                         if (tcp_child_process(sk, nsk, skb))
1560                                 goto reset;
1561                         if (opt_skb)
1562                                 __kfree_skb(opt_skb);
1563                         return 0;
1564                 }
1565         }
1566
1567         TCP_CHECK_TIMER(sk);
1568         if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1569                 goto reset;
1570         TCP_CHECK_TIMER(sk);
1571         if (opt_skb)
1572                 goto ipv6_pktoptions;
1573         return 0;
1574
1575 reset:
1576         tcp_v6_send_reset(sk, skb);
1577 discard:
1578         if (opt_skb)
1579                 __kfree_skb(opt_skb);
1580         kfree_skb(skb);
1581         return 0;
1582 csum_err:
1583         TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1584         goto discard;
1585
1586
1587 ipv6_pktoptions:
1588         /* Do you ask, what is it?
1589
1590            1. skb was enqueued by tcp.
1591            2. skb is added to tail of read queue, rather than out of order.
1592            3. socket is not in passive state.
1593            4. Finally, it really contains options, which user wants to receive.
1594          */
1595         tp = tcp_sk(sk);
1596         if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1597             !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
1598                 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
1599                         np->mcast_oif = inet6_iif(opt_skb);
1600                 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
1601                         np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
1602                 if (ipv6_opt_accepted(sk, opt_skb)) {
1603                         skb_set_owner_r(opt_skb, sk);
1604                         opt_skb = xchg(&np->pktoptions, opt_skb);
1605                 } else {
1606                         __kfree_skb(opt_skb);
1607                         opt_skb = xchg(&np->pktoptions, NULL);
1608                 }
1609         }
1610
1611         if (opt_skb)
1612                 kfree_skb(opt_skb);
1613         return 0;
1614 }
1615
1616 static int tcp_v6_rcv(struct sk_buff *skb)
1617 {
1618         struct tcphdr *th;
1619         struct sock *sk;
1620         int ret;
1621         struct net *net = dev_net(skb->dev);
1622
1623         if (skb->pkt_type != PACKET_HOST)
1624                 goto discard_it;
1625
1626         /*
1627          *      Count it even if it's bad.
1628          */
1629         TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1630
1631         if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1632                 goto discard_it;
1633
1634         th = tcp_hdr(skb);
1635
1636         if (th->doff < sizeof(struct tcphdr)/4)
1637                 goto bad_packet;
1638         if (!pskb_may_pull(skb, th->doff*4))
1639                 goto discard_it;
1640
1641         if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1642                 goto bad_packet;
1643
1644         th = tcp_hdr(skb);
1645         TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1646         TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1647                                     skb->len - th->doff*4);
1648         TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1649         TCP_SKB_CB(skb)->when = 0;
1650         TCP_SKB_CB(skb)->flags = ipv6_get_dsfield(ipv6_hdr(skb));
1651         TCP_SKB_CB(skb)->sacked = 0;
1652
1653         sk = __inet6_lookup(net, &tcp_hashinfo,
1654                         &ipv6_hdr(skb)->saddr, th->source,
1655                         &ipv6_hdr(skb)->daddr, ntohs(th->dest),
1656                         inet6_iif(skb));
1657
1658         if (!sk)
1659                 goto no_tcp_socket;
1660
1661 process:
1662         if (sk->sk_state == TCP_TIME_WAIT)
1663                 goto do_time_wait;
1664
1665         if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1666                 goto discard_and_relse;
1667
1668         if (sk_filter(sk, skb))
1669                 goto discard_and_relse;
1670
1671         skb->dev = NULL;
1672
1673         bh_lock_sock_nested(sk);
1674         ret = 0;
1675         if (!sock_owned_by_user(sk)) {
1676 #ifdef CONFIG_NET_DMA
1677                 struct tcp_sock *tp = tcp_sk(sk);
1678                 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
1679                         tp->ucopy.dma_chan = get_softnet_dma();
1680                 if (tp->ucopy.dma_chan)
1681                         ret = tcp_v6_do_rcv(sk, skb);
1682                 else
1683 #endif
1684                 {
1685                         if (!tcp_prequeue(sk, skb))
1686                                 ret = tcp_v6_do_rcv(sk, skb);
1687                 }
1688         } else
1689                 sk_add_backlog(sk, skb);
1690         bh_unlock_sock(sk);
1691
1692         sock_put(sk);
1693         return ret ? -1 : 0;
1694
1695 no_tcp_socket:
1696         if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1697                 goto discard_it;
1698
1699         if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1700 bad_packet:
1701                 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1702         } else {
1703                 tcp_v6_send_reset(NULL, skb);
1704         }
1705
1706 discard_it:
1707
1708         /*
1709          *      Discard frame
1710          */
1711
1712         kfree_skb(skb);
1713         return 0;
1714
1715 discard_and_relse:
1716         sock_put(sk);
1717         goto discard_it;
1718
1719 do_time_wait:
1720         if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
1721                 inet_twsk_put(inet_twsk(sk));
1722                 goto discard_it;
1723         }
1724
1725         if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1726                 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1727                 inet_twsk_put(inet_twsk(sk));
1728                 goto discard_it;
1729         }
1730
1731         switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1732         case TCP_TW_SYN:
1733         {
1734                 struct sock *sk2;
1735
1736                 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
1737                                             &ipv6_hdr(skb)->daddr,
1738                                             ntohs(th->dest), inet6_iif(skb));
1739                 if (sk2 != NULL) {
1740                         struct inet_timewait_sock *tw = inet_twsk(sk);
1741                         inet_twsk_deschedule(tw, &tcp_death_row);
1742                         inet_twsk_put(tw);
1743                         sk = sk2;
1744                         goto process;
1745                 }
1746                 /* Fall through to ACK */
1747         }
1748         case TCP_TW_ACK:
1749                 tcp_v6_timewait_ack(sk, skb);
1750                 break;
1751         case TCP_TW_RST:
1752                 goto no_tcp_socket;
1753         case TCP_TW_SUCCESS:;
1754         }
1755         goto discard_it;
1756 }
1757
1758 static int tcp_v6_remember_stamp(struct sock *sk)
1759 {
1760         /* Alas, not yet... */
1761         return 0;
1762 }
1763
1764 static struct inet_connection_sock_af_ops ipv6_specific = {
1765         .queue_xmit        = inet6_csk_xmit,
1766         .send_check        = tcp_v6_send_check,
1767         .rebuild_header    = inet6_sk_rebuild_header,
1768         .conn_request      = tcp_v6_conn_request,
1769         .syn_recv_sock     = tcp_v6_syn_recv_sock,
1770         .remember_stamp    = tcp_v6_remember_stamp,
1771         .net_header_len    = sizeof(struct ipv6hdr),
1772         .setsockopt        = ipv6_setsockopt,
1773         .getsockopt        = ipv6_getsockopt,
1774         .addr2sockaddr     = inet6_csk_addr2sockaddr,
1775         .sockaddr_len      = sizeof(struct sockaddr_in6),
1776         .bind_conflict     = inet6_csk_bind_conflict,
1777 #ifdef CONFIG_COMPAT
1778         .compat_setsockopt = compat_ipv6_setsockopt,
1779         .compat_getsockopt = compat_ipv6_getsockopt,
1780 #endif
1781 };
1782
1783 #ifdef CONFIG_TCP_MD5SIG
1784 static struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
1785         .md5_lookup     =       tcp_v6_md5_lookup,
1786         .calc_md5_hash  =       tcp_v6_calc_md5_hash,
1787         .md5_add        =       tcp_v6_md5_add_func,
1788         .md5_parse      =       tcp_v6_parse_md5_keys,
1789 };
1790 #endif
1791
1792 /*
1793  *      TCP over IPv4 via INET6 API
1794  */
1795
1796 static struct inet_connection_sock_af_ops ipv6_mapped = {
1797         .queue_xmit        = ip_queue_xmit,
1798         .send_check        = tcp_v4_send_check,
1799         .rebuild_header    = inet_sk_rebuild_header,
1800         .conn_request      = tcp_v6_conn_request,
1801         .syn_recv_sock     = tcp_v6_syn_recv_sock,
1802         .remember_stamp    = tcp_v4_remember_stamp,
1803         .net_header_len    = sizeof(struct iphdr),
1804         .setsockopt        = ipv6_setsockopt,
1805         .getsockopt        = ipv6_getsockopt,
1806         .addr2sockaddr     = inet6_csk_addr2sockaddr,
1807         .sockaddr_len      = sizeof(struct sockaddr_in6),
1808         .bind_conflict     = inet6_csk_bind_conflict,
1809 #ifdef CONFIG_COMPAT
1810         .compat_setsockopt = compat_ipv6_setsockopt,
1811         .compat_getsockopt = compat_ipv6_getsockopt,
1812 #endif
1813 };
1814
1815 #ifdef CONFIG_TCP_MD5SIG
1816 static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
1817         .md5_lookup     =       tcp_v4_md5_lookup,
1818         .calc_md5_hash  =       tcp_v4_calc_md5_hash,
1819         .md5_add        =       tcp_v6_md5_add_func,
1820         .md5_parse      =       tcp_v6_parse_md5_keys,
1821 };
1822 #endif
1823
1824 /* NOTE: A lot of things set to zero explicitly by call to
1825  *       sk_alloc() so need not be done here.
1826  */
1827 static int tcp_v6_init_sock(struct sock *sk)
1828 {
1829         struct inet_connection_sock *icsk = inet_csk(sk);
1830         struct tcp_sock *tp = tcp_sk(sk);
1831
1832         skb_queue_head_init(&tp->out_of_order_queue);
1833         tcp_init_xmit_timers(sk);
1834         tcp_prequeue_init(tp);
1835
1836         icsk->icsk_rto = TCP_TIMEOUT_INIT;
1837         tp->mdev = TCP_TIMEOUT_INIT;
1838
1839         /* So many TCP implementations out there (incorrectly) count the
1840          * initial SYN frame in their delayed-ACK and congestion control
1841          * algorithms that we must have the following bandaid to talk
1842          * efficiently to them.  -DaveM
1843          */
1844         tp->snd_cwnd = 2;
1845
1846         /* See draft-stevens-tcpca-spec-01 for discussion of the
1847          * initialization of these values.
1848          */
1849         tp->snd_ssthresh = 0x7fffffff;
1850         tp->snd_cwnd_clamp = ~0;
1851         tp->mss_cache = 536;
1852
1853         tp->reordering = sysctl_tcp_reordering;
1854
1855         sk->sk_state = TCP_CLOSE;
1856
1857         icsk->icsk_af_ops = &ipv6_specific;
1858         icsk->icsk_ca_ops = &tcp_init_congestion_ops;
1859         icsk->icsk_sync_mss = tcp_sync_mss;
1860         sk->sk_write_space = sk_stream_write_space;
1861         sock_set_flag(sk, SOCK_USE_WRITE_QUEUE);
1862
1863 #ifdef CONFIG_TCP_MD5SIG
1864         tp->af_specific = &tcp_sock_ipv6_specific;
1865 #endif
1866
1867         sk->sk_sndbuf = sysctl_tcp_wmem[1];
1868         sk->sk_rcvbuf = sysctl_tcp_rmem[1];
1869
1870         atomic_inc(&tcp_sockets_allocated);
1871
1872         return 0;
1873 }
1874
1875 static void tcp_v6_destroy_sock(struct sock *sk)
1876 {
1877 #ifdef CONFIG_TCP_MD5SIG
1878         /* Clean up the MD5 key list */
1879         if (tcp_sk(sk)->md5sig_info)
1880                 tcp_v6_clear_md5_list(sk);
1881 #endif
1882         tcp_v4_destroy_sock(sk);
1883         inet6_destroy_sock(sk);
1884 }
1885
1886 #ifdef CONFIG_PROC_FS
1887 /* Proc filesystem TCPv6 sock list dumping. */
1888 static void get_openreq6(struct seq_file *seq,
1889                          struct sock *sk, struct request_sock *req, int i, int uid)
1890 {
1891         int ttd = req->expires - jiffies;
1892         struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1893         struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1894
1895         if (ttd < 0)
1896                 ttd = 0;
1897
1898         seq_printf(seq,
1899                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1900                    "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1901                    i,
1902                    src->s6_addr32[0], src->s6_addr32[1],
1903                    src->s6_addr32[2], src->s6_addr32[3],
1904                    ntohs(inet_sk(sk)->sport),
1905                    dest->s6_addr32[0], dest->s6_addr32[1],
1906                    dest->s6_addr32[2], dest->s6_addr32[3],
1907                    ntohs(inet_rsk(req)->rmt_port),
1908                    TCP_SYN_RECV,
1909                    0,0, /* could print option size, but that is af dependent. */
1910                    1,   /* timers active (only the expire timer) */
1911                    jiffies_to_clock_t(ttd),
1912                    req->retrans,
1913                    uid,
1914                    0,  /* non standard timer */
1915                    0, /* open_requests have no inode */
1916                    0, req);
1917 }
1918
1919 static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1920 {
1921         struct in6_addr *dest, *src;
1922         __u16 destp, srcp;
1923         int timer_active;
1924         unsigned long timer_expires;
1925         struct inet_sock *inet = inet_sk(sp);
1926         struct tcp_sock *tp = tcp_sk(sp);
1927         const struct inet_connection_sock *icsk = inet_csk(sp);
1928         struct ipv6_pinfo *np = inet6_sk(sp);
1929
1930         dest  = &np->daddr;
1931         src   = &np->rcv_saddr;
1932         destp = ntohs(inet->dport);
1933         srcp  = ntohs(inet->sport);
1934
1935         if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1936                 timer_active    = 1;
1937                 timer_expires   = icsk->icsk_timeout;
1938         } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1939                 timer_active    = 4;
1940                 timer_expires   = icsk->icsk_timeout;
1941         } else if (timer_pending(&sp->sk_timer)) {
1942                 timer_active    = 2;
1943                 timer_expires   = sp->sk_timer.expires;
1944         } else {
1945                 timer_active    = 0;
1946                 timer_expires = jiffies;
1947         }
1948
1949         seq_printf(seq,
1950                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1951                    "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %p %lu %lu %u %u %d\n",
1952                    i,
1953                    src->s6_addr32[0], src->s6_addr32[1],
1954                    src->s6_addr32[2], src->s6_addr32[3], srcp,
1955                    dest->s6_addr32[0], dest->s6_addr32[1],
1956                    dest->s6_addr32[2], dest->s6_addr32[3], destp,
1957                    sp->sk_state,
1958                    tp->write_seq-tp->snd_una,
1959                    (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1960                    timer_active,
1961                    jiffies_to_clock_t(timer_expires - jiffies),
1962                    icsk->icsk_retransmits,
1963                    sock_i_uid(sp),
1964                    icsk->icsk_probes_out,
1965                    sock_i_ino(sp),
1966                    atomic_read(&sp->sk_refcnt), sp,
1967                    jiffies_to_clock_t(icsk->icsk_rto),
1968                    jiffies_to_clock_t(icsk->icsk_ack.ato),
1969                    (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
1970                    tp->snd_cwnd, tp->snd_ssthresh>=0xFFFF?-1:tp->snd_ssthresh
1971                    );
1972 }
1973
1974 static void get_timewait6_sock(struct seq_file *seq,
1975                                struct inet_timewait_sock *tw, int i)
1976 {
1977         struct in6_addr *dest, *src;
1978         __u16 destp, srcp;
1979         struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
1980         int ttd = tw->tw_ttd - jiffies;
1981
1982         if (ttd < 0)
1983                 ttd = 0;
1984
1985         dest = &tw6->tw_v6_daddr;
1986         src  = &tw6->tw_v6_rcv_saddr;
1987         destp = ntohs(tw->tw_dport);
1988         srcp  = ntohs(tw->tw_sport);
1989
1990         seq_printf(seq,
1991                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1992                    "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1993                    i,
1994                    src->s6_addr32[0], src->s6_addr32[1],
1995                    src->s6_addr32[2], src->s6_addr32[3], srcp,
1996                    dest->s6_addr32[0], dest->s6_addr32[1],
1997                    dest->s6_addr32[2], dest->s6_addr32[3], destp,
1998                    tw->tw_substate, 0, 0,
1999                    3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
2000                    atomic_read(&tw->tw_refcnt), tw);
2001 }
2002
2003 static int tcp6_seq_show(struct seq_file *seq, void *v)
2004 {
2005         struct tcp_iter_state *st;
2006
2007         if (v == SEQ_START_TOKEN) {
2008                 seq_puts(seq,
2009                          "  sl  "
2010                          "local_address                         "
2011                          "remote_address                        "
2012                          "st tx_queue rx_queue tr tm->when retrnsmt"
2013                          "   uid  timeout inode\n");
2014                 goto out;
2015         }
2016         st = seq->private;
2017
2018         switch (st->state) {
2019         case TCP_SEQ_STATE_LISTENING:
2020         case TCP_SEQ_STATE_ESTABLISHED:
2021                 get_tcp6_sock(seq, v, st->num);
2022                 break;
2023         case TCP_SEQ_STATE_OPENREQ:
2024                 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
2025                 break;
2026         case TCP_SEQ_STATE_TIME_WAIT:
2027                 get_timewait6_sock(seq, v, st->num);
2028                 break;
2029         }
2030 out:
2031         return 0;
2032 }
2033
2034 static struct tcp_seq_afinfo tcp6_seq_afinfo = {
2035         .name           = "tcp6",
2036         .family         = AF_INET6,
2037         .seq_fops       = {
2038                 .owner          = THIS_MODULE,
2039         },
2040         .seq_ops        = {
2041                 .show           = tcp6_seq_show,
2042         },
2043 };
2044
2045 int tcp6_proc_init(struct net *net)
2046 {
2047         return tcp_proc_register(net, &tcp6_seq_afinfo);
2048 }
2049
2050 void tcp6_proc_exit(struct net *net)
2051 {
2052         tcp_proc_unregister(net, &tcp6_seq_afinfo);
2053 }
2054 #endif
2055
2056 struct proto tcpv6_prot = {
2057         .name                   = "TCPv6",
2058         .owner                  = THIS_MODULE,
2059         .close                  = tcp_close,
2060         .connect                = tcp_v6_connect,
2061         .disconnect             = tcp_disconnect,
2062         .accept                 = inet_csk_accept,
2063         .ioctl                  = tcp_ioctl,
2064         .init                   = tcp_v6_init_sock,
2065         .destroy                = tcp_v6_destroy_sock,
2066         .shutdown               = tcp_shutdown,
2067         .setsockopt             = tcp_setsockopt,
2068         .getsockopt             = tcp_getsockopt,
2069         .recvmsg                = tcp_recvmsg,
2070         .backlog_rcv            = tcp_v6_do_rcv,
2071         .hash                   = tcp_v6_hash,
2072         .unhash                 = inet_unhash,
2073         .get_port               = inet_csk_get_port,
2074         .enter_memory_pressure  = tcp_enter_memory_pressure,
2075         .sockets_allocated      = &tcp_sockets_allocated,
2076         .memory_allocated       = &tcp_memory_allocated,
2077         .memory_pressure        = &tcp_memory_pressure,
2078         .orphan_count           = &tcp_orphan_count,
2079         .sysctl_mem             = sysctl_tcp_mem,
2080         .sysctl_wmem            = sysctl_tcp_wmem,
2081         .sysctl_rmem            = sysctl_tcp_rmem,
2082         .max_header             = MAX_TCP_HEADER,
2083         .obj_size               = sizeof(struct tcp6_sock),
2084         .twsk_prot              = &tcp6_timewait_sock_ops,
2085         .rsk_prot               = &tcp6_request_sock_ops,
2086         .h.hashinfo             = &tcp_hashinfo,
2087 #ifdef CONFIG_COMPAT
2088         .compat_setsockopt      = compat_tcp_setsockopt,
2089         .compat_getsockopt      = compat_tcp_getsockopt,
2090 #endif
2091 };
2092
2093 static struct inet6_protocol tcpv6_protocol = {
2094         .handler        =       tcp_v6_rcv,
2095         .err_handler    =       tcp_v6_err,
2096         .gso_send_check =       tcp_v6_gso_send_check,
2097         .gso_segment    =       tcp_tso_segment,
2098         .flags          =       INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
2099 };
2100
2101 static struct inet_protosw tcpv6_protosw = {
2102         .type           =       SOCK_STREAM,
2103         .protocol       =       IPPROTO_TCP,
2104         .prot           =       &tcpv6_prot,
2105         .ops            =       &inet6_stream_ops,
2106         .capability     =       -1,
2107         .no_check       =       0,
2108         .flags          =       INET_PROTOSW_PERMANENT |
2109                                 INET_PROTOSW_ICSK,
2110 };
2111
2112 static int tcpv6_net_init(struct net *net)
2113 {
2114         return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2115                                     SOCK_RAW, IPPROTO_TCP, net);
2116 }
2117
2118 static void tcpv6_net_exit(struct net *net)
2119 {
2120         inet_ctl_sock_destroy(net->ipv6.tcp_sk);
2121 }
2122
2123 static struct pernet_operations tcpv6_net_ops = {
2124         .init = tcpv6_net_init,
2125         .exit = tcpv6_net_exit,
2126 };
2127
2128 int __init tcpv6_init(void)
2129 {
2130         int ret;
2131
2132         ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2133         if (ret)
2134                 goto out;
2135
2136         /* register inet6 protocol */
2137         ret = inet6_register_protosw(&tcpv6_protosw);
2138         if (ret)
2139                 goto out_tcpv6_protocol;
2140
2141         ret = register_pernet_subsys(&tcpv6_net_ops);
2142         if (ret)
2143                 goto out_tcpv6_protosw;
2144 out:
2145         return ret;
2146
2147 out_tcpv6_protocol:
2148         inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2149 out_tcpv6_protosw:
2150         inet6_unregister_protosw(&tcpv6_protosw);
2151         goto out;
2152 }
2153
2154 void tcpv6_exit(void)
2155 {
2156         unregister_pernet_subsys(&tcpv6_net_ops);
2157         inet6_unregister_protosw(&tcpv6_protosw);
2158         inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2159 }