ipv6.c 29.0 KB
Newer Older
1 2
/*
 *	DCCP over IPv6
 *	Linux INET6 implementation
 *
 *	Based on net/dccp6/ipv6.c
 *
 *	Arnaldo Carvalho de Melo <acme@ghostprotocols.net>
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */

#include <linux/module.h>
#include <linux/random.h>
17
#include <linux/slab.h>
18 19 20 21 22
#include <linux/xfrm.h>

#include <net/addrconf.h>
#include <net/inet_common.h>
#include <net/inet_hashtables.h>
23
#include <net/inet_sock.h>
24 25 26 27 28 29
#include <net/inet6_connection_sock.h>
#include <net/inet6_hashtables.h>
#include <net/ip6_route.h>
#include <net/ipv6.h>
#include <net/protocol.h>
#include <net/transp_v6.h>
30
#include <net/ip6_checksum.h>
31
#include <net/xfrm.h>
32
#include <net/secure_seq.h>
33 34 35

#include "dccp.h"
#include "ipv6.h"
36
#include "feat.h"
37

38
/* The per-net dccp.v6_ctl_sk is used for sending RSTs and ACKs */
39

40 41
/*
 * Forward declarations: both operation tables are defined further down in
 * this file but are referenced earlier (connect and child-socket creation
 * switch a socket between them).
 */
static const struct inet_connection_sock_af_ops dccp_ipv6_mapped;
static const struct inet_connection_sock_af_ops dccp_ipv6_af_ops;
42

43
/* add pseudo-header to DCCP checksum stored in skb->csum */
44
static inline __sum16 dccp_v6_csum_finish(struct sk_buff *skb,
45 46
				      const struct in6_addr *saddr,
				      const struct in6_addr *daddr)
47
{
48 49 50
	return csum_ipv6_magic(saddr, daddr, skb->len, IPPROTO_DCCP, skb->csum);
}

51
static inline void dccp_v6_send_check(struct sock *sk, struct sk_buff *skb)
52 53 54 55 56
{
	struct ipv6_pinfo *np = inet6_sk(sk);
	struct dccp_hdr *dh = dccp_hdr(skb);

	dccp_csum_outgoing(skb);
57
	dh->dccph_checksum = dccp_v6_csum_finish(skb, &np->saddr, &sk->sk_v6_daddr);
58 59
}

60
static inline __u64 dccp_v6_init_sequence(struct sk_buff *skb)
61
{
62 63
	return secure_dccpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
					     ipv6_hdr(skb)->saddr.s6_addr32,
64 65 66
					     dccp_hdr(skb)->dccph_dport,
					     dccp_hdr(skb)->dccph_sport     );

67 68 69
}

/*
 * dccp_v6_err  -  ICMPv6 error handler (the .err_handler of dccp_v6_protocol)
 * @skb:    error message; skb->data is interpreted as an IPv6 header and
 *          skb->data + @offset as a DCCP header (presumably the packet
 *          quoted by the ICMPv6 message)
 * @opt:    not used here
 * @type:   ICMPv6 type; NDISC_REDIRECT and ICMPV6_PKT_TOOBIG get special
 *          treatment, everything else is mapped through icmpv6_err_convert()
 * @code:   ICMPv6 code, only passed to icmpv6_err_convert()
 * @offset: offset of the DCCP header from skb->data
 * @info:   type-specific word in network byte order; used as the new MTU
 *          for ICMPV6_PKT_TOOBIG
 *
 * Looks up the established socket the error refers to and either updates
 * its route (redirect), its path MTU, or reports the error on the socket.
 * The reference obtained by the lookup is dropped on every exit path.
 */
static void dccp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
			u8 type, u8 code, int offset, __be32 info)
{
	const struct ipv6hdr *hdr = (const struct ipv6hdr *)skb->data;
	const struct dccp_hdr *dh = (struct dccp_hdr *)(skb->data + offset);
	struct dccp_sock *dp;
	struct ipv6_pinfo *np;
	struct sock *sk;
	int err;
	__u64 seq;
	struct net *net = dev_net(skb->dev);

	/* The basic DCCP header must be fully contained in the message. */
	if (skb->len < offset + sizeof(*dh) ||
	    skb->len < offset + __dccp_basic_hdr_len(dh)) {
		ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
				   ICMP6_MIB_INERRORS);
		return;
	}

	sk = __inet6_lookup_established(net, &dccp_hashinfo,
					&hdr->daddr, dh->dccph_dport,
					&hdr->saddr, ntohs(dh->dccph_sport),
					inet6_iif(skb));

	if (!sk) {
		ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
				   ICMP6_MIB_INERRORS);
		return;
	}

	if (sk->sk_state == DCCP_TIME_WAIT) {
		inet_twsk_put(inet_twsk(sk));
		return;
	}
	seq = dccp_hdr_seq(dh);
	if (sk->sk_state == DCCP_NEW_SYN_RECV)
		return dccp_req_err(sk, seq);

	bh_lock_sock(sk);
	/* Only counted here; the individual branches decide what to skip. */
	if (sock_owned_by_user(sk))
		NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);

	if (sk->sk_state == DCCP_CLOSED)
		goto out;

	/*
	 * Except for REQUESTING/LISTEN sockets, ignore errors whose quoted
	 * sequence number lies outside [AWL, AWH].
	 */
	dp = dccp_sk(sk);
	if ((1 << sk->sk_state) & ~(DCCPF_REQUESTING | DCCPF_LISTEN) &&
	    !between48(seq, dp->dccps_awl, dp->dccps_awh)) {
		NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
		goto out;
	}

	np = inet6_sk(sk);

	if (type == NDISC_REDIRECT) {
		/*
		 * Do not touch the cached route while a process-context
		 * user owns the socket: it may be using or replacing
		 * sk's dst concurrently.  The PKT_TOOBIG branch below
		 * applies the same rule.
		 */
		if (!sock_owned_by_user(sk)) {
			struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);

			if (dst)
				dst->ops->redirect(dst, sk, skb);
		}
		goto out;
	}

	if (type == ICMPV6_PKT_TOOBIG) {
		struct dst_entry *dst = NULL;

		if (!ip6_sk_accept_pmtu(sk))
			goto out;

		if (sock_owned_by_user(sk))
			goto out;
		if ((1 << sk->sk_state) & (DCCPF_LISTEN | DCCPF_CLOSED))
			goto out;

		dst = inet6_csk_update_pmtu(sk, ntohl(info));
		if (!dst)
			goto out;

		/* Only ever shrink the MSS in response to the new path MTU. */
		if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst))
			dccp_sync_mss(sk, dst_mtu(dst));
		goto out;
	}

	icmpv6_err_convert(type, code, &err);

	/* Might be for an request_sock */
	switch (sk->sk_state) {
	case DCCP_REQUESTING:
	case DCCP_RESPOND:  /* Cannot happen.
			       It can, if SYNs are crossed. --ANK */
		if (!sock_owned_by_user(sk)) {
			DCCP_INC_STATS_BH(DCCP_MIB_ATTEMPTFAILS);
			sk->sk_err = err;
			/*
			 * Wake people up to see the error
			 * (see connect in sock.c)
			 */
			sk->sk_error_report(sk);
			dccp_done(sk);
		} else
			sk->sk_err_soft = err;
		goto out;
	}

	/*
	 * Hard error only if nobody owns the socket and the user asked for
	 * error reporting (recverr); otherwise remember it as a soft error.
	 */
	if (!sock_owned_by_user(sk) && np->recverr) {
		sk->sk_err = err;
		sk->sk_error_report(sk);
	} else
		sk->sk_err_soft = err;

out:
	bh_unlock_sock(sk);
	sock_put(sk);
}


184
static int dccp_v6_send_response(const struct sock *sk, struct request_sock *req)
185
{
186
	struct inet_request_sock *ireq = inet_rsk(req);
187 188
	struct ipv6_pinfo *np = inet6_sk(sk);
	struct sk_buff *skb;
189
	struct in6_addr *final_p, final;
190
	struct flowi6 fl6;
191
	int err = -1;
192
	struct dst_entry *dst;
193

194 195
	memset(&fl6, 0, sizeof(fl6));
	fl6.flowi6_proto = IPPROTO_DCCP;
196 197
	fl6.daddr = ireq->ir_v6_rmt_addr;
	fl6.saddr = ireq->ir_v6_loc_addr;
198
	fl6.flowlabel = 0;
199 200
	fl6.flowi6_oif = ireq->ir_iif;
	fl6.fl6_dport = ireq->ir_rmt_port;
E
Eric Dumazet 已提交
201
	fl6.fl6_sport = htons(ireq->ir_num);
202
	security_req_classify_flow(req, flowi6_to_flowi(&fl6));
203 204


205 206 207
	rcu_read_lock();
	final_p = fl6_update_dst(&fl6, rcu_dereference(np->opt), &final);
	rcu_read_unlock();
208

209
	dst = ip6_dst_lookup_flow(sk, &fl6, final_p);
210 211 212
	if (IS_ERR(dst)) {
		err = PTR_ERR(dst);
		dst = NULL;
213
		goto done;
214
	}
215 216 217 218

	skb = dccp_make_response(sk, dst, req);
	if (skb != NULL) {
		struct dccp_hdr *dh = dccp_hdr(skb);
A
Arnaldo Carvalho de Melo 已提交
219

220
		dh->dccph_checksum = dccp_v6_csum_finish(skb,
221 222 223
							 &ireq->ir_v6_loc_addr,
							 &ireq->ir_v6_rmt_addr);
		fl6.daddr = ireq->ir_v6_rmt_addr;
224 225 226 227
		rcu_read_lock();
		err = ip6_xmit(sk, skb, &fl6, rcu_dereference(np->opt),
			       np->tclass);
		rcu_read_unlock();
228
		err = net_xmit_eval(err);
229 230 231
	}

done:
232
	dst_release(dst);
233 234 235 236 237
	return err;
}

static void dccp_v6_reqsk_destructor(struct request_sock *req)
{
238
	dccp_feat_list_purge(&dccp_rsk(req)->dreq_featneg);
239
	kfree_skb(inet_rsk(req)->pktopts);
240 241
}

242
static void dccp_v6_ctl_send_reset(const struct sock *sk, struct sk_buff *rxskb)
243
{
244
	const struct ipv6hdr *rxip6h;
245
	struct sk_buff *skb;
246
	struct flowi6 fl6;
E
Eric Dumazet 已提交
247
	struct net *net = dev_net(skb_dst(rxskb)->dev);
248
	struct sock *ctl_sk = net->dccp.v6_ctl_sk;
E
Eric Dumazet 已提交
249
	struct dst_entry *dst;
250

251
	if (dccp_hdr(rxskb)->dccph_type == DCCP_PKT_RESET)
252 253 254
		return;

	if (!ipv6_unicast_destination(rxskb))
A
Arnaldo Carvalho de Melo 已提交
255
		return;
256

257
	skb = dccp_ctl_make_reset(ctl_sk, rxskb);
A
Arnaldo Carvalho de Melo 已提交
258
	if (skb == NULL)
259
		return;
260

261
	rxip6h = ipv6_hdr(rxskb);
262 263
	dccp_hdr(skb)->dccph_checksum = dccp_v6_csum_finish(skb, &rxip6h->saddr,
							    &rxip6h->daddr);
264

265
	memset(&fl6, 0, sizeof(fl6));
A
Alexey Dobriyan 已提交
266 267
	fl6.daddr = rxip6h->saddr;
	fl6.saddr = rxip6h->daddr;
268

269 270
	fl6.flowi6_proto = IPPROTO_DCCP;
	fl6.flowi6_oif = inet6_iif(rxskb);
271 272
	fl6.fl6_dport = dccp_hdr(skb)->dccph_dport;
	fl6.fl6_sport = dccp_hdr(skb)->dccph_sport;
273
	security_skb_classify_flow(rxskb, flowi6_to_flowi(&fl6));
274 275

	/* sk = NULL, but it is safe for now. RST socket required. */
276
	dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL);
277 278
	if (!IS_ERR(dst)) {
		skb_dst_set(skb, dst);
279
		ip6_xmit(ctl_sk, skb, &fl6, NULL, 0);
280 281 282
		DCCP_INC_STATS_BH(DCCP_MIB_OUTSEGS);
		DCCP_INC_STATS_BH(DCCP_MIB_OUTRSTS);
		return;
283 284 285 286 287
	}

	kfree_skb(skb);
}

288 289 290 291 292 293 294
static struct request_sock_ops dccp6_request_sock_ops = {
	.family		= AF_INET6,
	.obj_size	= sizeof(struct dccp6_request_sock),
	.rtx_syn_ack	= dccp_v6_send_response,
	.send_ack	= dccp_reqsk_send_ack,
	.destructor	= dccp_v6_reqsk_destructor,
	.send_reset	= dccp_v6_ctl_send_reset,
295
	.syn_ack_timeout = dccp_syn_ack_timeout,
296 297
};

298 299 300 301
static int dccp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
{
	struct request_sock *req;
	struct dccp_request_sock *dreq;
302
	struct inet_request_sock *ireq;
303
	struct ipv6_pinfo *np = inet6_sk(sk);
304
	const __be32 service = dccp_hdr_request(skb)->dccph_req_service;
305 306 307 308 309 310
	struct dccp_skb_cb *dcb = DCCP_SKB_CB(skb);

	if (skb->protocol == htons(ETH_P_IP))
		return dccp_v4_conn_request(sk, skb);

	if (!ipv6_unicast_destination(skb))
311
		return 0;	/* discard, don't send a reset here */
312 313

	if (dccp_bad_service_code(sk, service)) {
314
		dcb->dccpd_reset_code = DCCP_RESET_CODE_BAD_SERVICE_CODE;
315
		goto drop;
316
	}
317
	/*
A
Arnaldo Carvalho de Melo 已提交
318
	 * There are no SYN attacks on IPv6, yet...
319
	 */
320
	dcb->dccpd_reset_code = DCCP_RESET_CODE_TOO_BUSY;
321
	if (inet_csk_reqsk_queue_is_full(sk))
A
Arnaldo Carvalho de Melo 已提交
322
		goto drop;
323 324 325 326

	if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
		goto drop;

327
	req = inet_reqsk_alloc(&dccp6_request_sock_ops, sk, true);
328 329 330
	if (req == NULL)
		goto drop;

331 332
	if (dccp_reqsk_init(req, dccp_sk(sk), skb))
		goto drop_and_free;
333

334 335 336 337
	dreq = dccp_rsk(req);
	if (dccp_parse_options(sk, dreq, skb))
		goto drop_and_free;

338 339 340
	if (security_inet_conn_request(sk, skb, req))
		goto drop_and_free;

341 342 343
	ireq = inet_rsk(req);
	ireq->ir_v6_rmt_addr = ipv6_hdr(skb)->saddr;
	ireq->ir_v6_loc_addr = ipv6_hdr(skb)->daddr;
E
Eric Dumazet 已提交
344
	ireq->ireq_family = AF_INET6;
345

346
	if (ipv6_opt_accepted(sk, skb, IP6CB(skb)) ||
347 348 349
	    np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
	    np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
		atomic_inc(&skb->users);
350
		ireq->pktopts = skb;
351
	}
352
	ireq->ir_iif = sk->sk_bound_dev_if;
353 354 355

	/* So that link locals have meaning */
	if (!sk->sk_bound_dev_if &&
356 357
	    ipv6_addr_type(&ireq->ir_v6_rmt_addr) & IPV6_ADDR_LINKLOCAL)
		ireq->ir_iif = inet6_iif(skb);
358

A
Arnaldo Carvalho de Melo 已提交
359
	/*
360 361
	 * Step 3: Process LISTEN state
	 *
362
	 *   Set S.ISR, S.GSR, S.SWL, S.SWH from packet or Init Cookie
363
	 *
364
	 * Setting S.SWL/S.SWH to is deferred to dccp_create_openreq_child().
365 366
	 */
	dreq->dreq_isr	   = dcb->dccpd_seq;
367
	dreq->dreq_gsr     = dreq->dreq_isr;
368
	dreq->dreq_iss	   = dccp_v6_init_sequence(skb);
369
	dreq->dreq_gss     = dreq->dreq_iss;
370 371
	dreq->dreq_service = service;

C
Christoph Paasch 已提交
372
	if (dccp_v6_send_response(sk, req))
373 374
		goto drop_and_free;

375
	inet_csk_reqsk_queue_hash_add(sk, req, DCCP_TIMEOUT_INIT);
376 377 378 379 380 381 382 383 384
	return 0;

drop_and_free:
	reqsk_free(req);
drop:
	DCCP_INC_STATS_BH(DCCP_MIB_ATTEMPTFAILS);
	return -1;
}

385
/*
 * dccp_v6_request_recv_sock  -  create the child socket for a request
 * @sk:         listening socket
 * @skb:        packet that completes the handshake
 * @req:        request sock the child is created from
 * @dst:        route to the peer, or NULL to have it looked up here
 * @req_unhash: request sock to replace in the established hash
 * @own_req:    set to the result of inet_ehash_nolisten()
 *
 * For IPv4 packets (v6-mapped case) the child is created by
 * dccp_v4_request_recv_sock() and then fitted with the IPv6 private area.
 *
 * Returns the new socket, or NULL on failure.
 */
static struct sock *dccp_v6_request_recv_sock(const struct sock *sk,
					      struct sk_buff *skb,
					      struct request_sock *req,
					      struct dst_entry *dst,
					      struct request_sock *req_unhash,
					      bool *own_req)
{
	struct inet_request_sock *ireq = inet_rsk(req);
	struct ipv6_pinfo *newnp;
	const struct ipv6_pinfo *np = inet6_sk(sk);
	struct ipv6_txoptions *opt;
	struct inet_sock *newinet;
	struct dccp6_sock *newdp6;
	struct sock *newsk;

	if (skb->protocol == htons(ETH_P_IP)) {
		/*
		 *	v6 mapped
		 */
		newsk = dccp_v4_request_recv_sock(sk, skb, req, dst,
						  req_unhash, own_req);
		if (newsk == NULL)
			return NULL;

		newdp6 = (struct dccp6_sock *)newsk;
		newinet = inet_sk(newsk);
		newinet->pinet6 = &newdp6->inet6;
		newnp = inet6_sk(newsk);

		memcpy(newnp, np, sizeof(struct ipv6_pinfo));

		newnp->saddr = newsk->sk_v6_rcv_saddr;

		inet_csk(newsk)->icsk_af_ops = &dccp_ipv6_mapped;
		newsk->sk_backlog_rcv = dccp_v4_do_rcv;
		/*
		 * The memcpy() above copied the listener's list heads too.
		 * The child must not share (and later free) the parent's
		 * multicast, anycast and flow-label lists.
		 */
		newnp->ipv6_mc_list = NULL;
		newnp->ipv6_ac_list = NULL;
		newnp->ipv6_fl_list = NULL;
		newnp->pktoptions  = NULL;
		newnp->opt	   = NULL;
		newnp->mcast_oif   = inet6_iif(skb);
		newnp->mcast_hops  = ipv6_hdr(skb)->hop_limit;

		/*
		 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
		 * here, dccp_create_openreq_child now does this for us, see the comment in
		 * that function for the gory details. -acme
		 */

		/* It is tricky place. Until this moment IPv4 tcp
		   worked with IPv6 icsk.icsk_af_ops.
		   Sync it now.
		 */
		dccp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);

		return newsk;
	}


	if (sk_acceptq_is_full(sk))
		goto out_overflow;

	if (!dst) {
		struct flowi6 fl6;

		dst = inet6_csk_route_req(sk, &fl6, req, IPPROTO_DCCP);
		if (!dst)
			goto out;
	}

	newsk = dccp_create_openreq_child(sk, req, skb);
	if (newsk == NULL)
		goto out_nonewsk;

	/*
	 * No need to charge this sock to the relevant IPv6 refcnt debug socks
	 * count here, dccp_create_openreq_child now does this for us, see the
	 * comment in that function for the gory details. -acme
	 */

	ip6_dst_store(newsk, dst, NULL, NULL);
	newsk->sk_route_caps = dst->dev->features & ~(NETIF_F_IP_CSUM |
						      NETIF_F_TSO);
	newdp6 = (struct dccp6_sock *)newsk;
	newinet = inet_sk(newsk);
	newinet->pinet6 = &newdp6->inet6;
	newnp = inet6_sk(newsk);

	memcpy(newnp, np, sizeof(struct ipv6_pinfo));

	newsk->sk_v6_daddr	= ireq->ir_v6_rmt_addr;
	newnp->saddr		= ireq->ir_v6_loc_addr;
	newsk->sk_v6_rcv_saddr	= ireq->ir_v6_loc_addr;
	newsk->sk_bound_dev_if	= ireq->ir_iif;

	/* Now IPv6 options...

	   First: no IPv4 options.
	 */
	newinet->inet_opt = NULL;

	/* Clone RX bits */
	newnp->rxopt.all = np->rxopt.all;

	/*
	 * As in the mapped case: drop the list heads inherited through the
	 * memcpy() so that parent and child never own the same lists.
	 */
	newnp->ipv6_mc_list = NULL;
	newnp->ipv6_ac_list = NULL;
	newnp->ipv6_fl_list = NULL;
	newnp->pktoptions = NULL;
	newnp->opt	  = NULL;
	newnp->mcast_oif  = inet6_iif(skb);
	newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;

	/*
	 * Clone native IPv6 options from listening socket (if any)
	 *
	 * Yes, keeping reference count would be much more clever, but we make
	 * one more one thing there: reattach optmem to newsk.
	 */
	opt = rcu_dereference(np->opt);
	if (opt) {
		opt = ipv6_dup_options(newsk, opt);
		RCU_INIT_POINTER(newnp->opt, opt);
	}
	inet_csk(newsk)->icsk_ext_hdr_len = 0;
	if (opt)
		inet_csk(newsk)->icsk_ext_hdr_len = opt->opt_nflen +
						    opt->opt_flen;

	dccp_sync_mss(newsk, dst_mtu(dst));

	newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
	newinet->inet_rcv_saddr = LOOPBACK4_IPV6;

	if (__inet_inherit_port(sk, newsk) < 0) {
		inet_csk_prepare_forced_close(newsk);
		dccp_done(newsk);
		goto out;
	}
	*own_req = inet_ehash_nolisten(newsk, req_to_sk(req_unhash));
	/* Clone pktoptions received with SYN, if we own the req */
	if (*own_req && ireq->pktopts) {
		newnp->pktoptions = skb_clone(ireq->pktopts, GFP_ATOMIC);
		consume_skb(ireq->pktopts);
		ireq->pktopts = NULL;
		if (newnp->pktoptions)
			skb_set_owner_r(newnp->pktoptions, newsk);
	}

	return newsk;

out_overflow:
	NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
out_nonewsk:
	dst_release(dst);
out:
	NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
	return NULL;
}

/* The socket must have it's spinlock held when we get
 * here.
 *
 * We have a potential double-lock case here, so even when
 * doing backlog processing we use the BH locking scheme.
 * This is because we cannot sleep with the original spinlock
 * held.
 */
static int dccp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
{
	struct ipv6_pinfo *np = inet6_sk(sk);
	struct sk_buff *opt_skb = NULL;

	/* Imagine: socket is IPv6. IPv4 packet arrives,
	   goes to IPv4 receive handler and backlogged.
	   From backlog it always goes here. Kerboom...
	   Fortunately, dccp_rcv_established and rcv_established
	   handle them correctly, but it is not case with
	   dccp_v6_hnd_req and dccp_v6_ctl_send_reset().   --ANK
	 */

	if (skb->protocol == htons(ETH_P_IP))
		return dccp_v4_do_rcv(sk, skb);

562
	if (sk_filter(sk, skb))
563 564 565
		goto discard;

	/*
A
Arnaldo Carvalho de Melo 已提交
566 567
	 * socket locking is here for SMP purposes as backlog rcv is currently
	 * called with bh processing disabled.
568 569 570 571 572 573 574 575 576 577 578 579 580
	 */

	/* Do Stevens' IPV6_PKTOPTIONS.

	   Yes, guys, it is the only place in our code, where we
	   may make it not affecting IPv4.
	   The rest of code is protocol independent,
	   and I do not like idea to uglify IPv4.

	   Actually, all the idea behind IPV6_PKTOPTIONS
	   looks not very well thought. For now we latch
	   options, received in the last packet, enqueued
	   by tcp. Feel free to propose better solution.
581
					       --ANK (980728)
582 583
	 */
	if (np->rxopt.all)
584 585 586 587
	/*
	 * FIXME: Add handling of IPV6_PKTOPTIONS skb. See the comments below
	 *        (wrt ipv6_pktopions) and net/ipv6/tcp_ipv6.c for an example.
	 */
588 589 590 591 592
		opt_skb = skb_clone(skb, GFP_ATOMIC);

	if (sk->sk_state == DCCP_OPEN) { /* Fast path */
		if (dccp_rcv_established(sk, skb, dccp_hdr(skb), skb->len))
			goto reset;
D
David S. Miller 已提交
593
		if (opt_skb) {
594
			/* XXX This is where we would goto ipv6_pktoptions. */
D
David S. Miller 已提交
595 596
			__kfree_skb(opt_skb);
		}
597 598 599
		return 0;
	}

600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623
	/*
	 *  Step 3: Process LISTEN state
	 *     If S.state == LISTEN,
	 *	 If P.type == Request or P contains a valid Init Cookie option,
	 *	      (* Must scan the packet's options to check for Init
	 *		 Cookies.  Only Init Cookies are processed here,
	 *		 however; other options are processed in Step 8.  This
	 *		 scan need only be performed if the endpoint uses Init
	 *		 Cookies *)
	 *	      (* Generate a new socket and switch to that socket *)
	 *	      Set S := new socket for this port pair
	 *	      S.state = RESPOND
	 *	      Choose S.ISS (initial seqno) or set from Init Cookies
	 *	      Initialize S.GAR := S.ISS
	 *	      Set S.ISR, S.GSR, S.SWL, S.SWH from packet or Init Cookies
	 *	      Continue with S.state == RESPOND
	 *	      (* A Response packet will be generated in Step 11 *)
	 *	 Otherwise,
	 *	      Generate Reset(No Connection) unless P.type == Reset
	 *	      Drop packet and return
	 *
	 * NOTE: the check for the packet types is done in
	 *	 dccp_rcv_state_process
	 */
624 625 626

	if (dccp_rcv_state_process(sk, skb, dccp_hdr(skb), skb->len))
		goto reset;
D
David S. Miller 已提交
627
	if (opt_skb) {
628
		/* XXX This is where we would goto ipv6_pktoptions. */
D
David S. Miller 已提交
629 630
		__kfree_skb(opt_skb);
	}
631 632 633
	return 0;

reset:
634
	dccp_v6_ctl_send_reset(sk, skb);
635
discard:
A
Arnaldo Carvalho de Melo 已提交
636
	if (opt_skb != NULL)
637 638 639 640 641
		__kfree_skb(opt_skb);
	kfree_skb(skb);
	return 0;
}

642
static int dccp_v6_rcv(struct sk_buff *skb)
643 644 645
{
	const struct dccp_hdr *dh;
	struct sock *sk;
646
	int min_cov;
647

648
	/* Step 1: Check header basics */
649 650 651 652

	if (dccp_invalid_packet(skb))
		goto discard_it;

653
	/* Step 1: If header checksum is incorrect, drop packet and return. */
654 655
	if (dccp_v6_csum_finish(skb, &ipv6_hdr(skb)->saddr,
				     &ipv6_hdr(skb)->daddr)) {
656
		DCCP_WARN("dropped packet with invalid checksum\n");
657 658 659
		goto discard_it;
	}

660 661
	dh = dccp_hdr(skb);

662
	DCCP_SKB_CB(skb)->dccpd_seq  = dccp_hdr_seq(dh);
663 664 665 666 667 668 669
	DCCP_SKB_CB(skb)->dccpd_type = dh->dccph_type;

	if (dccp_packet_without_ack(skb))
		DCCP_SKB_CB(skb)->dccpd_ack_seq = DCCP_PKT_WITHOUT_ACK_SEQ;
	else
		DCCP_SKB_CB(skb)->dccpd_ack_seq = dccp_hdr_ack_seq(skb);

670
lookup:
671
	sk = __inet6_lookup_skb(&dccp_hashinfo, skb, __dccp_hdr_len(dh),
E
Eric Dumazet 已提交
672 673
			        dh->dccph_sport, dh->dccph_dport,
				inet6_iif(skb));
674
	if (!sk) {
675 676
		dccp_pr_debug("failed to look up flow ID in table and "
			      "get corresponding socket\n");
677
		goto no_dccp_socket;
678
	}
679

A
Arnaldo Carvalho de Melo 已提交
680
	/*
681
	 * Step 2:
682
	 *	... or S.state == TIMEWAIT,
683 684 685
	 *		Generate Reset(No Connection) unless P.type == Reset
	 *		Drop packet and return
	 */
686 687 688 689 690
	if (sk->sk_state == DCCP_TIME_WAIT) {
		dccp_pr_debug("sk->sk_state == DCCP_TIME_WAIT: do_time_wait\n");
		inet_twsk_put(inet_twsk(sk));
		goto no_dccp_socket;
	}
691

692 693 694 695 696
	if (sk->sk_state == DCCP_NEW_SYN_RECV) {
		struct request_sock *req = inet_reqsk(sk);
		struct sock *nsk = NULL;

		sk = req->rsk_listener;
697
		if (likely(sk->sk_state == DCCP_LISTEN)) {
698
			nsk = dccp_check_req(sk, skb, req);
699
		} else {
700
			inet_csk_reqsk_queue_drop_and_put(sk, req);
701 702
			goto lookup;
		}
703 704 705 706 707 708 709 710 711 712 713 714 715 716
		if (!nsk) {
			reqsk_put(req);
			goto discard_it;
		}
		if (nsk == sk) {
			sock_hold(sk);
			reqsk_put(req);
		} else if (dccp_child_process(sk, nsk, skb)) {
			dccp_v6_ctl_send_reset(sk, skb);
			goto discard_it;
		} else {
			return 0;
		}
	}
717 718
	/*
	 * RFC 4340, sec. 9.2.1: Minimum Checksum Coverage
719 720
	 *	o if MinCsCov = 0, only packets with CsCov = 0 are accepted
	 *	o if MinCsCov > 0, also accept packets with CsCov >= MinCsCov
721 722 723 724 725 726 727 728 729
	 */
	min_cov = dccp_sk(sk)->dccps_pcrlen;
	if (dh->dccph_cscov  &&  (min_cov == 0 || dh->dccph_cscov < min_cov))  {
		dccp_pr_debug("Packet CsCov %d does not satisfy MinCsCov %d\n",
			      dh->dccph_cscov, min_cov);
		/* FIXME: send Data Dropped option (see also dccp_v4_rcv) */
		goto discard_and_relse;
	}

730 731 732
	if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
		goto discard_and_relse;

733
	return sk_receive_skb(sk, skb, 1) ? -1 : 0;
734 735 736 737 738 739

no_dccp_socket:
	if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
		goto discard_it;
	/*
	 * Step 2:
740
	 *	If no socket ...
741 742 743 744 745 746
	 *		Generate Reset(No Connection) unless P.type == Reset
	 *		Drop packet and return
	 */
	if (dh->dccph_type != DCCP_PKT_RESET) {
		DCCP_SKB_CB(skb)->dccpd_reset_code =
					DCCP_RESET_CODE_NO_CONNECTION;
747
		dccp_v6_ctl_send_reset(sk, skb);
748 749
	}

750
discard_it:
751 752 753 754 755 756 757 758
	kfree_skb(skb);
	return 0;

discard_and_relse:
	sock_put(sk);
	goto discard_it;
}

759 760 761 762 763 764 765 766
static int dccp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
			   int addr_len)
{
	struct sockaddr_in6 *usin = (struct sockaddr_in6 *)uaddr;
	struct inet_connection_sock *icsk = inet_csk(sk);
	struct inet_sock *inet = inet_sk(sk);
	struct ipv6_pinfo *np = inet6_sk(sk);
	struct dccp_sock *dp = dccp_sk(sk);
767
	struct in6_addr *saddr = NULL, *final_p, final;
768
	struct ipv6_txoptions *opt;
769
	struct flowi6 fl6;
770 771 772 773 774 775 776 777 778 779 780 781
	struct dst_entry *dst;
	int addr_type;
	int err;

	dp->dccps_role = DCCP_ROLE_CLIENT;

	if (addr_len < SIN6_LEN_RFC2133)
		return -EINVAL;

	if (usin->sin6_family != AF_INET6)
		return -EAFNOSUPPORT;

782
	memset(&fl6, 0, sizeof(fl6));
783 784

	if (np->sndflow) {
785 786 787
		fl6.flowlabel = usin->sin6_flowinfo & IPV6_FLOWINFO_MASK;
		IP6_ECN_flow_init(fl6.flowlabel);
		if (fl6.flowlabel & IPV6_FLOWLABEL_MASK) {
788
			struct ip6_flowlabel *flowlabel;
789
			flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823
			if (flowlabel == NULL)
				return -EINVAL;
			fl6_sock_release(flowlabel);
		}
	}
	/*
	 * connect() to INADDR_ANY means loopback (BSD'ism).
	 */
	if (ipv6_addr_any(&usin->sin6_addr))
		usin->sin6_addr.s6_addr[15] = 1;

	addr_type = ipv6_addr_type(&usin->sin6_addr);

	if (addr_type & IPV6_ADDR_MULTICAST)
		return -ENETUNREACH;

	if (addr_type & IPV6_ADDR_LINKLOCAL) {
		if (addr_len >= sizeof(struct sockaddr_in6) &&
		    usin->sin6_scope_id) {
			/* If interface is set while binding, indices
			 * must coincide.
			 */
			if (sk->sk_bound_dev_if &&
			    sk->sk_bound_dev_if != usin->sin6_scope_id)
				return -EINVAL;

			sk->sk_bound_dev_if = usin->sin6_scope_id;
		}

		/* Connect to link-local address requires an interface */
		if (!sk->sk_bound_dev_if)
			return -EINVAL;
	}

824
	sk->sk_v6_daddr = usin->sin6_addr;
825
	np->flow_label = fl6.flowlabel;
826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852

	/*
	 * DCCP over IPv4
	 */
	if (addr_type == IPV6_ADDR_MAPPED) {
		u32 exthdrlen = icsk->icsk_ext_hdr_len;
		struct sockaddr_in sin;

		SOCK_DEBUG(sk, "connect: ipv4 mapped\n");

		if (__ipv6_only_sock(sk))
			return -ENETUNREACH;

		sin.sin_family = AF_INET;
		sin.sin_port = usin->sin6_port;
		sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];

		icsk->icsk_af_ops = &dccp_ipv6_mapped;
		sk->sk_backlog_rcv = dccp_v4_do_rcv;

		err = dccp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
		if (err) {
			icsk->icsk_ext_hdr_len = exthdrlen;
			icsk->icsk_af_ops = &dccp_ipv6_af_ops;
			sk->sk_backlog_rcv = dccp_v6_do_rcv;
			goto failure;
		}
853
		np->saddr = sk->sk_v6_rcv_saddr;
854 855 856
		return err;
	}

857 858
	if (!ipv6_addr_any(&sk->sk_v6_rcv_saddr))
		saddr = &sk->sk_v6_rcv_saddr;
859

860
	fl6.flowi6_proto = IPPROTO_DCCP;
861
	fl6.daddr = sk->sk_v6_daddr;
A
Alexey Dobriyan 已提交
862
	fl6.saddr = saddr ? *saddr : np->saddr;
863
	fl6.flowi6_oif = sk->sk_bound_dev_if;
864 865
	fl6.fl6_dport = usin->sin6_port;
	fl6.fl6_sport = inet->inet_sport;
866
	security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
867

868 869
	opt = rcu_dereference_protected(np->opt, sock_owned_by_user(sk));
	final_p = fl6_update_dst(&fl6, opt, &final);
870

871
	dst = ip6_dst_lookup_flow(sk, &fl6, final_p);
872 873
	if (IS_ERR(dst)) {
		err = PTR_ERR(dst);
874
		goto failure;
875
	}
876 877

	if (saddr == NULL) {
878
		saddr = &fl6.saddr;
879
		sk->sk_v6_rcv_saddr = *saddr;
880 881 882
	}

	/* set the source address */
A
Alexey Dobriyan 已提交
883
	np->saddr = *saddr;
E
Eric Dumazet 已提交
884
	inet->inet_rcv_saddr = LOOPBACK4_IPV6;
885

E
Eric Dumazet 已提交
886
	ip6_dst_store(sk, dst, NULL, NULL);
887 888

	icsk->icsk_ext_hdr_len = 0;
889 890
	if (opt)
		icsk->icsk_ext_hdr_len = opt->opt_flen + opt->opt_nflen;
891

E
Eric Dumazet 已提交
892
	inet->inet_dport = usin->sin6_port;
893 894 895 896 897

	dccp_set_state(sk, DCCP_REQUESTING);
	err = inet6_hash_connect(&dccp_death_row, sk);
	if (err)
		goto late_failure;
898 899

	dp->dccps_iss = secure_dccpv6_sequence_number(np->saddr.s6_addr32,
900
						      sk->sk_v6_daddr.s6_addr32,
E
Eric Dumazet 已提交
901 902
						      inet->inet_sport,
						      inet->inet_dport);
903 904 905 906 907 908 909 910 911 912
	err = dccp_connect(sk);
	if (err)
		goto late_failure;

	return 0;

late_failure:
	dccp_set_state(sk, DCCP_CLOSED);
	__sk_dst_reset(sk);
failure:
E
Eric Dumazet 已提交
913
	inet->inet_dport = 0;
914 915 916 917
	sk->sk_route_caps = 0;
	return err;
}

918
static const struct inet_connection_sock_af_ops dccp_ipv6_af_ops = {
919 920 921 922 923 924 925 926 927 928
	.queue_xmit	   = inet6_csk_xmit,
	.send_check	   = dccp_v6_send_check,
	.rebuild_header	   = inet6_sk_rebuild_header,
	.conn_request	   = dccp_v6_conn_request,
	.syn_recv_sock	   = dccp_v6_request_recv_sock,
	.net_header_len	   = sizeof(struct ipv6hdr),
	.setsockopt	   = ipv6_setsockopt,
	.getsockopt	   = ipv6_getsockopt,
	.addr2sockaddr	   = inet6_csk_addr2sockaddr,
	.sockaddr_len	   = sizeof(struct sockaddr_in6),
929
	.bind_conflict	   = inet6_csk_bind_conflict,
930
#ifdef CONFIG_COMPAT
931 932
	.compat_setsockopt = compat_ipv6_setsockopt,
	.compat_getsockopt = compat_ipv6_getsockopt,
933
#endif
934 935 936 937 938
};

/*
 *	DCCP over IPv4 via INET6 API
 */
939
static const struct inet_connection_sock_af_ops dccp_ipv6_mapped = {
940 941 942 943 944 945 946 947 948 949
	.queue_xmit	   = ip_queue_xmit,
	.send_check	   = dccp_v4_send_check,
	.rebuild_header	   = inet_sk_rebuild_header,
	.conn_request	   = dccp_v6_conn_request,
	.syn_recv_sock	   = dccp_v6_request_recv_sock,
	.net_header_len	   = sizeof(struct iphdr),
	.setsockopt	   = ipv6_setsockopt,
	.getsockopt	   = ipv6_getsockopt,
	.addr2sockaddr	   = inet6_csk_addr2sockaddr,
	.sockaddr_len	   = sizeof(struct sockaddr_in6),
950
#ifdef CONFIG_COMPAT
951 952
	.compat_setsockopt = compat_ipv6_setsockopt,
	.compat_getsockopt = compat_ipv6_getsockopt,
953
#endif
954 955 956 957 958 959 960
};

/* NOTE: A lot of things set to zero explicitly by call to
 *       sk_alloc() so need not be done here.
 */
static int dccp_v6_init_sock(struct sock *sk)
{
961 962
	static __u8 dccp_v6_ctl_sock_initialized;
	int err = dccp_init_sock(sk, dccp_v6_ctl_sock_initialized);
963

964 965 966
	if (err == 0) {
		if (unlikely(!dccp_v6_ctl_sock_initialized))
			dccp_v6_ctl_sock_initialized = 1;
967
		inet_csk(sk)->icsk_af_ops = &dccp_ipv6_af_ops;
968
	}
969 970 971 972

	return err;
}

973
/*
 * Socket teardown (.destroy of dccp_v6_prot): DCCP-level state first,
 * then the IPv6-level state.
 */
static void dccp_v6_destroy_sock(struct sock *sk)
{
	/* protocol state */
	dccp_destroy_sock(sk);

	/* address-family state */
	inet6_destroy_sock(sk);
}

979 980 981 982
/*
 * Time-wait sock operations for DCCPv6 (referenced as .twsk_prot of
 * dccp_v6_prot); only the object size is specified.
 */
static struct timewait_sock_ops dccp6_timewait_sock_ops = {
	.twsk_obj_size	= sizeof(struct dccp6_timewait_sock),
};

983
static struct proto dccp_v6_prot = {
984 985 986 987 988 989 990 991 992 993 994 995
	.name		   = "DCCPv6",
	.owner		   = THIS_MODULE,
	.close		   = dccp_close,
	.connect	   = dccp_v6_connect,
	.disconnect	   = dccp_disconnect,
	.ioctl		   = dccp_ioctl,
	.init		   = dccp_v6_init_sock,
	.setsockopt	   = dccp_setsockopt,
	.getsockopt	   = dccp_getsockopt,
	.sendmsg	   = dccp_sendmsg,
	.recvmsg	   = dccp_recvmsg,
	.backlog_rcv	   = dccp_v6_do_rcv,
996
	.hash		   = inet6_hash,
997
	.unhash		   = inet_unhash,
998
	.accept		   = inet_csk_accept,
999
	.get_port	   = inet_csk_get_port,
1000 1001 1002 1003 1004
	.shutdown	   = dccp_shutdown,
	.destroy	   = dccp_v6_destroy_sock,
	.orphan_count	   = &dccp_orphan_count,
	.max_header	   = MAX_DCCP_HEADER,
	.obj_size	   = sizeof(struct dccp6_sock),
1005
	.slab_flags	   = SLAB_DESTROY_BY_RCU,
1006 1007
	.rsk_prot	   = &dccp6_request_sock_ops,
	.twsk_prot	   = &dccp6_timewait_sock_ops,
1008
	.h.hashinfo	   = &dccp_hashinfo,
1009
#ifdef CONFIG_COMPAT
1010 1011
	.compat_setsockopt = compat_dccp_setsockopt,
	.compat_getsockopt = compat_dccp_getsockopt,
1012
#endif
1013 1014
};

1015
static const struct inet6_protocol dccp_v6_protocol = {
A
Arnaldo Carvalho de Melo 已提交
1016 1017 1018
	.handler	= dccp_v6_rcv,
	.err_handler	= dccp_v6_err,
	.flags		= INET6_PROTO_NOPOLICY | INET6_PROTO_FINAL,
1019 1020
};

1021
static const struct proto_ops inet6_dccp_ops = {
1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039
	.family		   = PF_INET6,
	.owner		   = THIS_MODULE,
	.release	   = inet6_release,
	.bind		   = inet6_bind,
	.connect	   = inet_stream_connect,
	.socketpair	   = sock_no_socketpair,
	.accept		   = inet_accept,
	.getname	   = inet6_getname,
	.poll		   = dccp_poll,
	.ioctl		   = inet6_ioctl,
	.listen		   = inet_dccp_listen,
	.shutdown	   = inet_shutdown,
	.setsockopt	   = sock_common_setsockopt,
	.getsockopt	   = sock_common_getsockopt,
	.sendmsg	   = inet_sendmsg,
	.recvmsg	   = sock_common_recvmsg,
	.mmap		   = sock_no_mmap,
	.sendpage	   = sock_no_sendpage,
1040
#ifdef CONFIG_COMPAT
1041 1042
	.compat_setsockopt = compat_sock_common_setsockopt,
	.compat_getsockopt = compat_sock_common_getsockopt,
1043
#endif
1044 1045 1046 1047 1048 1049 1050
};

static struct inet_protosw dccp_v6_protosw = {
	.type		= SOCK_DCCP,
	.protocol	= IPPROTO_DCCP,
	.prot		= &dccp_v6_prot,
	.ops		= &inet6_dccp_ops,
1051
	.flags		= INET_PROTOSW_ICSK,
1052 1053
};

1054
/*
 * Per-namespace set-up: create the control socket stored in
 * net->dccp.v6_ctl_sk.
 *
 * Fails with -ESOCKTNOSUPPORT when dccp_hashinfo.bhash has not been set up;
 * otherwise returns the result of inet_ctl_sock_create().
 */
static int __net_init dccp_v6_init_net(struct net *net)
{
	struct sock **ctl_skp = &net->dccp.v6_ctl_sk;

	if (!dccp_hashinfo.bhash)
		return -ESOCKTNOSUPPORT;

	return inet_ctl_sock_create(ctl_skp, PF_INET6, SOCK_DCCP,
				    IPPROTO_DCCP, net);
}

1063
/* Per-namespace teardown: destroy the control socket of this namespace. */
static void __net_exit dccp_v6_exit_net(struct net *net)
{
	struct sock *ctl_sk = net->dccp.v6_ctl_sk;

	inet_ctl_sock_destroy(ctl_sk);
}

/*
 * Per-network-namespace hooks: create the DCCPv6 control socket when a
 * namespace is set up and destroy it when the namespace goes away.
 */
static struct pernet_operations dccp_v6_ops = {
	.init   = dccp_v6_init_net,
	.exit   = dccp_v6_exit_net,
};

1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084
/*
 * Module initialisation.
 *
 * Registration order matters: the receive handler (dccp_v6_protocol) is
 * installed last.  dccp_v6_rcv() may call dccp_v6_ctl_send_reset(), which
 * uses net->dccp.v6_ctl_sk, and that socket only exists once the pernet
 * operations have run.  Installing the handler earlier would open a window
 * in which an incoming packet is processed without a control socket.
 *
 * On failure everything registered so far is undone in reverse order.
 *
 * Returns 0 on success or the error of the step that failed.
 */
static int __init dccp_v6_init(void)
{
	int err = proto_register(&dccp_v6_prot, 1);

	if (err != 0)
		goto out;

	inet6_register_protosw(&dccp_v6_protosw);

	/* Creates the per-net control sockets. */
	err = register_pernet_subsys(&dccp_v6_ops);
	if (err != 0)
		goto out_unregister_protosw;

	/* From here on packets can reach dccp_v6_rcv()/dccp_v6_err(). */
	err = inet6_add_protocol(&dccp_v6_protocol, IPPROTO_DCCP);
	if (err != 0)
		goto out_unregister_pernet;
out:
	return err;

out_unregister_pernet:
	unregister_pernet_subsys(&dccp_v6_ops);
out_unregister_protosw:
	inet6_unregister_protosw(&dccp_v6_protosw);
	proto_unregister(&dccp_v6_prot);
	goto out;
}

/*
 * Module teardown.
 *
 * The receive handler is removed first so that no packet can reach
 * dccp_v6_rcv() / dccp_v6_ctl_send_reset() after the per-net control
 * sockets (net->dccp.v6_ctl_sk) have been destroyed by
 * unregister_pernet_subsys().
 */
static void __exit dccp_v6_exit(void)
{
	inet6_del_protocol(&dccp_v6_protocol, IPPROTO_DCCP);
	unregister_pernet_subsys(&dccp_v6_ops);
	inet6_unregister_protosw(&dccp_v6_protosw);
	proto_unregister(&dccp_v6_prot);
}

module_init(dccp_v6_init);
module_exit(dccp_v6_exit);

/*
 * __stringify does not cope with enums, so the numeric values of
 * SOCK_DCCP (6) and IPPROTO_DCCP (33) are used directly.  The second alias
 * covers the case where the protocol is not specified,
 * i.e. net-pf-PF_INET6-proto-0-type-SOCK_DCCP
 */
MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_INET6, 33, 6);
MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_INET6, 0, 6);

MODULE_LICENSE("GPL");
MODULE_AUTHOR("Arnaldo Carvalho de Melo <acme@mandriva.com>");
MODULE_DESCRIPTION("DCCPv6 - Datagram Congestion Controlled Protocol");