/*
 *	Extension Header handling for IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *	Andi Kleen		<ak@muc.de>
 *	Alexey Kuznetsov	<kuznet@ms2.inr.ac.ru>
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */

/* Changes:
 *	yoshfuji		: ensure not to overrun while parsing
 *				  tlv options.
 *	Mitsuru KANDA @USAGI and: Remove ipv6_parse_exthdrs().
 *	YOSHIFUJI Hideaki @USAGI  Register inbound extension header
 *				  handlers as inet6_protocol{}.
 */

#include <linux/errno.h>
#include <linux/types.h>
#include <linux/socket.h>
#include <linux/sockios.h>
#include <linux/net.h>
#include <linux/netdevice.h>
#include <linux/in6.h>
#include <linux/icmpv6.h>
32
#include <linux/slab.h>
33
#include <linux/export.h>
L
Linus Torvalds 已提交
34

35
#include <net/dst.h>
L
Linus Torvalds 已提交
36 37 38 39 40 41 42 43 44 45
#include <net/sock.h>
#include <net/snmp.h>

#include <net/ipv6.h>
#include <net/protocol.h>
#include <net/transp_v6.h>
#include <net/rawv6.h>
#include <net/ndisc.h>
#include <net/ip6_route.h>
#include <net/addrconf.h>
A
Amerigo Wang 已提交
46
#if IS_ENABLED(CONFIG_IPV6_MIP6)
47 48
#include <net/xfrm.h>
#endif
L
Linus Torvalds 已提交
49 50 51 52 53 54

#include <asm/uaccess.h>

/*
 *	Parsing tlv encoded headers.
 *
55 56
 *	Parsing function "func" returns true, if parsing succeed
 *	and false, if it failed.
L
Linus Torvalds 已提交
57 58 59 60 61
 *	It MUST NOT touch skb->h.
 */

struct tlvtype_proc {
	int	type;
62
	bool	(*func)(struct sk_buff *skb, int offset);
L
Linus Torvalds 已提交
63 64 65 66 67 68 69 70
};

/*********************
  Generic functions
 *********************/

/* An unknown option is detected, decide what to do */

71
static bool ip6_tlvopt_unknown(struct sk_buff *skb, int optoff)
L
Linus Torvalds 已提交
72
{
73
	switch ((skb_network_header(skb)[optoff] & 0xC0) >> 6) {
L
Linus Torvalds 已提交
74
	case 0: /* ignore */
75
		return true;
L
Linus Torvalds 已提交
76 77 78 79 80 81 82 83

	case 1: /* drop packet */
		break;

	case 3: /* Send ICMP if not a multicast address and drop packet */
		/* Actually, it is redundant check. icmp_send
		   will recheck in any case.
		 */
84
		if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr))
L
Linus Torvalds 已提交
85 86 87
			break;
	case 2: /* send ICMP PARM PROB regardless and drop packet */
		icmpv6_param_prob(skb, ICMPV6_UNK_OPTION, optoff);
88
		return false;
89
	}
L
Linus Torvalds 已提交
90 91

	kfree_skb(skb);
92
	return false;
L
Linus Torvalds 已提交
93 94 95 96
}

/* Parse tlv encoded option header (hop-by-hop or destination) */

97
static bool ip6_parse_tlv(const struct tlvtype_proc *procs, struct sk_buff *skb)
L
Linus Torvalds 已提交
98
{
99
	const struct tlvtype_proc *curr;
100
	const unsigned char *nh = skb_network_header(skb);
101
	int off = skb_network_header_len(skb);
102
	int len = (skb_transport_header(skb)[1] + 1) << 3;
103
	int padlen = 0;
L
Linus Torvalds 已提交
104

105
	if (skb_transport_offset(skb) + len > skb_headlen(skb))
L
Linus Torvalds 已提交
106 107 108 109 110 111
		goto bad;

	off += 2;
	len -= 2;

	while (len > 0) {
112
		int optlen = nh[off + 1] + 2;
113
		int i;
L
Linus Torvalds 已提交
114

115
		switch (nh[off]) {
116
		case IPV6_TLV_PAD1:
L
Linus Torvalds 已提交
117
			optlen = 1;
118 119 120
			padlen++;
			if (padlen > 7)
				goto bad;
L
Linus Torvalds 已提交
121 122 123
			break;

		case IPV6_TLV_PADN:
124 125 126 127 128
			/* RFC 2460 states that the purpose of PadN is
			 * to align the containing header to multiples
			 * of 8. 7 is therefore the highest valid value.
			 * See also RFC 4942, Section 2.1.9.5.
			 */
129 130
			padlen += optlen;
			if (padlen > 7)
131 132 133 134 135 136 137 138 139
				goto bad;
			/* RFC 4942 recommends receiving hosts to
			 * actively check PadN payload to contain
			 * only zeroes.
			 */
			for (i = 2; i < optlen; i++) {
				if (nh[off + i] != 0)
					goto bad;
			}
L
Linus Torvalds 已提交
140 141 142 143 144 145
			break;

		default: /* Other TLV code so scan list */
			if (optlen > len)
				goto bad;
			for (curr=procs; curr->type >= 0; curr++) {
146
				if (curr->type == nh[off]) {
147 148
					/* type specific length/alignment
					   checks will be performed in the
L
Linus Torvalds 已提交
149
					   func(). */
150 151
					if (curr->func(skb, off) == false)
						return false;
L
Linus Torvalds 已提交
152 153 154 155
					break;
				}
			}
			if (curr->type < 0) {
156
				if (ip6_tlvopt_unknown(skb, off) == 0)
157
					return false;
L
Linus Torvalds 已提交
158
			}
159
			padlen = 0;
L
Linus Torvalds 已提交
160 161 162 163 164
			break;
		}
		off += optlen;
		len -= optlen;
	}
165 166 167 168 169 170 171
	/* This case will not be caught by above check since its padding
	 * length is smaller than 7:
	 * 1 byte NH + 1 byte Length + 6 bytes Padding
	 */
	if ((padlen == 6) && ((off - skb_network_header_len(skb)) == 8))
		goto bad;

L
Linus Torvalds 已提交
172
	if (len == 0)
173
		return true;
L
Linus Torvalds 已提交
174 175
bad:
	kfree_skb(skb);
176
	return false;
L
Linus Torvalds 已提交
177 178 179 180 181 182
}

/*****************************
  Destination options header.
 *****************************/

#if IS_ENABLED(CONFIG_IPV6_MIP6)
/*
 * Handle the Home Address destination option found at @optoff (offset from
 * the network header).
 *
 * On success the IPv6 source address and the address stored in the option
 * are swapped in place and true is returned.  On any failure the skb is
 * freed and false is returned.
 */
static bool ipv6_dest_hao(struct sk_buff *skb, int optoff)
{
	struct ipv6_destopt_hao *hao;
	struct inet6_skb_parm *opt = IP6CB(skb);
	struct ipv6hdr *ipv6h = ipv6_hdr(skb);
	struct in6_addr tmp_addr;
	int ret;

	/* Only one HAO is accepted per packet. */
	if (opt->dsthao) {
		LIMIT_NETDEBUG(KERN_DEBUG "hao duplicated\n");
		goto discard;
	}
	/* Move the recorded destination-options offset into dsthao. */
	opt->dsthao = opt->dst1;
	opt->dst1 = 0;

	hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) + optoff);

	if (hao->length != 16) {
		LIMIT_NETDEBUG(
			KERN_DEBUG "hao invalid option length = %d\n", hao->length);
		goto discard;
	}

	if (!(ipv6_addr_type(&hao->addr) & IPV6_ADDR_UNICAST)) {
		LIMIT_NETDEBUG(
			KERN_DEBUG "hao is not an unicast addr: %pI6\n", &hao->addr);
		goto discard;
	}

	ret = xfrm6_input_addr(skb, (xfrm_address_t *)&ipv6h->daddr,
			       (xfrm_address_t *)&hao->addr, IPPROTO_DSTOPTS);
	if (unlikely(ret < 0))
		goto discard;

	/* The header is about to be modified: get a private copy first. */
	if (skb_cloned(skb)) {
		if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC))
			goto discard;

		/* update all variable using below by copied skbuff */
		hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) +
						  optoff);
		ipv6h = ipv6_hdr(skb);
	}

	if (skb->ip_summed == CHECKSUM_COMPLETE)
		skb->ip_summed = CHECKSUM_NONE;

	/* Swap the source address with the home address from the option. */
	tmp_addr = ipv6h->saddr;
	ipv6h->saddr = hao->addr;
	hao->addr = tmp_addr;

	if (skb->tstamp.tv64 == 0)
		__net_timestamp(skb);

	return true;

 discard:
	kfree_skb(skb);
	return false;
}
#endif

246
static const struct tlvtype_proc tlvprocdestopt_lst[] = {
A
Amerigo Wang 已提交
247
#if IS_ENABLED(CONFIG_IPV6_MIP6)
248 249 250 251 252
	{
		.type	= IPV6_TLV_HAO,
		.func	= ipv6_dest_hao,
	},
#endif
L
Linus Torvalds 已提交
253 254 255
	{-1,			NULL}
};

256
static int ipv6_destopt_rcv(struct sk_buff *skb)
L
Linus Torvalds 已提交
257 258
{
	struct inet6_skb_parm *opt = IP6CB(skb);
A
Amerigo Wang 已提交
259
#if IS_ENABLED(CONFIG_IPV6_MIP6)
260 261
	__u16 dstbuf;
#endif
262
	struct dst_entry *dst = skb_dst(skb);
L
Linus Torvalds 已提交
263

264 265
	if (!pskb_may_pull(skb, skb_transport_offset(skb) + 8) ||
	    !pskb_may_pull(skb, (skb_transport_offset(skb) +
266
				 ((skb_transport_header(skb)[1] + 1) << 3)))) {
267
		IP6_INC_STATS_BH(dev_net(dst->dev), ip6_dst_idev(dst),
268
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
269 270 271 272
		kfree_skb(skb);
		return -1;
	}

273
	opt->lastopt = opt->dst1 = skb_network_header_len(skb);
A
Amerigo Wang 已提交
274
#if IS_ENABLED(CONFIG_IPV6_MIP6)
275 276
	dstbuf = opt->dst1;
#endif
L
Linus Torvalds 已提交
277

278
	if (ip6_parse_tlv(tlvprocdestopt_lst, skb)) {
279
		skb->transport_header += (skb_transport_header(skb)[1] + 1) << 3;
280
		opt = IP6CB(skb);
A
Amerigo Wang 已提交
281
#if IS_ENABLED(CONFIG_IPV6_MIP6)
282 283
		opt->nhoff = dstbuf;
#else
284
		opt->nhoff = opt->dst1;
285
#endif
L
Linus Torvalds 已提交
286 287 288
		return 1;
	}

289 290
	IP6_INC_STATS_BH(dev_net(dst->dev),
			 ip6_dst_idev(dst), IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
291 292 293 294 295 296 297
	return -1;
}

/********************************
  Routing header.
 ********************************/

298
/* called with rcu_read_lock() */
299
static int ipv6_rthdr_rcv(struct sk_buff *skb)
L
Linus Torvalds 已提交
300 301
{
	struct inet6_skb_parm *opt = IP6CB(skb);
302
	struct in6_addr *addr = NULL;
L
Linus Torvalds 已提交
303
	struct in6_addr daddr;
304
	struct inet6_dev *idev;
L
Linus Torvalds 已提交
305 306 307
	int n, i;
	struct ipv6_rt_hdr *hdr;
	struct rt0_hdr *rthdr;
308 309
	struct net *net = dev_net(skb->dev);
	int accept_source_route = net->ipv6.devconf_all->accept_source_route;
310

311 312 313
	idev = __in6_dev_get(skb->dev);
	if (idev && accept_source_route > idev->cnf.accept_source_route)
		accept_source_route = idev->cnf.accept_source_route;
314

315 316
	if (!pskb_may_pull(skb, skb_transport_offset(skb) + 8) ||
	    !pskb_may_pull(skb, (skb_transport_offset(skb) +
317
				 ((skb_transport_header(skb)[1] + 1) << 3)))) {
E
Eric Dumazet 已提交
318
		IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
319
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
320 321 322 323
		kfree_skb(skb);
		return -1;
	}

324
	hdr = (struct ipv6_rt_hdr *)skb_transport_header(skb);
L
Linus Torvalds 已提交
325

326
	if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr) ||
L
Linus Torvalds 已提交
327
	    skb->pkt_type != PACKET_HOST) {
E
Eric Dumazet 已提交
328
		IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
329
				 IPSTATS_MIB_INADDRERRORS);
L
Linus Torvalds 已提交
330 331 332 333 334 335
		kfree_skb(skb);
		return -1;
	}

looped_back:
	if (hdr->segments_left == 0) {
336
		switch (hdr->type) {
A
Amerigo Wang 已提交
337
#if IS_ENABLED(CONFIG_IPV6_MIP6)
338 339 340 341 342
		case IPV6_SRCRT_TYPE_2:
			/* Silently discard type 2 header unless it was
			 * processed by own
			 */
			if (!addr) {
E
Eric Dumazet 已提交
343
				IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
344
						 IPSTATS_MIB_INADDRERRORS);
345 346 347 348 349 350 351 352 353
				kfree_skb(skb);
				return -1;
			}
			break;
#endif
		default:
			break;
		}

354
		opt->lastopt = opt->srcrt = skb_network_header_len(skb);
355
		skb->transport_header += (hdr->hdrlen + 1) << 3;
L
Linus Torvalds 已提交
356 357
		opt->dst0 = opt->dst1;
		opt->dst1 = 0;
358
		opt->nhoff = (&hdr->nexthdr) - skb_network_header(skb);
L
Linus Torvalds 已提交
359 360 361
		return 1;
	}

362
	switch (hdr->type) {
A
Amerigo Wang 已提交
363
#if IS_ENABLED(CONFIG_IPV6_MIP6)
364
	case IPV6_SRCRT_TYPE_2:
365 366
		if (accept_source_route < 0)
			goto unknown_rh;
367 368
		/* Silently discard invalid RTH type 2 */
		if (hdr->hdrlen != 2 || hdr->segments_left != 1) {
E
Eric Dumazet 已提交
369
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
370
					 IPSTATS_MIB_INHDRERRORS);
371 372 373 374 375
			kfree_skb(skb);
			return -1;
		}
		break;
#endif
376 377
	default:
		goto unknown_rh;
L
Linus Torvalds 已提交
378 379 380 381 382 383 384 385 386 387
	}

	/*
	 *	This is the routing header forwarding algorithm from
	 *	RFC 2460, page 16.
	 */

	n = hdr->hdrlen >> 1;

	if (hdr->segments_left > n) {
E
Eric Dumazet 已提交
388
		IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
389
				 IPSTATS_MIB_INHDRERRORS);
390 391 392
		icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
				  ((&hdr->segments_left) -
				   skb_network_header(skb)));
L
Linus Torvalds 已提交
393 394 395 396 397 398 399 400
		return -1;
	}

	/* We are about to mangle packet header. Be careful!
	   Do not damage packets queued somewhere.
	 */
	if (skb_cloned(skb)) {
		/* the copy is a forwarded packet */
401
		if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC)) {
E
Eric Dumazet 已提交
402
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
403 404
					 IPSTATS_MIB_OUTDISCARDS);
			kfree_skb(skb);
L
Linus Torvalds 已提交
405 406
			return -1;
		}
407
		hdr = (struct ipv6_rt_hdr *)skb_transport_header(skb);
L
Linus Torvalds 已提交
408 409
	}

410
	if (skb->ip_summed == CHECKSUM_COMPLETE)
L
Linus Torvalds 已提交
411 412 413 414 415 416 417 418
		skb->ip_summed = CHECKSUM_NONE;

	i = n - --hdr->segments_left;

	rthdr = (struct rt0_hdr *) hdr;
	addr = rthdr->addr;
	addr += i - 1;

419
	switch (hdr->type) {
A
Amerigo Wang 已提交
420
#if IS_ENABLED(CONFIG_IPV6_MIP6)
421 422
	case IPV6_SRCRT_TYPE_2:
		if (xfrm6_input_addr(skb, (xfrm_address_t *)addr,
423
				     (xfrm_address_t *)&ipv6_hdr(skb)->saddr,
424
				     IPPROTO_ROUTING) < 0) {
E
Eric Dumazet 已提交
425
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
426
					 IPSTATS_MIB_INADDRERRORS);
427 428 429
			kfree_skb(skb);
			return -1;
		}
E
Eric Dumazet 已提交
430 431
		if (!ipv6_chk_home_addr(dev_net(skb_dst(skb)->dev), addr)) {
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
432
					 IPSTATS_MIB_INADDRERRORS);
433 434 435 436 437 438 439 440 441
			kfree_skb(skb);
			return -1;
		}
		break;
#endif
	default:
		break;
	}

L
Linus Torvalds 已提交
442
	if (ipv6_addr_is_multicast(addr)) {
E
Eric Dumazet 已提交
443
		IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
444
				 IPSTATS_MIB_INADDRERRORS);
L
Linus Torvalds 已提交
445 446 447 448
		kfree_skb(skb);
		return -1;
	}

A
Alexey Dobriyan 已提交
449 450 451
	daddr = *addr;
	*addr = ipv6_hdr(skb)->daddr;
	ipv6_hdr(skb)->daddr = daddr;
L
Linus Torvalds 已提交
452

E
Eric Dumazet 已提交
453
	skb_dst_drop(skb);
L
Linus Torvalds 已提交
454
	ip6_route_input(skb);
E
Eric Dumazet 已提交
455
	if (skb_dst(skb)->error) {
456
		skb_push(skb, skb->data - skb_network_header(skb));
L
Linus Torvalds 已提交
457 458 459 460
		dst_input(skb);
		return -1;
	}

E
Eric Dumazet 已提交
461
	if (skb_dst(skb)->dev->flags&IFF_LOOPBACK) {
462
		if (ipv6_hdr(skb)->hop_limit <= 1) {
E
Eric Dumazet 已提交
463
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
464
					 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
465
			icmpv6_send(skb, ICMPV6_TIME_EXCEED, ICMPV6_EXC_HOPLIMIT,
466
				    0);
L
Linus Torvalds 已提交
467 468 469
			kfree_skb(skb);
			return -1;
		}
470
		ipv6_hdr(skb)->hop_limit--;
L
Linus Torvalds 已提交
471 472 473
		goto looped_back;
	}

474
	skb_push(skb, skb->data - skb_network_header(skb));
L
Linus Torvalds 已提交
475 476
	dst_input(skb);
	return -1;
477 478

unknown_rh:
E
Eric Dumazet 已提交
479
	IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)), IPSTATS_MIB_INHDRERRORS);
480 481 482
	icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
			  (&hdr->type) - skb_network_header(skb));
	return -1;
L
Linus Torvalds 已提交
483 484
}

485
static const struct inet6_protocol rthdr_protocol = {
L
Linus Torvalds 已提交
486
	.handler	=	ipv6_rthdr_rcv,
487
	.flags		=	INET6_PROTO_NOPOLICY,
488 489
};

490
static const struct inet6_protocol destopt_protocol = {
491
	.handler	=	ipv6_destopt_rcv,
492
	.flags		=	INET6_PROTO_NOPOLICY,
493 494
};

495
static const struct inet6_protocol nodata_protocol = {
496 497 498 499 500
	.handler	=	dst_discard,
	.flags		=	INET6_PROTO_NOPOLICY,
};

/*
 * Register the routing, destination-options and no-next-header handlers.
 *
 * Returns 0 on success or the error from inet6_add_protocol(); on failure
 * every handler registered so far is unregistered again.
 */
int __init ipv6_exthdrs_init(void)
{
	int ret;

	ret = inet6_add_protocol(&rthdr_protocol, IPPROTO_ROUTING);
	if (ret)
		return ret;

	ret = inet6_add_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
	if (ret)
		goto out_rthdr;

	ret = inet6_add_protocol(&nodata_protocol, IPPROTO_NONE);
	if (ret)
		goto out_destopt;

	return 0;

out_destopt:
	inet6_del_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
out_rthdr:
	inet6_del_protocol(&rthdr_protocol, IPPROTO_ROUTING);
	return ret;
}

525 526 527 528 529 530 531
/*
 * Unregister the handlers added by ipv6_exthdrs_init(), in the reverse
 * order of their registration.
 */
void ipv6_exthdrs_exit(void)
{
	inet6_del_protocol(&nodata_protocol, IPPROTO_NONE);
	inet6_del_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
	inet6_del_protocol(&rthdr_protocol, IPPROTO_ROUTING);
}

L
Linus Torvalds 已提交
532 533 534 535
/**********************************
  Hop-by-hop options.
 **********************************/

536
/*
E
Eric Dumazet 已提交
537
 * Note: we cannot rely on skb_dst(skb) before we assign it in ip6_route_input().
538 539 540
 */
static inline struct inet6_dev *ipv6_skb_idev(struct sk_buff *skb)
{
E
Eric Dumazet 已提交
541
	return skb_dst(skb) ? ip6_dst_idev(skb_dst(skb)) : __in6_dev_get(skb->dev);
542 543
}

544 545 546 547 548
/*
 * Return the network namespace for @skb: taken from the dst's device when
 * a dst is attached, otherwise from skb->dev.
 */
static inline struct net *ipv6_skb_net(struct sk_buff *skb)
{
	if (skb_dst(skb))
		return dev_net(skb_dst(skb)->dev);

	return dev_net(skb->dev);
}

L
Linus Torvalds 已提交
549 550
/* Router Alert as of RFC 2711 */

551
static bool ipv6_hop_ra(struct sk_buff *skb, int optoff)
L
Linus Torvalds 已提交
552
{
553
	const unsigned char *nh = skb_network_header(skb);
554

555
	if (nh[optoff + 1] == 2) {
L
Linus Torvalds 已提交
556
		IP6CB(skb)->ra = optoff;
557
		return true;
L
Linus Torvalds 已提交
558
	}
559
	LIMIT_NETDEBUG(KERN_DEBUG "ipv6_hop_ra: wrong RA length %d\n",
560
		       nh[optoff + 1]);
L
Linus Torvalds 已提交
561
	kfree_skb(skb);
562
	return false;
L
Linus Torvalds 已提交
563 564 565 566
}

/* Jumbo payload */

567
static bool ipv6_hop_jumbo(struct sk_buff *skb, int optoff)
L
Linus Torvalds 已提交
568
{
569
	const unsigned char *nh = skb_network_header(skb);
570
	struct net *net = ipv6_skb_net(skb);
L
Linus Torvalds 已提交
571 572
	u32 pkt_len;

573
	if (nh[optoff + 1] != 4 || (optoff & 3) != 2) {
574
		LIMIT_NETDEBUG(KERN_DEBUG "ipv6_hop_jumbo: wrong jumbo opt length/alignment %d\n",
575
			       nh[optoff+1]);
576
		IP6_INC_STATS_BH(net, ipv6_skb_idev(skb),
577
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
578 579 580
		goto drop;
	}

581
	pkt_len = ntohl(*(__be32 *)(nh + optoff + 2));
L
Linus Torvalds 已提交
582
	if (pkt_len <= IPV6_MAXPLEN) {
583 584
		IP6_INC_STATS_BH(net, ipv6_skb_idev(skb),
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
585
		icmpv6_param_prob(skb, ICMPV6_HDR_FIELD, optoff+2);
586
		return false;
L
Linus Torvalds 已提交
587
	}
588
	if (ipv6_hdr(skb)->payload_len) {
589 590
		IP6_INC_STATS_BH(net, ipv6_skb_idev(skb),
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
591
		icmpv6_param_prob(skb, ICMPV6_HDR_FIELD, optoff);
592
		return false;
L
Linus Torvalds 已提交
593 594 595
	}

	if (pkt_len > skb->len - sizeof(struct ipv6hdr)) {
596 597
		IP6_INC_STATS_BH(net, ipv6_skb_idev(skb),
				 IPSTATS_MIB_INTRUNCATEDPKTS);
L
Linus Torvalds 已提交
598 599
		goto drop;
	}
600 601 602 603

	if (pskb_trim_rcsum(skb, pkt_len + sizeof(struct ipv6hdr)))
		goto drop;

604
	return true;
L
Linus Torvalds 已提交
605 606 607

drop:
	kfree_skb(skb);
608
	return false;
L
Linus Torvalds 已提交
609 610
}

611
static const struct tlvtype_proc tlvprochopopt_lst[] = {
L
Linus Torvalds 已提交
612 613 614 615 616 617 618 619 620 621 622
	{
		.type	= IPV6_TLV_ROUTERALERT,
		.func	= ipv6_hop_ra,
	},
	{
		.type	= IPV6_TLV_JUMBO,
		.func	= ipv6_hop_jumbo,
	},
	{ -1, }
};

623
int ipv6_parse_hopopts(struct sk_buff *skb)
L
Linus Torvalds 已提交
624
{
625 626
	struct inet6_skb_parm *opt = IP6CB(skb);

627
	/*
628
	 * skb_network_header(skb) is equal to skb->data, and
629
	 * skb_network_header_len(skb) is always equal to
630 631 632 633
	 * sizeof(struct ipv6hdr) by definition of
	 * hop-by-hop options.
	 */
	if (!pskb_may_pull(skb, sizeof(struct ipv6hdr) + 8) ||
634 635
	    !pskb_may_pull(skb, (sizeof(struct ipv6hdr) +
				 ((skb_transport_header(skb)[1] + 1) << 3)))) {
636 637 638 639
		kfree_skb(skb);
		return -1;
	}

640
	opt->hop = sizeof(struct ipv6hdr);
641
	if (ip6_parse_tlv(tlvprochopopt_lst, skb)) {
642
		skb->transport_header += (skb_transport_header(skb)[1] + 1) << 3;
643
		opt = IP6CB(skb);
644
		opt->nhoff = sizeof(struct ipv6hdr);
645
		return 1;
646
	}
L
Linus Torvalds 已提交
647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667
	return -1;
}

/*
 *	Creating outbound headers.
 *
 *	"build" functions work when skb is filled from head to tail (datagram)
 *	"push"	functions work when headers are added from tail to head (tcp)
 *
 *	In both cases we assume, that caller reserved enough room
 *	for headers.
 */

/*
 * Prepend the routing header @opt to @skb.
 *
 * The address list is shifted by one on the way: entries 1..hops-1 of the
 * template become entries 0..hops-2 of the pushed header, and the last
 * entry is set to the address *@addr_p points to on entry.  On return
 * *@addr_p points at the first address of the template and *@proto is
 * NEXTHDR_ROUTING; the previous *@proto is stored as the pushed header's
 * next-header value.
 */
static void ipv6_push_rthdr(struct sk_buff *skb, u8 *proto,
			    struct ipv6_rt_hdr *opt,
			    struct in6_addr **addr_p)
{
	struct rt0_hdr *phdr, *ihdr;
	int hops;

	ihdr = (struct rt0_hdr *) opt;

	phdr = (struct rt0_hdr *) skb_push(skb, (ihdr->rt_hdr.hdrlen + 1) << 3);
	memcpy(phdr, ihdr, sizeof(struct rt0_hdr));

	/* NOTE(review): assumes hdrlen >= 2 so that hops >= 1; confirm that
	 * callers validate the template before it gets here.
	 */
	hops = ihdr->rt_hdr.hdrlen >> 1;

	if (hops > 1)
		memcpy(phdr->addr, ihdr->addr + 1,
		       (hops - 1) * sizeof(struct in6_addr));

	phdr->addr[hops - 1] = **addr_p;
	*addr_p = ihdr->addr;

	phdr->rt_hdr.nexthdr = *proto;
	*proto = NEXTHDR_ROUTING;
}

/*
 * Prepend a copy of the option header @opt to @skb.  The copy's next-header
 * field takes the current *@proto, and *@proto becomes @type.
 */
static void ipv6_push_exthdr(struct sk_buff *skb, u8 *proto, u8 type, struct ipv6_opt_hdr *opt)
{
	struct ipv6_opt_hdr *pushed;

	pushed = (struct ipv6_opt_hdr *)skb_push(skb, ipv6_optlen(opt));
	memcpy(pushed, opt, ipv6_optlen(opt));

	/* Chain the new header in front of whatever was outermost so far. */
	pushed->nexthdr = *proto;
	*proto = type;
}

/*
 * Push the extension headers selected in @opt that this file groups as
 * "nfrag": routing header, the destination options tied to it, and the
 * hop-by-hop options.  *@proto and *@daddr are updated by the helpers as
 * each header is pushed.
 */
void ipv6_push_nfrag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt,
			  u8 *proto,
			  struct in6_addr **daddr)
{
	if (opt->srcrt) {
		ipv6_push_rthdr(skb, proto, opt->srcrt, daddr);
		/*
		 * IPV6_RTHDRDSTOPTS is ignored
		 * unless IPV6_RTHDR is set (RFC3542).
		 */
		if (opt->dst0opt)
			ipv6_push_exthdr(skb, proto, NEXTHDR_DEST, opt->dst0opt);
	}
	if (opt->hopopt)
		ipv6_push_exthdr(skb, proto, NEXTHDR_HOP, opt->hopopt);
}
EXPORT_SYMBOL(ipv6_push_nfrag_opts);

L
Linus Torvalds 已提交
712 713 714 715 716 717 718 719 720 721 722 723 724
/*
 * Push the second destination options header (dst1opt) from @opt onto
 * @skb, if one is set; *@proto is updated to NEXTHDR_DEST in that case.
 */
void ipv6_push_frag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt, u8 *proto)
{
	if (!opt->dst1opt)
		return;

	ipv6_push_exthdr(skb, proto, NEXTHDR_DEST, opt->dst1opt);
}

/*
 * Duplicate @opt into memory charged to @sk.
 *
 * The whole opt->tot_len bytes are copied and every non-NULL header
 * pointer is shifted by the distance between the two allocations.
 * NOTE(review): this presumes the headers live inside the same
 * tot_len-sized allocation as @opt itself; confirm against the code that
 * builds the options.
 *
 * Returns the copy, or NULL if the allocation failed.
 */
struct ipv6_txoptions *
ipv6_dup_options(struct sock *sk, struct ipv6_txoptions *opt)
{
	struct ipv6_txoptions *opt2;

	opt2 = sock_kmalloc(sk, opt->tot_len, GFP_ATOMIC);
	if (opt2) {
		long dif = (char *)opt2 - (char *)opt;

		memcpy(opt2, opt, opt->tot_len);
		/* Re-point each header at its copy inside opt2. */
		if (opt2->hopopt)
			opt2->hopopt = (void *)((char *)opt2->hopopt + dif);
		if (opt2->dst0opt)
			opt2->dst0opt = (void *)((char *)opt2->dst0opt + dif);
		if (opt2->dst1opt)
			opt2->dst1opt = (void *)((char *)opt2->dst1opt + dif);
		if (opt2->srcrt)
			opt2->srcrt = (void *)((char *)opt2->srcrt + dif);
	}
	return opt2;
}
EXPORT_SYMBOL_GPL(ipv6_dup_options);

740 741 742 743 744 745 746 747 748 749
/*
 * Fill one header slot of a new options block.
 *
 * @ohdr:      the existing header for this slot, or NULL.
 * @newopt:    user pointer to the replacement header, or NULL.
 * @newoptlen: number of bytes to copy from @newopt.
 * @inherit:   non-zero to carry @ohdr over, zero to take @newopt instead.
 * @hdr:       set to the header's location inside the new block.
 * @p:         write cursor into the new block; advanced past what was
 *             written, rounded up with CMSG_ALIGN().
 *
 * Returns 0 on success (including when there was nothing to write),
 * -EFAULT if the user copy failed, or -EINVAL if the header is truncated
 * or claims to be longer than @newoptlen.
 */
static int ipv6_renew_option(void *ohdr,
			     struct ipv6_opt_hdr __user *newopt, int newoptlen,
			     int inherit,
			     struct ipv6_opt_hdr **hdr,
			     char **p)
{
	if (inherit) {
		if (ohdr) {
			memcpy(*p, ohdr, ipv6_optlen((struct ipv6_opt_hdr *)ohdr));
			*hdr = (struct ipv6_opt_hdr *)*p;
			*p += CMSG_ALIGN(ipv6_optlen(*hdr));
		}
	} else {
		if (newopt) {
			if (copy_from_user(*p, newopt, newoptlen))
				return -EFAULT;
			/* The length byte must have been copied before it is
			 * read; with newoptlen == 0 the caller reserved no
			 * room for this option at all.
			 */
			if (newoptlen < (int)sizeof(struct ipv6_opt_hdr))
				return -EINVAL;
			*hdr = (struct ipv6_opt_hdr *)*p;
			if (ipv6_optlen(*hdr) > newoptlen)
				return -EINVAL;
			*p += CMSG_ALIGN(newoptlen);
		}
	}
	return 0;
}

/*
 * Build a new options block from @opt with the header selected by
 * @newtype replaced by the user-supplied @newopt (@newoptlen bytes).
 * All other headers present in @opt are carried over.
 *
 * Returns the new block (allocated with sock_kmalloc() against @sk),
 * NULL if the result would contain no headers at all, or an ERR_PTR():
 * -ENOBUFS on allocation failure, otherwise the error returned by
 * ipv6_renew_option().
 */
struct ipv6_txoptions *
ipv6_renew_options(struct sock *sk, struct ipv6_txoptions *opt,
		   int newtype,
		   struct ipv6_opt_hdr __user *newopt, int newoptlen)
{
	int tot_len = 0;
	char *p;
	struct ipv6_txoptions *opt2;
	int err;

	/* Space for every inherited header (all but the one replaced). */
	if (opt) {
		if (newtype != IPV6_HOPOPTS && opt->hopopt)
			tot_len += CMSG_ALIGN(ipv6_optlen(opt->hopopt));
		if (newtype != IPV6_RTHDRDSTOPTS && opt->dst0opt)
			tot_len += CMSG_ALIGN(ipv6_optlen(opt->dst0opt));
		if (newtype != IPV6_RTHDR && opt->srcrt)
			tot_len += CMSG_ALIGN(ipv6_optlen(opt->srcrt));
		if (newtype != IPV6_DSTOPTS && opt->dst1opt)
			tot_len += CMSG_ALIGN(ipv6_optlen(opt->dst1opt));
	}

	if (newopt && newoptlen)
		tot_len += CMSG_ALIGN(newoptlen);

	if (!tot_len)
		return NULL;

	tot_len += sizeof(*opt2);
	opt2 = sock_kmalloc(sk, tot_len, GFP_ATOMIC);
	if (!opt2)
		return ERR_PTR(-ENOBUFS);

	memset(opt2, 0, tot_len);

	opt2->tot_len = tot_len;
	/* Headers are packed directly behind the struct. */
	p = (char *)(opt2 + 1);

	err = ipv6_renew_option(opt ? opt->hopopt : NULL, newopt, newoptlen,
				newtype != IPV6_HOPOPTS,
				&opt2->hopopt, &p);
	if (err)
		goto out;

	err = ipv6_renew_option(opt ? opt->dst0opt : NULL, newopt, newoptlen,
				newtype != IPV6_RTHDRDSTOPTS,
				&opt2->dst0opt, &p);
	if (err)
		goto out;

	err = ipv6_renew_option(opt ? opt->srcrt : NULL, newopt, newoptlen,
				newtype != IPV6_RTHDR,
				(struct ipv6_opt_hdr **)&opt2->srcrt, &p);
	if (err)
		goto out;

	err = ipv6_renew_option(opt ? opt->dst1opt : NULL, newopt, newoptlen,
				newtype != IPV6_DSTOPTS,
				&opt2->dst1opt, &p);
	if (err)
		goto out;

	opt2->opt_nflen = (opt2->hopopt ? ipv6_optlen(opt2->hopopt) : 0) +
			  (opt2->dst0opt ? ipv6_optlen(opt2->dst0opt) : 0) +
			  (opt2->srcrt ? ipv6_optlen(opt2->srcrt) : 0);
	opt2->opt_flen = (opt2->dst1opt ? ipv6_optlen(opt2->dst1opt) : 0);

	return opt2;
out:
	sock_kfree_s(sk, opt2, opt2->tot_len);
	return ERR_PTR(err);
}

837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854
/*
 * Return the options to use for transmission.  If @opt carries dst0opt
 * without a routing header, dst0opt is dropped; when @opt is not already
 * @opt_space, the change is made on a copy placed in @opt_space.  In every
 * other case @opt is returned untouched (it may be NULL).
 */
struct ipv6_txoptions *ipv6_fixup_options(struct ipv6_txoptions *opt_space,
					  struct ipv6_txoptions *opt)
{
	/* Nothing to fix unless dst0opt is present without srcrt. */
	if (!opt || !opt->dst0opt || opt->srcrt)
		return opt;

	/*
	 * ignore the dest before srcrt unless srcrt is being included.
	 * --yoshfuji
	 */
	if (opt_space != opt) {
		memcpy(opt_space, opt, sizeof(*opt_space));
		opt = opt_space;
	}
	opt->opt_nflen -= ipv6_optlen(opt->dst0opt);
	opt->dst0opt = NULL;

	return opt;
}
855
EXPORT_SYMBOL_GPL(ipv6_fixup_options);
856

857 858 859 860
/**
 * fl6_update_dst - update flowi destination address with info given
 *                  by srcrt option, if any.
 *
861
 * @fl6: flowi6 for which daddr is to be updated
862
 * @opt: struct ipv6_txoptions in which to look for srcrt opt
863
 * @orig: copy of original daddr address if modified
864 865
 *
 * Returns NULL if no txoptions or no srcrt, otherwise returns orig
866
 * and initial value of fl6->daddr set in orig
867
 */
868
struct in6_addr *fl6_update_dst(struct flowi6 *fl6,
869 870 871 872 873 874
				const struct ipv6_txoptions *opt,
				struct in6_addr *orig)
{
	if (!opt || !opt->srcrt)
		return NULL;

A
Alexey Dobriyan 已提交
875 876
	*orig = fl6->daddr;
	fl6->daddr = *((struct rt0_hdr *)opt->srcrt)->addr;
877 878 879
	return orig;
}
EXPORT_SYMBOL_GPL(fl6_update_dst);