exthdrs.c 20.6 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 *	Extension Header handling for IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *	Andi Kleen		<ak@muc.de>
 *	Alexey Kuznetsov	<kuznet@ms2.inr.ac.ru>
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */

/* Changes:
 *	yoshfuji		: ensure not to overrun while parsing
 *				  tlv options.
 *	Mitsuru KANDA @USAGI and: Remove ipv6_parse_exthdrs().
 *	YOSHIFUJI Hideaki @USAGI  Register inbound extension header
 *				  handlers as inet6_protocol{}.
 */

#include <linux/errno.h>
#include <linux/types.h>
#include <linux/socket.h>
#include <linux/sockios.h>
#include <linux/net.h>
#include <linux/netdevice.h>
#include <linux/in6.h>
#include <linux/icmpv6.h>
32
#include <linux/slab.h>
33
#include <linux/export.h>
L
Linus Torvalds 已提交
34

35
#include <net/dst.h>
L
Linus Torvalds 已提交
36 37 38 39 40 41 42 43 44 45
#include <net/sock.h>
#include <net/snmp.h>

#include <net/ipv6.h>
#include <net/protocol.h>
#include <net/transp_v6.h>
#include <net/rawv6.h>
#include <net/ndisc.h>
#include <net/ip6_route.h>
#include <net/addrconf.h>
A
Amerigo Wang 已提交
46
#if IS_ENABLED(CONFIG_IPV6_MIP6)
47 48
#include <net/xfrm.h>
#endif
L
Linus Torvalds 已提交
49 50 51 52 53 54

#include <asm/uaccess.h>

/*
 *	Parsing tlv encoded headers.
 *
 *	Parsing function "func" returns true if parsing succeeded
 *	and false if it failed.
 *	It MUST NOT touch skb->h.
 */

/*
 * One entry of a TLV option dispatch table.
 *
 * Tables built from this type are scanned until an entry with a
 * negative type is reached, so every table must end with such an entry.
 */
struct tlvtype_proc {
	/* Option type octet this entry handles; negative marks the end. */
	int type;
	/*
	 * Handler for the option located optoff bytes from the network
	 * header.  Returns true to continue parsing, false to stop.
	 */
	bool (*func)(struct sk_buff *skb, int optoff);
};

/*********************
  Generic functions
 *********************/

/* An unknown option is detected, decide what to do */

71
static bool ip6_tlvopt_unknown(struct sk_buff *skb, int optoff)
L
Linus Torvalds 已提交
72
{
73
	switch ((skb_network_header(skb)[optoff] & 0xC0) >> 6) {
L
Linus Torvalds 已提交
74
	case 0: /* ignore */
75
		return true;
L
Linus Torvalds 已提交
76 77 78 79 80 81 82 83

	case 1: /* drop packet */
		break;

	case 3: /* Send ICMP if not a multicast address and drop packet */
		/* Actually, it is redundant check. icmp_send
		   will recheck in any case.
		 */
84
		if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr))
L
Linus Torvalds 已提交
85 86 87
			break;
	case 2: /* send ICMP PARM PROB regardless and drop packet */
		icmpv6_param_prob(skb, ICMPV6_UNK_OPTION, optoff);
88
		return false;
89
	}
L
Linus Torvalds 已提交
90 91

	kfree_skb(skb);
92
	return false;
L
Linus Torvalds 已提交
93 94 95 96
}

/* Parse tlv encoded option header (hop-by-hop or destination) */

97
static bool ip6_parse_tlv(const struct tlvtype_proc *procs, struct sk_buff *skb)
L
Linus Torvalds 已提交
98
{
99
	const struct tlvtype_proc *curr;
100
	const unsigned char *nh = skb_network_header(skb);
101
	int off = skb_network_header_len(skb);
102
	int len = (skb_transport_header(skb)[1] + 1) << 3;
103
	int padlen = 0;
L
Linus Torvalds 已提交
104

105
	if (skb_transport_offset(skb) + len > skb_headlen(skb))
L
Linus Torvalds 已提交
106 107 108 109 110 111
		goto bad;

	off += 2;
	len -= 2;

	while (len > 0) {
112
		int optlen = nh[off + 1] + 2;
113
		int i;
L
Linus Torvalds 已提交
114

115
		switch (nh[off]) {
116
		case IPV6_TLV_PAD1:
L
Linus Torvalds 已提交
117
			optlen = 1;
118 119 120
			padlen++;
			if (padlen > 7)
				goto bad;
L
Linus Torvalds 已提交
121 122 123
			break;

		case IPV6_TLV_PADN:
124 125 126 127 128
			/* RFC 2460 states that the purpose of PadN is
			 * to align the containing header to multiples
			 * of 8. 7 is therefore the highest valid value.
			 * See also RFC 4942, Section 2.1.9.5.
			 */
129 130
			padlen += optlen;
			if (padlen > 7)
131 132 133 134 135 136 137 138 139
				goto bad;
			/* RFC 4942 recommends receiving hosts to
			 * actively check PadN payload to contain
			 * only zeroes.
			 */
			for (i = 2; i < optlen; i++) {
				if (nh[off + i] != 0)
					goto bad;
			}
L
Linus Torvalds 已提交
140 141 142 143 144
			break;

		default: /* Other TLV code so scan list */
			if (optlen > len)
				goto bad;
145
			for (curr = procs; curr->type >= 0; curr++) {
146
				if (curr->type == nh[off]) {
147 148
					/* type specific length/alignment
					   checks will be performed in the
L
Linus Torvalds 已提交
149
					   func(). */
150 151
					if (curr->func(skb, off) == false)
						return false;
L
Linus Torvalds 已提交
152 153 154 155
					break;
				}
			}
			if (curr->type < 0) {
156
				if (ip6_tlvopt_unknown(skb, off) == 0)
157
					return false;
L
Linus Torvalds 已提交
158
			}
159
			padlen = 0;
L
Linus Torvalds 已提交
160 161 162 163 164
			break;
		}
		off += optlen;
		len -= optlen;
	}
165

L
Linus Torvalds 已提交
166
	if (len == 0)
167
		return true;
L
Linus Torvalds 已提交
168 169
bad:
	kfree_skb(skb);
170
	return false;
L
Linus Torvalds 已提交
171 172 173 174 175 176
}

/*****************************
  Destination options header.
 *****************************/

A
Amerigo Wang 已提交
177
#if IS_ENABLED(CONFIG_IPV6_MIP6)
178
static bool ipv6_dest_hao(struct sk_buff *skb, int optoff)
179 180 181
{
	struct ipv6_destopt_hao *hao;
	struct inet6_skb_parm *opt = IP6CB(skb);
182
	struct ipv6hdr *ipv6h = ipv6_hdr(skb);
183 184 185 186 187 188 189 190 191 192
	struct in6_addr tmp_addr;
	int ret;

	if (opt->dsthao) {
		LIMIT_NETDEBUG(KERN_DEBUG "hao duplicated\n");
		goto discard;
	}
	opt->dsthao = opt->dst1;
	opt->dst1 = 0;

193
	hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) + optoff);
194 195 196 197 198 199 200 201 202

	if (hao->length != 16) {
		LIMIT_NETDEBUG(
			KERN_DEBUG "hao invalid option length = %d\n", hao->length);
		goto discard;
	}

	if (!(ipv6_addr_type(&hao->addr) & IPV6_ADDR_UNICAST)) {
		LIMIT_NETDEBUG(
H
Harvey Harrison 已提交
203
			KERN_DEBUG "hao is not an unicast addr: %pI6\n", &hao->addr);
204 205 206 207 208 209 210 211 212
		goto discard;
	}

	ret = xfrm6_input_addr(skb, (xfrm_address_t *)&ipv6h->daddr,
			       (xfrm_address_t *)&hao->addr, IPPROTO_DSTOPTS);
	if (unlikely(ret < 0))
		goto discard;

	if (skb_cloned(skb)) {
213
		if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC))
214 215 216
			goto discard;

		/* update all variable using below by copied skbuff */
217
		hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) +
218
						  optoff);
219
		ipv6h = ipv6_hdr(skb);
220 221 222 223 224
	}

	if (skb->ip_summed == CHECKSUM_COMPLETE)
		skb->ip_summed = CHECKSUM_NONE;

A
Alexey Dobriyan 已提交
225 226 227
	tmp_addr = ipv6h->saddr;
	ipv6h->saddr = hao->addr;
	hao->addr = tmp_addr;
228

229
	if (skb->tstamp.tv64 == 0)
230 231
		__net_timestamp(skb);

232
	return true;
233 234 235

 discard:
	kfree_skb(skb);
236
	return false;
237 238 239
}
#endif

240
/*
 * Handlers for the options recognised inside a destination options
 * header.  The entry with a negative type ends the table.
 */
static const struct tlvtype_proc tlvprocdestopt_lst[] = {
#if IS_ENABLED(CONFIG_IPV6_MIP6)
	{ .type = IPV6_TLV_HAO, .func = ipv6_dest_hao },
#endif
	{ .type = -1, .func = NULL }
};

250
static int ipv6_destopt_rcv(struct sk_buff *skb)
L
Linus Torvalds 已提交
251 252
{
	struct inet6_skb_parm *opt = IP6CB(skb);
A
Amerigo Wang 已提交
253
#if IS_ENABLED(CONFIG_IPV6_MIP6)
254 255
	__u16 dstbuf;
#endif
256
	struct dst_entry *dst = skb_dst(skb);
L
Linus Torvalds 已提交
257

258 259
	if (!pskb_may_pull(skb, skb_transport_offset(skb) + 8) ||
	    !pskb_may_pull(skb, (skb_transport_offset(skb) +
260
				 ((skb_transport_header(skb)[1] + 1) << 3)))) {
261
		IP6_INC_STATS_BH(dev_net(dst->dev), ip6_dst_idev(dst),
262
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
263 264 265 266
		kfree_skb(skb);
		return -1;
	}

267
	opt->lastopt = opt->dst1 = skb_network_header_len(skb);
A
Amerigo Wang 已提交
268
#if IS_ENABLED(CONFIG_IPV6_MIP6)
269 270
	dstbuf = opt->dst1;
#endif
L
Linus Torvalds 已提交
271

272
	if (ip6_parse_tlv(tlvprocdestopt_lst, skb)) {
273
		skb->transport_header += (skb_transport_header(skb)[1] + 1) << 3;
274
		opt = IP6CB(skb);
A
Amerigo Wang 已提交
275
#if IS_ENABLED(CONFIG_IPV6_MIP6)
276 277
		opt->nhoff = dstbuf;
#else
278
		opt->nhoff = opt->dst1;
279
#endif
L
Linus Torvalds 已提交
280 281 282
		return 1;
	}

283 284
	IP6_INC_STATS_BH(dev_net(dst->dev),
			 ip6_dst_idev(dst), IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
285 286 287 288 289 290 291
	return -1;
}

/********************************
  Routing header.
 ********************************/

292
/* called with rcu_read_lock() */
293
static int ipv6_rthdr_rcv(struct sk_buff *skb)
L
Linus Torvalds 已提交
294 295
{
	struct inet6_skb_parm *opt = IP6CB(skb);
296
	struct in6_addr *addr = NULL;
L
Linus Torvalds 已提交
297
	struct in6_addr daddr;
298
	struct inet6_dev *idev;
L
Linus Torvalds 已提交
299 300 301
	int n, i;
	struct ipv6_rt_hdr *hdr;
	struct rt0_hdr *rthdr;
302 303
	struct net *net = dev_net(skb->dev);
	int accept_source_route = net->ipv6.devconf_all->accept_source_route;
304

305 306 307
	idev = __in6_dev_get(skb->dev);
	if (idev && accept_source_route > idev->cnf.accept_source_route)
		accept_source_route = idev->cnf.accept_source_route;
308

309 310
	if (!pskb_may_pull(skb, skb_transport_offset(skb) + 8) ||
	    !pskb_may_pull(skb, (skb_transport_offset(skb) +
311
				 ((skb_transport_header(skb)[1] + 1) << 3)))) {
E
Eric Dumazet 已提交
312
		IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
313
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
314 315 316 317
		kfree_skb(skb);
		return -1;
	}

318
	hdr = (struct ipv6_rt_hdr *)skb_transport_header(skb);
L
Linus Torvalds 已提交
319

320
	if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr) ||
L
Linus Torvalds 已提交
321
	    skb->pkt_type != PACKET_HOST) {
E
Eric Dumazet 已提交
322
		IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
323
				 IPSTATS_MIB_INADDRERRORS);
L
Linus Torvalds 已提交
324 325 326 327 328 329
		kfree_skb(skb);
		return -1;
	}

looped_back:
	if (hdr->segments_left == 0) {
330
		switch (hdr->type) {
A
Amerigo Wang 已提交
331
#if IS_ENABLED(CONFIG_IPV6_MIP6)
332 333 334 335 336
		case IPV6_SRCRT_TYPE_2:
			/* Silently discard type 2 header unless it was
			 * processed by own
			 */
			if (!addr) {
E
Eric Dumazet 已提交
337
				IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
338
						 IPSTATS_MIB_INADDRERRORS);
339 340 341 342 343 344 345 346 347
				kfree_skb(skb);
				return -1;
			}
			break;
#endif
		default:
			break;
		}

348
		opt->lastopt = opt->srcrt = skb_network_header_len(skb);
349
		skb->transport_header += (hdr->hdrlen + 1) << 3;
L
Linus Torvalds 已提交
350 351
		opt->dst0 = opt->dst1;
		opt->dst1 = 0;
352
		opt->nhoff = (&hdr->nexthdr) - skb_network_header(skb);
L
Linus Torvalds 已提交
353 354 355
		return 1;
	}

356
	switch (hdr->type) {
A
Amerigo Wang 已提交
357
#if IS_ENABLED(CONFIG_IPV6_MIP6)
358
	case IPV6_SRCRT_TYPE_2:
359 360
		if (accept_source_route < 0)
			goto unknown_rh;
361 362
		/* Silently discard invalid RTH type 2 */
		if (hdr->hdrlen != 2 || hdr->segments_left != 1) {
E
Eric Dumazet 已提交
363
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
364
					 IPSTATS_MIB_INHDRERRORS);
365 366 367 368 369
			kfree_skb(skb);
			return -1;
		}
		break;
#endif
370 371
	default:
		goto unknown_rh;
L
Linus Torvalds 已提交
372 373 374 375 376 377 378 379 380 381
	}

	/*
	 *	This is the routing header forwarding algorithm from
	 *	RFC 2460, page 16.
	 */

	n = hdr->hdrlen >> 1;

	if (hdr->segments_left > n) {
E
Eric Dumazet 已提交
382
		IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
383
				 IPSTATS_MIB_INHDRERRORS);
384 385 386
		icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
				  ((&hdr->segments_left) -
				   skb_network_header(skb)));
L
Linus Torvalds 已提交
387 388 389 390 391 392 393 394
		return -1;
	}

	/* We are about to mangle packet header. Be careful!
	   Do not damage packets queued somewhere.
	 */
	if (skb_cloned(skb)) {
		/* the copy is a forwarded packet */
395
		if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC)) {
E
Eric Dumazet 已提交
396
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
397 398
					 IPSTATS_MIB_OUTDISCARDS);
			kfree_skb(skb);
L
Linus Torvalds 已提交
399 400
			return -1;
		}
401
		hdr = (struct ipv6_rt_hdr *)skb_transport_header(skb);
L
Linus Torvalds 已提交
402 403
	}

404
	if (skb->ip_summed == CHECKSUM_COMPLETE)
L
Linus Torvalds 已提交
405 406 407 408 409 410 411 412
		skb->ip_summed = CHECKSUM_NONE;

	i = n - --hdr->segments_left;

	rthdr = (struct rt0_hdr *) hdr;
	addr = rthdr->addr;
	addr += i - 1;

413
	switch (hdr->type) {
A
Amerigo Wang 已提交
414
#if IS_ENABLED(CONFIG_IPV6_MIP6)
415 416
	case IPV6_SRCRT_TYPE_2:
		if (xfrm6_input_addr(skb, (xfrm_address_t *)addr,
417
				     (xfrm_address_t *)&ipv6_hdr(skb)->saddr,
418
				     IPPROTO_ROUTING) < 0) {
E
Eric Dumazet 已提交
419
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
420
					 IPSTATS_MIB_INADDRERRORS);
421 422 423
			kfree_skb(skb);
			return -1;
		}
E
Eric Dumazet 已提交
424 425
		if (!ipv6_chk_home_addr(dev_net(skb_dst(skb)->dev), addr)) {
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
426
					 IPSTATS_MIB_INADDRERRORS);
427 428 429 430 431 432 433 434 435
			kfree_skb(skb);
			return -1;
		}
		break;
#endif
	default:
		break;
	}

L
Linus Torvalds 已提交
436
	if (ipv6_addr_is_multicast(addr)) {
E
Eric Dumazet 已提交
437
		IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
438
				 IPSTATS_MIB_INADDRERRORS);
L
Linus Torvalds 已提交
439 440 441 442
		kfree_skb(skb);
		return -1;
	}

A
Alexey Dobriyan 已提交
443 444 445
	daddr = *addr;
	*addr = ipv6_hdr(skb)->daddr;
	ipv6_hdr(skb)->daddr = daddr;
L
Linus Torvalds 已提交
446

E
Eric Dumazet 已提交
447
	skb_dst_drop(skb);
L
Linus Torvalds 已提交
448
	ip6_route_input(skb);
E
Eric Dumazet 已提交
449
	if (skb_dst(skb)->error) {
450
		skb_push(skb, skb->data - skb_network_header(skb));
L
Linus Torvalds 已提交
451 452 453 454
		dst_input(skb);
		return -1;
	}

E
Eric Dumazet 已提交
455
	if (skb_dst(skb)->dev->flags&IFF_LOOPBACK) {
456
		if (ipv6_hdr(skb)->hop_limit <= 1) {
E
Eric Dumazet 已提交
457
			IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)),
458
					 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
459
			icmpv6_send(skb, ICMPV6_TIME_EXCEED, ICMPV6_EXC_HOPLIMIT,
460
				    0);
L
Linus Torvalds 已提交
461 462 463
			kfree_skb(skb);
			return -1;
		}
464
		ipv6_hdr(skb)->hop_limit--;
L
Linus Torvalds 已提交
465 466 467
		goto looped_back;
	}

468
	skb_push(skb, skb->data - skb_network_header(skb));
L
Linus Torvalds 已提交
469 470
	dst_input(skb);
	return -1;
471 472

unknown_rh:
E
Eric Dumazet 已提交
473
	IP6_INC_STATS_BH(net, ip6_dst_idev(skb_dst(skb)), IPSTATS_MIB_INHDRERRORS);
474 475 476
	icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
			  (&hdr->type) - skb_network_header(skb));
	return -1;
L
Linus Torvalds 已提交
477 478
}

479
static const struct inet6_protocol rthdr_protocol = {
L
Linus Torvalds 已提交
480
	.handler	=	ipv6_rthdr_rcv,
481
	.flags		=	INET6_PROTO_NOPOLICY,
482 483
};

484
static const struct inet6_protocol destopt_protocol = {
485
	.handler	=	ipv6_destopt_rcv,
486
	.flags		=	INET6_PROTO_NOPOLICY,
487 488
};

489
static const struct inet6_protocol nodata_protocol = {
490 491 492 493 494
	.handler	=	dst_discard,
	.flags		=	INET6_PROTO_NOPOLICY,
};

/*
 * Register the input handlers for the routing header, the destination
 * options header and the "no next header" protocol value.
 *
 * Returns 0 on success.  If a registration fails, the handlers that were
 * already registered are removed again and the value returned by the
 * failing inet6_add_protocol() call is passed back.
 */
int __init ipv6_exthdrs_init(void)
{
	int ret;

	ret = inet6_add_protocol(&rthdr_protocol, IPPROTO_ROUTING);
	if (ret)
		return ret;

	ret = inet6_add_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
	if (ret)
		goto out_rthdr;

	ret = inet6_add_protocol(&nodata_protocol, IPPROTO_NONE);
	if (ret)
		goto out_destopt;

	return 0;

	/* Unwind in reverse order of registration. */
out_destopt:
	inet6_del_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
out_rthdr:
	inet6_del_protocol(&rthdr_protocol, IPPROTO_ROUTING);
	return ret;
}

519 520 521 522 523 524 525
/*
 * Remove the three protocol handlers added by ipv6_exthdrs_init(), in
 * the reverse of the order in which they were registered.
 */
void ipv6_exthdrs_exit(void)
{
	inet6_del_protocol(&nodata_protocol, IPPROTO_NONE);

	inet6_del_protocol(&destopt_protocol, IPPROTO_DSTOPTS);

	inet6_del_protocol(&rthdr_protocol, IPPROTO_ROUTING);
}

L
Linus Torvalds 已提交
526 527 528 529
/**********************************
  Hop-by-hop options.
 **********************************/

530
/*
 * Note: we cannot rely on skb_dst(skb) before we assign it in ip6_route_input().
 */
static inline struct inet6_dev *ipv6_skb_idev(struct sk_buff *skb)
{
E
Eric Dumazet 已提交
535
	return skb_dst(skb) ? ip6_dst_idev(skb_dst(skb)) : __in6_dev_get(skb->dev);
536 537
}

538 539 540 541 542
static inline struct net *ipv6_skb_net(struct sk_buff *skb)
{
	return skb_dst(skb) ? dev_net(skb_dst(skb)->dev) : dev_net(skb->dev);
}

L
Linus Torvalds 已提交
543 544
/* Router Alert as of RFC 2711 */

545
static bool ipv6_hop_ra(struct sk_buff *skb, int optoff)
L
Linus Torvalds 已提交
546
{
547
	const unsigned char *nh = skb_network_header(skb);
548

549
	if (nh[optoff + 1] == 2) {
550 551
		IP6CB(skb)->flags |= IP6SKB_ROUTERALERT;
		memcpy(&IP6CB(skb)->ra, nh + optoff + 2, sizeof(IP6CB(skb)->ra));
552
		return true;
L
Linus Torvalds 已提交
553
	}
554
	LIMIT_NETDEBUG(KERN_DEBUG "ipv6_hop_ra: wrong RA length %d\n",
555
		       nh[optoff + 1]);
L
Linus Torvalds 已提交
556
	kfree_skb(skb);
557
	return false;
L
Linus Torvalds 已提交
558 559 560 561
}

/* Jumbo payload */

562
static bool ipv6_hop_jumbo(struct sk_buff *skb, int optoff)
L
Linus Torvalds 已提交
563
{
564
	const unsigned char *nh = skb_network_header(skb);
565
	struct net *net = ipv6_skb_net(skb);
L
Linus Torvalds 已提交
566 567
	u32 pkt_len;

568
	if (nh[optoff + 1] != 4 || (optoff & 3) != 2) {
569
		LIMIT_NETDEBUG(KERN_DEBUG "ipv6_hop_jumbo: wrong jumbo opt length/alignment %d\n",
570
			       nh[optoff+1]);
571
		IP6_INC_STATS_BH(net, ipv6_skb_idev(skb),
572
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
573 574 575
		goto drop;
	}

576
	pkt_len = ntohl(*(__be32 *)(nh + optoff + 2));
L
Linus Torvalds 已提交
577
	if (pkt_len <= IPV6_MAXPLEN) {
578 579
		IP6_INC_STATS_BH(net, ipv6_skb_idev(skb),
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
580
		icmpv6_param_prob(skb, ICMPV6_HDR_FIELD, optoff+2);
581
		return false;
L
Linus Torvalds 已提交
582
	}
583
	if (ipv6_hdr(skb)->payload_len) {
584 585
		IP6_INC_STATS_BH(net, ipv6_skb_idev(skb),
				 IPSTATS_MIB_INHDRERRORS);
L
Linus Torvalds 已提交
586
		icmpv6_param_prob(skb, ICMPV6_HDR_FIELD, optoff);
587
		return false;
L
Linus Torvalds 已提交
588 589 590
	}

	if (pkt_len > skb->len - sizeof(struct ipv6hdr)) {
591 592
		IP6_INC_STATS_BH(net, ipv6_skb_idev(skb),
				 IPSTATS_MIB_INTRUNCATEDPKTS);
L
Linus Torvalds 已提交
593 594
		goto drop;
	}
595 596 597 598

	if (pskb_trim_rcsum(skb, pkt_len + sizeof(struct ipv6hdr)))
		goto drop;

599
	return true;
L
Linus Torvalds 已提交
600 601 602

drop:
	kfree_skb(skb);
603
	return false;
L
Linus Torvalds 已提交
604 605
}

606
static const struct tlvtype_proc tlvprochopopt_lst[] = {
L
Linus Torvalds 已提交
607 608 609 610 611 612 613 614 615 616 617
	{
		.type	= IPV6_TLV_ROUTERALERT,
		.func	= ipv6_hop_ra,
	},
	{
		.type	= IPV6_TLV_JUMBO,
		.func	= ipv6_hop_jumbo,
	},
	{ -1, }
};

618
int ipv6_parse_hopopts(struct sk_buff *skb)
L
Linus Torvalds 已提交
619
{
620 621
	struct inet6_skb_parm *opt = IP6CB(skb);

622
	/*
623
	 * skb_network_header(skb) is equal to skb->data, and
624
	 * skb_network_header_len(skb) is always equal to
625 626 627 628
	 * sizeof(struct ipv6hdr) by definition of
	 * hop-by-hop options.
	 */
	if (!pskb_may_pull(skb, sizeof(struct ipv6hdr) + 8) ||
629 630
	    !pskb_may_pull(skb, (sizeof(struct ipv6hdr) +
				 ((skb_transport_header(skb)[1] + 1) << 3)))) {
631 632 633 634
		kfree_skb(skb);
		return -1;
	}

635
	opt->hop = sizeof(struct ipv6hdr);
636
	if (ip6_parse_tlv(tlvprochopopt_lst, skb)) {
637
		skb->transport_header += (skb_transport_header(skb)[1] + 1) << 3;
638
		opt = IP6CB(skb);
639
		opt->nhoff = sizeof(struct ipv6hdr);
640
		return 1;
641
	}
L
Linus Torvalds 已提交
642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662
	return -1;
}

/*
 *	Creating outbound headers.
 *
 *	"build" functions work when skb is filled from head to tail (datagram)
 *	"push"	functions work when headers are added from tail to head (tcp)
 *
 *	In both cases we assume, that caller reserved enough room
 *	for headers.
 */

/*
 * Prepend a routing header to the skb, built from the template opt.
 *
 * The address list is shifted by one place: the template's first address
 * is left out, the remaining ones move up, and the address *addr_p points
 * to is stored in the last slot.  *addr_p is then redirected to the
 * template's first address.  The new header's nexthdr takes the old
 * *proto and *proto becomes NEXTHDR_ROUTING.
 *
 * NOTE(review): assumes the template holds at least one address
 * (hdrlen >= 2) - confirm that callers guarantee this.
 */
static void ipv6_push_rthdr(struct sk_buff *skb, u8 *proto,
			    struct ipv6_rt_hdr *opt,
			    struct in6_addr **addr_p)
{
	struct rt0_hdr *src = (struct rt0_hdr *)opt;
	struct rt0_hdr *dst;
	int last;

	dst = (struct rt0_hdr *)skb_push(skb, (src->rt_hdr.hdrlen + 1) << 3);
	memcpy(dst, src, sizeof(struct rt0_hdr));

	/* Index of the final address slot: two 8-octet units per address. */
	last = (src->rt_hdr.hdrlen >> 1) - 1;

	if (last > 0)
		memcpy(dst->addr, src->addr + 1,
		       last * sizeof(struct in6_addr));

	dst->addr[last] = **addr_p;
	*addr_p = src->addr;

	dst->rt_hdr.nexthdr = *proto;
	*proto = NEXTHDR_ROUTING;
}

/*
 * Prepend a copy of the options header opt to the skb.  The copy's
 * nexthdr takes the old *proto and *proto becomes type.
 */
static void ipv6_push_exthdr(struct sk_buff *skb, u8 *proto, u8 type, struct ipv6_opt_hdr *opt)
{
	struct ipv6_opt_hdr *pushed;

	pushed = (struct ipv6_opt_hdr *)skb_push(skb, ipv6_optlen(opt));
	memcpy(pushed, opt, ipv6_optlen(opt));

	pushed->nexthdr = *proto;
	*proto = type;
}

/*
 * Prepend the extension headers held in opt->srcrt, opt->dst0opt and
 * opt->hopopt to the skb.  The routing header is pushed first, then the
 * destination options header, then the hop-by-hop options header;
 * *proto and *daddr are updated as the headers are pushed.
 */
void ipv6_push_nfrag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt,
			  u8 *proto,
			  struct in6_addr **daddr)
{
	struct ipv6_rt_hdr *rthdr = opt->srcrt;

	if (rthdr) {
		ipv6_push_rthdr(skb, proto, rthdr, daddr);
		/*
		 * IPV6_RTHDRDSTOPTS is ignored
		 * unless IPV6_RTHDR is set (RFC3542).
		 */
		if (opt->dst0opt)
			ipv6_push_exthdr(skb, proto, NEXTHDR_DEST, opt->dst0opt);
	}

	if (opt->hopopt)
		ipv6_push_exthdr(skb, proto, NEXTHDR_HOP, opt->hopopt);
}
705 706
EXPORT_SYMBOL(ipv6_push_nfrag_opts);

L
Linus Torvalds 已提交
707 708 709 710 711 712 713 714 715 716 717 718 719
/*
 * Prepend the destination options header held in opt->dst1opt, if there
 * is one, updating *proto accordingly.
 */
void ipv6_push_frag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt, u8 *proto)
{
	struct ipv6_opt_hdr *dst1 = opt->dst1opt;

	if (!dst1)
		return;

	ipv6_push_exthdr(skb, proto, NEXTHDR_DEST, dst1);
}

/*
 * Duplicate a set of transmit options.
 *
 * opt->tot_len bytes are allocated with sock_kmalloc() against sk and
 * the original is copied into them.  The non-NULL header pointers of the
 * copy are then moved by the distance between the two allocations, so
 * that pointers which referred into the original now refer to the same
 * offset in the copy.
 *
 * Returns the copy, or NULL when the allocation fails.
 */
struct ipv6_txoptions *
ipv6_dup_options(struct sock *sk, struct ipv6_txoptions *opt)
{
	struct ipv6_txoptions *copy;
	long delta;

	copy = sock_kmalloc(sk, opt->tot_len, GFP_ATOMIC);
	if (!copy)
		return copy;

	delta = (char *)copy - (char *)opt;
	memcpy(copy, opt, opt->tot_len);

	if (copy->hopopt)
		copy->hopopt = (void *)((char *)copy->hopopt + delta);
	if (copy->dst0opt)
		copy->dst0opt = (void *)((char *)copy->dst0opt + delta);
	if (copy->dst1opt)
		copy->dst1opt = (void *)((char *)copy->dst1opt + delta);
	if (copy->srcrt)
		copy->srcrt = (void *)((char *)copy->srcrt + delta);

	return copy;
}
733 734
EXPORT_SYMBOL_GPL(ipv6_dup_options);

735 736 737 738 739 740 741 742 743 744
/*
 * Fill one header slot of a new option block being assembled at *p.
 *
 * With inherit set, the old header ohdr (if any) is copied to *p.
 * Otherwise the user-supplied header newopt (if any) is copied in from
 * user space and rejected if its own length field announces more than
 * newoptlen bytes.  When something was copied, *hdr is set to point at
 * it and *p is advanced by the CMSG_ALIGN()ed length.
 *
 * Returns 0 on success, -EFAULT if the user copy fails, or -EINVAL on
 * the length mismatch.
 */
static int ipv6_renew_option(void *ohdr,
			     struct ipv6_opt_hdr __user *newopt, int newoptlen,
			     int inherit,
			     struct ipv6_opt_hdr **hdr,
			     char **p)
{
	if (inherit) {
		if (!ohdr)
			return 0;

		memcpy(*p, ohdr, ipv6_optlen((struct ipv6_opt_hdr *)ohdr));
		*hdr = (struct ipv6_opt_hdr *)*p;
		*p += CMSG_ALIGN(ipv6_optlen(*hdr));
		return 0;
	}

	if (!newopt)
		return 0;

	if (copy_from_user(*p, newopt, newoptlen))
		return -EFAULT;

	*hdr = (struct ipv6_opt_hdr *)*p;
	if (ipv6_optlen(*hdr) > newoptlen)
		return -EINVAL;

	*p += CMSG_ALIGN(newoptlen);
	return 0;
}

/*
 * Build a new option block from the existing block opt, with the header
 * of kind newtype replaced by the user-supplied newopt.  Headers of the
 * other three kinds are carried over from opt; a NULL newopt leaves the
 * newtype slot empty.
 *
 * Returns the new block, NULL when the result would hold no header at
 * all, or an ERR_PTR(): -ENOBUFS when the allocation fails, otherwise
 * the error returned by ipv6_renew_option().
 */
struct ipv6_txoptions *
ipv6_renew_options(struct sock *sk, struct ipv6_txoptions *opt,
		   int newtype,
		   struct ipv6_opt_hdr __user *newopt, int newoptlen)
{
	struct ipv6_txoptions *opt2;
	int tot_len = 0;
	char *cursor;
	int err;

	/* Space for every old header that is not being replaced. */
	if (opt) {
		if (opt->hopopt && newtype != IPV6_HOPOPTS)
			tot_len += CMSG_ALIGN(ipv6_optlen(opt->hopopt));
		if (opt->dst0opt && newtype != IPV6_RTHDRDSTOPTS)
			tot_len += CMSG_ALIGN(ipv6_optlen(opt->dst0opt));
		if (opt->srcrt && newtype != IPV6_RTHDR)
			tot_len += CMSG_ALIGN(ipv6_optlen(opt->srcrt));
		if (opt->dst1opt && newtype != IPV6_DSTOPTS)
			tot_len += CMSG_ALIGN(ipv6_optlen(opt->dst1opt));
	}

	/* Plus the incoming header. */
	if (newopt && newoptlen)
		tot_len += CMSG_ALIGN(newoptlen);

	if (tot_len == 0)
		return NULL;

	tot_len += sizeof(*opt2);
	opt2 = sock_kmalloc(sk, tot_len, GFP_ATOMIC);
	if (!opt2)
		return ERR_PTR(-ENOBUFS);

	memset(opt2, 0, tot_len);
	opt2->tot_len = tot_len;

	/* Headers are packed right behind the struct itself. */
	cursor = (char *)(opt2 + 1);

	err = ipv6_renew_option(opt ? opt->hopopt : NULL, newopt, newoptlen,
				newtype != IPV6_HOPOPTS,
				&opt2->hopopt, &cursor);
	if (err)
		goto free_opt2;

	err = ipv6_renew_option(opt ? opt->dst0opt : NULL, newopt, newoptlen,
				newtype != IPV6_RTHDRDSTOPTS,
				&opt2->dst0opt, &cursor);
	if (err)
		goto free_opt2;

	err = ipv6_renew_option(opt ? opt->srcrt : NULL, newopt, newoptlen,
				newtype != IPV6_RTHDR,
				(struct ipv6_opt_hdr **)&opt2->srcrt, &cursor);
	if (err)
		goto free_opt2;

	err = ipv6_renew_option(opt ? opt->dst1opt : NULL, newopt, newoptlen,
				newtype != IPV6_DSTOPTS,
				&opt2->dst1opt, &cursor);
	if (err)
		goto free_opt2;

	/* hopopt, dst0opt and srcrt count towards opt_nflen. */
	opt2->opt_nflen = (opt2->hopopt ? ipv6_optlen(opt2->hopopt) : 0) +
			  (opt2->dst0opt ? ipv6_optlen(opt2->dst0opt) : 0) +
			  (opt2->srcrt ? ipv6_optlen(opt2->srcrt) : 0);
	/* dst1opt alone counts towards opt_flen. */
	opt2->opt_flen = (opt2->dst1opt ? ipv6_optlen(opt2->dst1opt) : 0);

	return opt2;

free_opt2:
	sock_kfree_s(sk, opt2, opt2->tot_len);
	return ERR_PTR(err);
}

832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849
/*
 * Drop the first destination options header (dst0opt) from opt when no
 * routing header goes with it.
 *
 * If a change is needed and opt is not already opt_space, the struct is
 * first copied into opt_space and the copy is modified instead.
 *
 * Returns the option block to use: opt itself when nothing changed
 * (which may be NULL), otherwise the adjusted block.
 */
struct ipv6_txoptions *ipv6_fixup_options(struct ipv6_txoptions *opt_space,
					  struct ipv6_txoptions *opt)
{
	/*
	 * ignore the dest before srcrt unless srcrt is being included.
	 * --yoshfuji
	 */
	if (!opt || !opt->dst0opt || opt->srcrt)
		return opt;

	if (opt != opt_space) {
		memcpy(opt_space, opt, sizeof(*opt_space));
		opt = opt_space;
	}

	opt->opt_nflen -= ipv6_optlen(opt->dst0opt);
	opt->dst0opt = NULL;

	return opt;
}
850
EXPORT_SYMBOL_GPL(ipv6_fixup_options);
851

852 853 854 855
/**
 * fl6_update_dst - update flowi destination address with info given
 *                  by srcrt option, if any.
 *
 * @fl6: flowi6 for which daddr is to be updated
 * @opt: struct ipv6_txoptions in which to look for srcrt opt
 * @orig: copy of original daddr address if modified
 *
 * Returns NULL if no txoptions or no srcrt, otherwise returns orig
 * and initial value of fl6->daddr set in orig
 */
struct in6_addr *fl6_update_dst(struct flowi6 *fl6,
864 865 866 867 868 869
				const struct ipv6_txoptions *opt,
				struct in6_addr *orig)
{
	if (!opt || !opt->srcrt)
		return NULL;

A
Alexey Dobriyan 已提交
870 871
	*orig = fl6->daddr;
	fl6->daddr = *((struct rt0_hdr *)opt->srcrt)->addr;
872 873 874
	return orig;
}
EXPORT_SYMBOL_GPL(fl6_update_dst);