ipv6.h 25.5 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
/*
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */

#ifndef _NET_IPV6_H
#define _NET_IPV6_H

#include <linux/ipv6.h>
#include <linux/hardirq.h>
E
Eric Dumazet 已提交
18
#include <linux/jhash.h>
19
#include <net/if_inet6.h>
L
Linus Torvalds 已提交
20 21
#include <net/ndisc.h>
#include <net/flow.h>
22
#include <net/flow_keys.h>
L
Linus Torvalds 已提交
23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38
#include <net/snmp.h>

#define SIN6_LEN_RFC2133	24

#define IPV6_MAXPLEN		65535

/*
 *	NextHeader field of IPv6 header
 */

#define NEXTHDR_HOP		0	/* Hop-by-hop option header. */
#define NEXTHDR_TCP		6	/* TCP segment. */
#define NEXTHDR_UDP		17	/* UDP message. */
#define NEXTHDR_IPV6		41	/* IPv6 in IPv6 */
#define NEXTHDR_ROUTING		43	/* Routing header. */
#define NEXTHDR_FRAGMENT	44	/* Fragmentation/reassembly header. */
X
xeb@mail.ru 已提交
39
#define NEXTHDR_GRE		47	/* GRE header. */
L
Linus Torvalds 已提交
40 41 42 43 44
#define NEXTHDR_ESP		50	/* Encapsulating security payload. */
#define NEXTHDR_AUTH		51	/* Authentication header. */
#define NEXTHDR_ICMP		58	/* ICMP for IPv6. */
#define NEXTHDR_NONE		59	/* No next header */
#define NEXTHDR_DEST		60	/* Destination options header. */
J
Joe Stringer 已提交
45
#define NEXTHDR_SCTP		132	/* SCTP message. */
46
#define NEXTHDR_MOBILITY	135	/* Mobility header. */
L
Linus Torvalds 已提交
47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92

#define NEXTHDR_MAX		255



#define IPV6_DEFAULT_HOPLIMIT   64
#define IPV6_DEFAULT_MCASTHOPS	1

/*
 *	Addr type
 *	
 *	type	-	unicast | multicast
 *	scope	-	local	| site	    | global
 *	v4	-	compat
 *	v4mapped
 *	any
 *	loopback
 */

#define IPV6_ADDR_ANY		0x0000U

#define IPV6_ADDR_UNICAST      	0x0001U	
#define IPV6_ADDR_MULTICAST    	0x0002U	

#define IPV6_ADDR_LOOPBACK	0x0010U
#define IPV6_ADDR_LINKLOCAL	0x0020U
#define IPV6_ADDR_SITELOCAL	0x0040U

#define IPV6_ADDR_COMPATv4	0x0080U

#define IPV6_ADDR_SCOPE_MASK	0x00f0U

#define IPV6_ADDR_MAPPED	0x1000U

/*
 *	Addr scopes
 */
#define IPV6_ADDR_MC_SCOPE(a)	\
	((a)->s6_addr[1] & 0x0f)	/* nonstandard */
#define __IPV6_ADDR_SCOPE_INVALID	-1
#define IPV6_ADDR_SCOPE_NODELOCAL	0x01
#define IPV6_ADDR_SCOPE_LINKLOCAL	0x02
#define IPV6_ADDR_SCOPE_SITELOCAL	0x05
#define IPV6_ADDR_SCOPE_ORGLOCAL	0x08
#define IPV6_ADDR_SCOPE_GLOBAL		0x0e

93 94 95 96 97 98 99 100 101 102
/*
 *	Addr flags
 */
#define IPV6_ADDR_MC_FLAG_TRANSIENT(a)	\
	((a)->s6_addr[1] & 0x10)
#define IPV6_ADDR_MC_FLAG_PREFIX(a)	\
	((a)->s6_addr[1] & 0x20)
#define IPV6_ADDR_MC_FLAG_RENDEZVOUS(a)	\
	((a)->s6_addr[1] & 0x40)

L
Linus Torvalds 已提交
103 104 105 106 107
/*
 *	fragmentation header
 */

struct frag_hdr {
A
Al Viro 已提交
108 109 110 111
	__u8	nexthdr;
	__u8	reserved;
	__be16	frag_off;
	__be32	identification;
L
Linus Torvalds 已提交
112 113
};

114 115
#define	IP6_MF		0x0001
#define	IP6_OFFSET	0xFFF8
L
Linus Torvalds 已提交
116

117 118 119
#define IP6_REPLY_MARK(net, mark) \
	((net)->ipv6.sysctl.fwmark_reflect ? (mark) : 0)

L
Linus Torvalds 已提交
120 121 122 123
#include <net/sock.h>

/* sysctls */
extern int sysctl_mld_max_msf;
124

125
/*
 * Increment one SNMP counter per device and per network namespace.
 *
 * @idev is evaluated exactly once.  When it is non-NULL, @field is
 * incremented in (idev)->stats.<statname>.  @field is then incremented in
 * (net)->mib.<statname>_statistics unconditionally.  @modifier is pasted
 * onto SNMP_INC_STATS to select the helper variant used for both updates.
 */
#define _DEVINC(net, statname, modifier, idev, field)			\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_INC_STATS##modifier((_idev)->stats.statname, (field)); \
	SNMP_INC_STATS##modifier((net)->mib.statname##_statistics, (field));\
})
132

133 134 135 136 137 138 139 140 141
/*
 * per device counters are atomic_long_t
 *
 * @idev is evaluated exactly once.  When it is non-NULL, @field is
 * incremented in (idev)->stats.<statname>dev with
 * SNMP_INC_STATS_ATOMIC_LONG.  The namespace-wide counter in
 * (net)->mib.<statname>_statistics is then incremented unconditionally with
 * SNMP_INC_STATS<modifier>; @modifier only affects this second update.
 */
#define _DEVINCATOMIC(net, statname, modifier, idev, field)		\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_INC_STATS_ATOMIC_LONG((_idev)->stats.statname##dev, (field)); \
	SNMP_INC_STATS##modifier((net)->mib.statname##_statistics, (field));\
})

142 143 144 145 146 147 148 149 150
/*
 * per device and per net counters are atomic_long_t
 *
 * @idev is evaluated exactly once.  When it is non-NULL, @field is
 * incremented in (idev)->stats.<statname>dev.  @field is then incremented
 * in (net)->mib.<statname>_statistics unconditionally.  Both updates use
 * SNMP_INC_STATS_ATOMIC_LONG, so this macro takes no modifier argument.
 */
#define _DEVINC_ATOMIC_ATOMIC(net, statname, idev, field)		\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_INC_STATS_ATOMIC_LONG((_idev)->stats.statname##dev, (field)); \
	SNMP_INC_STATS_ATOMIC_LONG((net)->mib.statname##_statistics, (field));\
})

151
/*
 * Add @val to one SNMP counter per device and per network namespace.
 *
 * @idev is evaluated exactly once.  When it is non-NULL, @val is added to
 * @field in (idev)->stats.<statname>.  @val is then added to @field in
 * (net)->mib.<statname>_statistics unconditionally.  @modifier is pasted
 * onto SNMP_ADD_STATS to select the helper variant used for both updates.
 * Note that @field and @val are expanded twice when @idev is non-NULL.
 */
#define _DEVADD(net, statname, modifier, idev, field, val)		\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_ADD_STATS##modifier((_idev)->stats.statname, (field), (val)); \
	SNMP_ADD_STATS##modifier((net)->mib.statname##_statistics, (field), (val));\
})

159 160 161 162 163 164 165 166
/*
 * Apply SNMP_UPD_PO_STATS<modifier> with @val per device and per network
 * namespace.
 *
 * @idev is evaluated exactly once.  When it is non-NULL the update is
 * applied to (idev)->stats.<statname>.  It is then applied to
 * (net)->mib.<statname>_statistics unconditionally.
 *
 * NOTE(review): unlike the sibling macros, @field is forwarded without
 * parentheses - presumably because SNMP_UPD_PO_STATS pastes a suffix onto
 * it; confirm before "fixing" this.
 */
#define _DEVUPD(net, statname, modifier, idev, field, val)		\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_UPD_PO_STATS##modifier((_idev)->stats.statname, field, (val)); \
	SNMP_UPD_PO_STATS##modifier((net)->mib.statname##_statistics, field, (val));\
})

167 168
/* MIBs */

169
/*
 * Thin wrappers around the _DEV* helpers.  Each one fixes the MIB name
 * (ipv6 or icmpv6) and the SNMP helper suffix: 64 / 64_BH for the ipv6 MIB,
 * empty / _BH for the icmpv6 MIB.
 */
#define IP6_INC_STATS(net, idev,field)		\
		_DEVINC(net, ipv6, 64, idev, field)
#define IP6_INC_STATS_BH(net, idev,field)	\
		_DEVINC(net, ipv6, 64_BH, idev, field)
#define IP6_ADD_STATS(net, idev,field,val)	\
		_DEVADD(net, ipv6, 64, idev, field, val)
#define IP6_ADD_STATS_BH(net, idev,field,val)	\
		_DEVADD(net, ipv6, 64_BH, idev, field, val)
#define IP6_UPD_PO_STATS(net, idev,field,val)   \
		_DEVUPD(net, ipv6, 64, idev, field, val)
#define IP6_UPD_PO_STATS_BH(net, idev,field,val)   \
		_DEVUPD(net, ipv6, 64_BH, idev, field, val)
#define ICMP6_INC_STATS(net, idev, field)	\
		_DEVINCATOMIC(net, icmpv6, , idev, field)
#define ICMP6_INC_STATS_BH(net, idev, field)	\
		_DEVINCATOMIC(net, icmpv6, _BH, idev, field)
185 186

/*
 * Per-message-type ICMPv6 counters in the icmpv6msg MIB.  The "in" macro
 * indexes the MIB at @field, the "out" macros at @field + 256.  The plain
 * and _BH "out" variants expand identically.
 *
 * @field is parenthesized before the offset is added so that an argument
 * containing a lower-precedence operator (e.g. a conditional expression)
 * is offset as a whole.
 */
#define ICMP6MSGOUT_INC_STATS(net, idev, field)		\
	_DEVINC_ATOMIC_ATOMIC(net, icmpv6msg, idev, (field) + 256)
#define ICMP6MSGOUT_INC_STATS_BH(net, idev, field)	\
	_DEVINC_ATOMIC_ATOMIC(net, icmpv6msg, idev, (field) + 256)
#define ICMP6MSGIN_INC_STATS_BH(net, idev, field)	\
	_DEVINC_ATOMIC_ATOMIC(net, icmpv6msg, idev, field)
192

E
Eric Dumazet 已提交
193
/* Node of a singly linked list (linked through @next) of sockets. */
struct ip6_ra_chain {
	struct ip6_ra_chain	*next;
	struct sock		*sk;
	/* presumably the value passed as "sel" to ip6_ra_control() - confirm */
	int			sel;
	void			(*destructor)(struct sock *);
};

extern struct ip6_ra_chain	*ip6_ra_chain;
extern rwlock_t ip6_ra_lock;

/*
   This structure is prepared by protocol, when parsing
   ancillary data and passed to IPv6.
 */

E
Eric Dumazet 已提交
208
struct ipv6_txoptions {
L
Linus Torvalds 已提交
209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224
	/* Length of this structure */
	int			tot_len;

	/* length of extension headers   */

	__u16			opt_flen;	/* after fragment hdr */
	__u16			opt_nflen;	/* before fragment hdr */

	struct ipv6_opt_hdr	*hopopt;
	struct ipv6_opt_hdr	*dst0opt;
	struct ipv6_rt_hdr	*srcrt;	/* Routing Header */
	struct ipv6_opt_hdr	*dst1opt;

	/* Option buffer, as read by IPV6_PKTOPTIONS, starts here. */
};

E
Eric Dumazet 已提交
225
struct ip6_flowlabel {
226
	struct ip6_flowlabel __rcu *next;
A
Al Viro 已提交
227
	__be32			label;
228
	atomic_t		users;
L
Linus Torvalds 已提交
229 230 231
	struct in6_addr		dst;
	struct ipv6_txoptions	*opt;
	unsigned long		linger;
232
	struct rcu_head		rcu;
L
Linus Torvalds 已提交
233
	u8			share;
234 235 236 237
	union {
		struct pid *pid;
		kuid_t uid;
	} owner;
L
Linus Torvalds 已提交
238 239
	unsigned long		lastuse;
	unsigned long		expires;
240
	struct net		*fl_net;
L
Linus Torvalds 已提交
241 242
};

243 244
#define IPV6_FLOWINFO_MASK	cpu_to_be32(0x0FFFFFFF)
#define IPV6_FLOWLABEL_MASK	cpu_to_be32(0x000FFFFF)
245
#define IPV6_TCLASS_MASK (IPV6_FLOWINFO_MASK & ~IPV6_FLOWLABEL_MASK)
246
#define IPV6_TCLASS_SHIFT	20
L
Linus Torvalds 已提交
247

E
Eric Dumazet 已提交
248
struct ipv6_fl_socklist {
249 250 251
	struct ipv6_fl_socklist	__rcu	*next;
	struct ip6_flowlabel		*fl;
	struct rcu_head			rcu;
L
Linus Torvalds 已提交
252 253
};

254 255 256 257 258 259
struct ip6_flowlabel *fl6_sock_lookup(struct sock *sk, __be32 label);
struct ipv6_txoptions *fl6_merge_options(struct ipv6_txoptions *opt_space,
					 struct ip6_flowlabel *fl,
					 struct ipv6_txoptions *fopt);
void fl6_free_socklist(struct sock *sk);
int ipv6_flowlabel_opt(struct sock *sk, char __user *optval, int optlen);
260 261
int ipv6_flowlabel_opt_get(struct sock *sk, struct in6_flowlabel_req *freq,
			   int flags);
262 263
int ip6_flowlabel_init(void);
void ip6_flowlabel_cleanup(void);
L
Linus Torvalds 已提交
264 265 266 267 268 269 270

/*
 * Atomically decrement the users counter of @fl.
 * A NULL @fl is accepted and ignored.
 */
static inline void fl6_sock_release(struct ip6_flowlabel *fl)
{
	if (!fl)
		return;

	atomic_dec(&fl->users);
}

271
void icmpv6_notify(struct sk_buff *skb, u8 type, u8 code, __be32 info);
272

273 274 275
int icmpv6_push_pending_frames(struct sock *sk, struct flowi6 *fl6,
			       struct icmp6hdr *thdr, int len);

276
int ip6_ra_control(struct sock *sk, int sel);
L
Linus Torvalds 已提交
277

278
int ipv6_parse_hopopts(struct sk_buff *skb);
L
Linus Torvalds 已提交
279

280 281 282 283 284 285 286
struct ipv6_txoptions *ipv6_dup_options(struct sock *sk,
					struct ipv6_txoptions *opt);
struct ipv6_txoptions *ipv6_renew_options(struct sock *sk,
					  struct ipv6_txoptions *opt,
					  int newtype,
					  struct ipv6_opt_hdr __user *newopt,
					  int newoptlen);
287 288
struct ipv6_txoptions *ipv6_fixup_options(struct ipv6_txoptions *opt_space,
					  struct ipv6_txoptions *opt);
L
Linus Torvalds 已提交
289

290
bool ipv6_opt_accepted(const struct sock *sk, const struct sk_buff *skb);
291

292 293 294 295 296 297 298 299 300
/*
 * Tell whether router advertisements are accepted on @idev, based on its
 * cnf.forwarding and cnf.accept_ra settings.
 */
static inline bool ipv6_accept_ra(struct inet6_dev *idev)
{
	/*
	 * While forwarding is enabled only the special hybrid mode
	 * (accept_ra=2) lets RAs through.
	 */
	if (idev->cnf.forwarding)
		return idev->cnf.accept_ra == 2;

	/* Not forwarding: any non-zero accept_ra enables RA processing. */
	return idev->cnf.accept_ra;
}

301 302 303
#if IS_ENABLED(CONFIG_IPV6)
/* Return sum_frag_mem_limit() of the IPv6 fragment state kept in @net. */
static inline int ip6_frag_mem(struct net *net)
{
	return sum_frag_mem_limit(&net->ipv6.frags);
}
#endif
L
Linus Torvalds 已提交
307

308 309
#define IPV6_FRAG_HIGH_THRESH	(4 * 1024*1024)	/* 4194304 */
#define IPV6_FRAG_LOW_THRESH	(3 * 1024*1024)	/* 3145728 */
310
#define IPV6_FRAG_TIMEOUT	(60 * HZ)	/* 60 seconds */
L
Linus Torvalds 已提交
311

312
int __ipv6_addr_type(const struct in6_addr *addr);
313 314 315 316
/*
 * Return the low 16 bits of __ipv6_addr_type(@addr).  The bits above them
 * are consumed separately by __ipv6_addr_src_scope().
 */
static inline int ipv6_addr_type(const struct in6_addr *addr)
{
	const int full_type = __ipv6_addr_type(addr);

	return full_type & 0xffff;
}
L
Linus Torvalds 已提交
317 318 319

static inline int ipv6_addr_scope(const struct in6_addr *addr)
{
320 321 322 323 324
	return __ipv6_addr_type(addr) & IPV6_ADDR_SCOPE_MASK;
}

static inline int __ipv6_addr_src_scope(int type)
{
E
Eric Dumazet 已提交
325
	return (type == IPV6_ADDR_ANY) ? __IPV6_ADDR_SCOPE_INVALID : (type >> 16);
326 327 328 329 330
}

/* Classify @addr with __ipv6_addr_type() and return its source scope. */
static inline int ipv6_addr_src_scope(const struct in6_addr *addr)
{
	return __ipv6_addr_src_scope(__ipv6_addr_type(addr));
}

333 334 335 336 337 338 339 340 341 342 343 344
static inline bool __ipv6_addr_needs_scope_id(int type)
{
	return type & IPV6_ADDR_LINKLOCAL ||
	       (type & IPV6_ADDR_MULTICAST &&
		(type & (IPV6_ADDR_LOOPBACK|IPV6_ADDR_LINKLOCAL)));
}

/*
 * Return @iface as the scope id when the type of @addr needs one
 * (see __ipv6_addr_needs_scope_id()), and 0 otherwise.
 */
static inline __u32 ipv6_iface_scope_id(const struct in6_addr *addr, int iface)
{
	if (!__ipv6_addr_needs_scope_id(__ipv6_addr_type(addr)))
		return 0;

	return iface;
}

L
Linus Torvalds 已提交
345 346
/*
 * Byte-wise comparison of two addresses with memcmp() semantics:
 * returns 0 when equal, otherwise a negative or positive value.
 */
static inline int ipv6_addr_cmp(const struct in6_addr *a1, const struct in6_addr *a2)
{
	return memcmp(a1, a2, sizeof(struct in6_addr));
}

350
static inline bool
351 352 353
ipv6_masked_addr_cmp(const struct in6_addr *a1, const struct in6_addr *m,
		     const struct in6_addr *a2)
{
354 355 356 357 358 359 360 361
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	const unsigned long *ul1 = (const unsigned long *)a1;
	const unsigned long *ulm = (const unsigned long *)m;
	const unsigned long *ul2 = (const unsigned long *)a2;

	return !!(((ul1[0] ^ ul2[0]) & ulm[0]) |
		  ((ul1[1] ^ ul2[1]) & ulm[1]));
#else
E
Eric Dumazet 已提交
362 363 364 365
	return !!(((a1->s6_addr32[0] ^ a2->s6_addr32[0]) & m->s6_addr32[0]) |
		  ((a1->s6_addr32[1] ^ a2->s6_addr32[1]) & m->s6_addr32[1]) |
		  ((a1->s6_addr32[2] ^ a2->s6_addr32[2]) & m->s6_addr32[2]) |
		  ((a1->s6_addr32[3] ^ a2->s6_addr32[3]) & m->s6_addr32[3]));
366
#endif
367 368
}

L
Linus Torvalds 已提交
369 370 371 372 373 374 375 376
/*
 * Store in @pfx the first @plen bits of @addr, with all remaining bits
 * cleared.
 */
static inline void ipv6_addr_prefix(struct in6_addr *pfx,
				    const struct in6_addr *addr,
				    int plen)
{
	/* caller must guarantee 0 <= plen <= 128 */
	int o = plen >> 3,	/* number of whole bytes in the prefix */
	    b = plen & 0x7;	/* leftover bits in the following byte */

	memset(pfx->s6_addr, 0, sizeof(pfx->s6_addr));
	memcpy(pfx->s6_addr, addr, o);
	/* 0xff00 >> b keeps, in its low byte, the top b bits of the byte */
	if (b != 0)
		pfx->s6_addr[o] = addr->s6_addr[o] & (0xff00 >> b);
}

383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402
/*
 * Store two 32-bit big-endian words at addr[0] (@wh) and addr[1] (@wl).
 *
 * On 64-bit builds with efficient unaligned access, and only when both
 * words are compile-time constants, the two words are merged into a single
 * 64-bit store.  Which word goes into the upper 32 bits of that store
 * depends on the CPU byte order so that the resulting memory layout is the
 * same as the two plain 32-bit stores at the end of the function.
 */
static inline void __ipv6_addr_set_half(__be32 *addr,
					__be32 wh, __be32 wl)
{
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
#if defined(__BIG_ENDIAN)
	/* big endian: the first word in memory is the high half of the u64 */
	if (__builtin_constant_p(wh) && __builtin_constant_p(wl)) {
		*(__force u64 *)addr = ((__force u64)(wh) << 32 | (__force u64)(wl));
		return;
	}
#elif defined(__LITTLE_ENDIAN)
	/* little endian: the first word in memory is the low half of the u64 */
	if (__builtin_constant_p(wl) && __builtin_constant_p(wh)) {
		*(__force u64 *)addr = ((__force u64)(wl) << 32 | (__force u64)(wh));
		return;
	}
#endif
#endif
	/* generic path: two separate 32-bit stores */
	addr[0] = wh;
	addr[1] = wl;
}

L
Linus Torvalds 已提交
403
/*
 * Fill @addr from four 32-bit big-endian words: @w1 goes to s6_addr32[0]
 * and @w4 to s6_addr32[3].  The words are stored pairwise through
 * __ipv6_addr_set_half().
 */
static inline void ipv6_addr_set(struct in6_addr *addr,
				     __be32 w1, __be32 w2,
				     __be32 w3, __be32 w4)
{
	__ipv6_addr_set_half(&addr->s6_addr32[0], w1, w2);
	__ipv6_addr_set_half(&addr->s6_addr32[2], w3, w4);
}

E
Eric Dumazet 已提交
411 412
static inline bool ipv6_addr_equal(const struct in6_addr *a1,
				   const struct in6_addr *a2)
L
Linus Torvalds 已提交
413
{
414 415 416 417 418 419
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	const unsigned long *ul1 = (const unsigned long *)a1;
	const unsigned long *ul2 = (const unsigned long *)a2;

	return ((ul1[0] ^ ul2[0]) | (ul1[1] ^ ul2[1])) == 0UL;
#else
E
Eric Dumazet 已提交
420 421 422 423
	return ((a1->s6_addr32[0] ^ a2->s6_addr32[0]) |
		(a1->s6_addr32[1] ^ a2->s6_addr32[1]) |
		(a1->s6_addr32[2] ^ a2->s6_addr32[2]) |
		(a1->s6_addr32[3] ^ a2->s6_addr32[3])) == 0;
424
#endif
L
Linus Torvalds 已提交
425 426
}

427 428 429 430 431
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
static inline bool __ipv6_prefix_equal64_half(const __be64 *a1,
					      const __be64 *a2,
					      unsigned int len)
{
432
	if (len && ((*a1 ^ *a2) & cpu_to_be64((~0UL) << (64 - len))))
433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451
		return false;
	return true;
}

static inline bool ipv6_prefix_equal(const struct in6_addr *addr1,
				     const struct in6_addr *addr2,
				     unsigned int prefixlen)
{
	const __be64 *a1 = (const __be64 *)addr1;
	const __be64 *a2 = (const __be64 *)addr2;

	if (prefixlen >= 64) {
		if (a1[0] ^ a2[0])
			return false;
		return __ipv6_prefix_equal64_half(a1 + 1, a2 + 1, prefixlen - 64);
	}
	return __ipv6_prefix_equal64_half(a1, a2, prefixlen);
}
#else
452 453 454
static inline bool ipv6_prefix_equal(const struct in6_addr *addr1,
				     const struct in6_addr *addr2,
				     unsigned int prefixlen)
L
Linus Torvalds 已提交
455
{
456 457
	const __be32 *a1 = addr1->s6_addr32;
	const __be32 *a2 = addr2->s6_addr32;
458
	unsigned int pdw, pbi;
L
Linus Torvalds 已提交
459 460 461 462

	/* check complete u32 in prefix */
	pdw = prefixlen >> 5;
	if (pdw && memcmp(a1, a2, pdw << 2))
E
Eric Dumazet 已提交
463
		return false;
L
Linus Torvalds 已提交
464 465 466 467

	/* check incomplete u32 in prefix */
	pbi = prefixlen & 0x1f;
	if (pbi && ((a1[pdw] ^ a2[pdw]) & htonl((0xffffffff) << (32 - pbi))))
E
Eric Dumazet 已提交
468
		return false;
L
Linus Torvalds 已提交
469

E
Eric Dumazet 已提交
470
	return true;
L
Linus Torvalds 已提交
471
}
472
#endif
L
Linus Torvalds 已提交
473

474 475
struct inet_frag_queue;

476 477 478
enum ip6_defrag_users {
	IP6_DEFRAG_LOCAL_DELIVER,
	IP6_DEFRAG_CONNTRACK_IN,
479
	__IP6_DEFRAG_CONNTRACK_IN	= IP6_DEFRAG_CONNTRACK_IN + USHRT_MAX,
480
	IP6_DEFRAG_CONNTRACK_OUT,
481
	__IP6_DEFRAG_CONNTRACK_OUT	= IP6_DEFRAG_CONNTRACK_OUT + USHRT_MAX,
482
	IP6_DEFRAG_CONNTRACK_BRIDGE_IN,
483
	__IP6_DEFRAG_CONNTRACK_BRIDGE_IN = IP6_DEFRAG_CONNTRACK_BRIDGE_IN + USHRT_MAX,
484 485
};

486 487
struct ip6_create_arg {
	__be32 id;
488
	u32 user;
489 490
	const struct in6_addr *src;
	const struct in6_addr *dst;
491
	u8 ecn;
492 493
};

494 495
void ip6_frag_init(struct inet_frag_queue *q, const void *a);
bool ip6_frag_match(const struct inet_frag_queue *q, const void *a);
496

497 498 499 500 501 502 503 504 505 506 507 508 509 510
/*
 *	Equivalent of ipv4 struct ip
 */
struct frag_queue {
	struct inet_frag_queue	q;

	__be32			id;		/* fragment id		*/
	u32			user;
	struct in6_addr		saddr;
	struct in6_addr		daddr;

	int			iif;
	unsigned int		csum;
	__u16			nhoffset;
511
	u8			ecn;
512 513 514 515 516
};

void ip6_expire_frag_queue(struct net *net, struct frag_queue *fq,
			   struct inet_frags *frags);

E
Eric Dumazet 已提交
517
static inline bool ipv6_addr_any(const struct in6_addr *a)
L
Linus Torvalds 已提交
518
{
519 520 521 522 523
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	const unsigned long *ul = (const unsigned long *)a;

	return (ul[0] | ul[1]) == 0UL;
#else
E
Eric Dumazet 已提交
524 525
	return (a->s6_addr32[0] | a->s6_addr32[1] |
		a->s6_addr32[2] | a->s6_addr32[3]) == 0;
526
#endif
L
Linus Torvalds 已提交
527 528
}

E
Eric Dumazet 已提交
529 530 531 532 533 534 535 536 537 538 539 540 541
static inline u32 ipv6_addr_hash(const struct in6_addr *a)
{
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	const unsigned long *ul = (const unsigned long *)a;
	unsigned long x = ul[0] ^ ul[1];

	return (u32)(x ^ (x >> 32));
#else
	return (__force u32)(a->s6_addr32[0] ^ a->s6_addr32[1] ^
			     a->s6_addr32[2] ^ a->s6_addr32[3]);
#endif
}

E
Eric Dumazet 已提交
542
/* more secured version of ipv6_addr_hash() */
543
static inline u32 __ipv6_addr_jhash(const struct in6_addr *a, const u32 initval)
E
Eric Dumazet 已提交
544 545 546 547 548 549
{
	u32 v = (__force u32)a->s6_addr32[0] ^ (__force u32)a->s6_addr32[1];

	return jhash_3words(v,
			    (__force u32)a->s6_addr32[2],
			    (__force u32)a->s6_addr32[3],
550
			    initval);
E
Eric Dumazet 已提交
551 552
}

E
Eric Dumazet 已提交
553
static inline bool ipv6_addr_loopback(const struct in6_addr *a)
554
{
555
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
556
	const __be64 *be = (const __be64 *)a;
557

558
	return (be[0] | (be[1] ^ cpu_to_be64(1))) == 0UL;
559
#else
E
Eric Dumazet 已提交
560
	return (a->s6_addr32[0] | a->s6_addr32[1] |
561
		a->s6_addr32[2] | (a->s6_addr32[3] ^ cpu_to_be32(1))) == 0;
562
#endif
563 564
}

565 566 567 568
/*
 * Note that we must __force cast these to unsigned long to make sparse happy,
 * since all of the endian-annotated types are fixed size regardless of arch.
 */
E
Eric Dumazet 已提交
569
static inline bool ipv6_addr_v4mapped(const struct in6_addr *a)
B
Brian Haley 已提交
570
{
571 572
	return (
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
573
		*(unsigned long *)a |
574
#else
575
		(__force unsigned long)(a->s6_addr32[0] | a->s6_addr32[1]) |
576
#endif
577 578
		(__force unsigned long)(a->s6_addr32[2] ^
					cpu_to_be32(0x0000ffff))) == 0UL;
B
Brian Haley 已提交
579 580
}

581 582 583 584
/*
 * Check for a RFC 4843 ORCHID address
 * (Overlay Routable Cryptographic Hash Identifiers)
 */
E
Eric Dumazet 已提交
585
static inline bool ipv6_addr_orchid(const struct in6_addr *a)
586
{
E
Eric Dumazet 已提交
587
	return (a->s6_addr32[0] & htonl(0xfffffff0)) == htonl(0x20010010);
588 589
}

590 591 592 593 594
static inline bool ipv6_addr_is_multicast(const struct in6_addr *addr)
{
	return (addr->s6_addr32[0] & htonl(0xFF000000)) == htonl(0xFF000000);
}

595 596 597 598 599 600 601 602 603
/*
 * Build in @v4mapped the address whose four 32-bit words are
 * 0, 0, big-endian 0x0000FFFF and @addr.
 */
static inline void ipv6_addr_set_v4mapped(const __be32 addr,
					  struct in6_addr *v4mapped)
{
	/* constants are passed directly so ipv6_addr_set() can fold them */
	ipv6_addr_set(v4mapped, 0, 0, htonl(0x0000FFFF), addr);
}

604 605 606 607
/*
 * find the first different bit between two addresses
 * length of address must be a multiple of 32bits
 */
608
static inline int __ipv6_addr_diff32(const void *token1, const void *token2, int addrlen)
609
{
610
	const __be32 *a1 = token1, *a2 = token2;
611 612 613 614 615
	int i;

	addrlen >>= 2;

	for (i = 0; i < addrlen; i++) {
616 617
		__be32 xb = a1[i] ^ a2[i];
		if (xb)
618
			return i * 32 + 31 - __fls(ntohl(xb));
619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636
	}

	/*
	 *	we should *never* get to this point since that 
	 *	would mean the addrs are equal
	 *
	 *	However, we do get to it 8) And exacly, when
	 *	addresses are equal 8)
	 *
	 *	ip route add 1111::/128 via ...
	 *	ip route add 1111::/64 via ...
	 *	and we are here.
	 *
	 *	Ideally, this function should stop comparison
	 *	at prefix length. It does not, but it is still OK,
	 *	if returned value is greater than prefix length.
	 *					--ANK (980803)
	 */
E
Eric Dumazet 已提交
637
	return addrlen << 5;
638 639
}

640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
/*
 * 64-bit counterpart of __ipv6_addr_diff32(): walks the two tokens as
 * 64-bit big-endian words.  @addrlen is in bytes.  Returns the bit position
 * of the first difference (assuming __fls() yields the index of the most
 * significant set bit), or the number of bits examined when no word
 * differs.
 */
static inline int __ipv6_addr_diff64(const void *token1, const void *token2, int addrlen)
{
	const __be64 *lhs = token1;
	const __be64 *rhs = token2;
	const int nwords = addrlen >> 3;
	int idx = 0;

	while (idx < nwords) {
		const __be64 delta = lhs[idx] ^ rhs[idx];

		if (delta)
			return idx * 64 + 63 - __fls(be64_to_cpu(delta));
		idx++;
	}

	return nwords << 6;
}
#endif

/*
 * Find the first differing bit between two tokens of @addrlen bytes.
 *
 * Dispatches to __ipv6_addr_diff64() on 64-bit builds with efficient
 * unaligned access, but only when @addrlen is a compile-time constant and a
 * multiple of 8; every other case goes through __ipv6_addr_diff32().
 */
static inline int __ipv6_addr_diff(const void *token1, const void *token2, int addrlen)
{
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	/* constant length that is a whole number of 64-bit words */
	if (__builtin_constant_p(addrlen) && !(addrlen & 7))
		return __ipv6_addr_diff64(token1, token2, addrlen);
#endif
	return __ipv6_addr_diff32(token1, token2, addrlen);
}

667 668 669 670 671
static inline int ipv6_addr_diff(const struct in6_addr *a1, const struct in6_addr *a2)
{
	return __ipv6_addr_diff(a1, a2, sizeof(struct in6_addr));
}

672
int ip6_dst_hoplimit(struct dst_entry *dst);
673

674 675 676 677 678 679 680 681 682 683 684 685 686 687
/*
 * Pick the hop limit for a packet described by @fl6.
 *
 * The per-socket value is np->mcast_hops for a multicast destination and
 * np->hop_limit otherwise.  A negative per-socket value means "not set", in
 * which case ip6_dst_hoplimit(@dst) supplies the result.
 */
static inline int ip6_sk_dst_hoplimit(struct ipv6_pinfo *np, struct flowi6 *fl6,
				      struct dst_entry *dst)
{
	const int hlimit = ipv6_addr_is_multicast(&fl6->daddr) ?
				np->mcast_hops : np->hop_limit;

	if (hlimit >= 0)
		return hlimit;

	return ip6_dst_hoplimit(dst);
}

688
#if IS_ENABLED(CONFIG_IPV6)
689 690 691 692 693 694 695 696 697 698 699 700 701 702
static inline void ip6_set_txhash(struct sock *sk)
{
	struct inet_sock *inet = inet_sk(sk);
	struct ipv6_pinfo *np = inet6_sk(sk);
	struct flow_keys keys;

	keys.src = (__force __be32)ipv6_addr_hash(&np->saddr);
	keys.dst = (__force __be32)ipv6_addr_hash(&sk->sk_v6_daddr);
	keys.port16[0] = inet->inet_sport;
	keys.port16[1] = inet->inet_dport;

	sk->sk_txhash = flow_hash_from_keys(&keys);
}

703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721
/*
 * Return the flow label to put into an outgoing packet.
 *
 * A non-zero @flowlabel is returned unchanged.  Otherwise, when either
 * @autolabel or the per-namespace auto_flowlabels sysctl is set, a label is
 * derived from skb_get_hash(@skb).  If neither is set, zero is returned.
 */
static inline __be32 ip6_make_flowlabel(struct net *net, struct sk_buff *skb,
					__be32 flowlabel, bool autolabel)
{
	if (!flowlabel && (autolabel || net->ipv6.sysctl.auto_flowlabels)) {
		/* the skb hash is a host-order value, not a __be32 */
		u32 hash;

		hash = skb_get_hash(skb);

		/* Since this is being sent on the wire obfuscate hash a bit
		 * to minimize possibility that any useful information to an
		 * attacker is leaked. Only lower 20 bits are relevant.
		 */
		hash ^= hash >> 12;

		/* reinterpret the bits as-is; no byte swap is intended */
		flowlabel = (__force __be32)hash & IPV6_FLOWLABEL_MASK;
	}

	return flowlabel;
}
722 723 724 725 726 727 728 729 730
#else
/* CONFIG_IPV6 disabled: no tx hash is computed. */
static inline void ip6_set_txhash(struct sock *sk)
{
}

/* CONFIG_IPV6 disabled: the caller's flow label is handed back untouched. */
static inline __be32 ip6_make_flowlabel(struct net *net, struct sk_buff *skb,
					__be32 flowlabel, bool autolabel)
{
	return flowlabel;
}
#endif

731

732 733 734 735 736 737
/*
 *	Header manipulation
 */
/*
 * Write the first 32-bit word of the IPv6 header @hdr: 0x6 in the top
 * nibble, @tclass shifted up by IPV6_TCLASS_SHIFT, and the already
 * big-endian @flowlabel OR-ed in.
 */
static inline void ip6_flow_hdr(struct ipv6hdr *hdr, unsigned int tclass,
				__be32 flowlabel)
{
	*(__be32 *)hdr = htonl(0x60000000 | (tclass << IPV6_TCLASS_SHIFT)) |
			 flowlabel;
}

741 742 743 744 745
static inline __be32 ip6_flowinfo(const struct ipv6hdr *hdr)
{
	return *(__be32 *)hdr & IPV6_FLOWINFO_MASK;
}

F
Florent Fourcot 已提交
746 747 748 749 750
static inline __be32 ip6_flowlabel(const struct ipv6hdr *hdr)
{
	return *(__be32 *)hdr & IPV6_FLOWLABEL_MASK;
}

751 752 753 754
/*
 * Extract the traffic class from a network-order flowinfo word: mask with
 * IPV6_TCLASS_MASK, convert to host order, shift down by IPV6_TCLASS_SHIFT.
 */
static inline u8 ip6_tclass(__be32 flowinfo)
{
	const __be32 tclass_bits = flowinfo & IPV6_TCLASS_MASK;

	return ntohl(tclass_bits) >> IPV6_TCLASS_SHIFT;
}
L
Linus Torvalds 已提交
755 756 757 758 759 760 761 762
/*
 *	Prototypes exported by ipv6
 */

/*
 *	rcv function (called from netdevice level)
 */

763 764
int ipv6_rcv(struct sk_buff *skb, struct net_device *dev,
	     struct packet_type *pt, struct net_device *orig_dev);
L
Linus Torvalds 已提交
765

766
int ip6_rcv_finish(struct sk_buff *skb);
767

L
Linus Torvalds 已提交
768 769 770
/*
 *	upper-layer output functions
 */
771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788
int ip6_xmit(struct sock *sk, struct sk_buff *skb, struct flowi6 *fl6,
	     struct ipv6_txoptions *opt, int tclass);

int ip6_find_1stfragopt(struct sk_buff *skb, u8 **nexthdr);

int ip6_append_data(struct sock *sk,
		    int getfrag(void *from, char *to, int offset, int len,
				int odd, struct sk_buff *skb),
		    void *from, int length, int transhdrlen, int hlimit,
		    int tclass, struct ipv6_txoptions *opt, struct flowi6 *fl6,
		    struct rt6_info *rt, unsigned int flags, int dontfrag);

int ip6_push_pending_frames(struct sock *sk);

void ip6_flush_pending_frames(struct sock *sk);

int ip6_dst_lookup(struct sock *sk, struct dst_entry **dst, struct flowi6 *fl6);
struct dst_entry *ip6_dst_lookup_flow(struct sock *sk, struct flowi6 *fl6,
789
				      const struct in6_addr *final_dst);
790
struct dst_entry *ip6_sk_dst_lookup_flow(struct sock *sk, struct flowi6 *fl6,
791
					 const struct in6_addr *final_dst);
792 793
struct dst_entry *ip6_blackhole_route(struct net *net,
				      struct dst_entry *orig_dst);
L
Linus Torvalds 已提交
794 795 796 797 798

/*
 *	skb processing functions
 */

799
int ip6_output(struct sock *sk, struct sk_buff *skb);
800 801 802
int ip6_forward(struct sk_buff *skb);
int ip6_input(struct sk_buff *skb);
int ip6_mc_input(struct sk_buff *skb);
L
Linus Torvalds 已提交
803

804 805
int __ip6_local_out(struct sk_buff *skb);
int ip6_local_out(struct sk_buff *skb);
H
Herbert Xu 已提交
806

L
Linus Torvalds 已提交
807 808 809 810
/*
 *	Extension header (options) processing
 */

811 812 813 814
void ipv6_push_nfrag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt,
			  u8 *proto, struct in6_addr **daddr_p);
void ipv6_push_frag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt,
			 u8 *proto);
L
Linus Torvalds 已提交
815

816 817
int ipv6_skip_exthdr(const struct sk_buff *, int start, u8 *nexthdrp,
		     __be16 *frag_offp);
L
Linus Torvalds 已提交
818

819
bool ipv6_ext_hdr(u8 nexthdr);
L
Linus Torvalds 已提交
820

821
/*
 * Single-bit flags.
 * NOTE(review): presumably exchanged through the fragflg argument of
 * ipv6_find_hdr() - confirm.
 */
enum {
	IP6_FH_F_FRAG		= (1 << 0),
	IP6_FH_F_AUTH		= (1 << 1),
	IP6_FH_F_SKIP_RH	= (1 << 2),
};

/* find specified header and get offset to it */
828 829
int ipv6_find_hdr(const struct sk_buff *skb, unsigned int *offset, int target,
		  unsigned short *fragoff, int *fragflg);
830

831
int ipv6_find_tlv(struct sk_buff *skb, int offset, int type);
832

833 834 835
struct in6_addr *fl6_update_dst(struct flowi6 *fl6,
				const struct ipv6_txoptions *opt,
				struct in6_addr *orig);
836

L
Linus Torvalds 已提交
837 838 839 840
/*
 *	socket options (ipv6_sockglue.c)
 */

841 842 843 844 845 846 847 848 849 850
int ipv6_setsockopt(struct sock *sk, int level, int optname,
		    char __user *optval, unsigned int optlen);
int ipv6_getsockopt(struct sock *sk, int level, int optname,
		    char __user *optval, int __user *optlen);
int compat_ipv6_setsockopt(struct sock *sk, int level, int optname,
			   char __user *optval, unsigned int optlen);
int compat_ipv6_getsockopt(struct sock *sk, int level, int optname,
			   char __user *optval, int __user *optlen);

int ip6_datagram_connect(struct sock *sk, struct sockaddr *addr, int addr_len);
851 852
int ip6_datagram_connect_v6_only(struct sock *sk, struct sockaddr *addr,
				 int addr_len);
853

854 855 856 857
int ipv6_recv_error(struct sock *sk, struct msghdr *msg, int len,
		    int *addr_len);
int ipv6_recv_rxpmtu(struct sock *sk, struct msghdr *msg, int len,
		     int *addr_len);
858 859 860 861 862 863 864 865 866 867 868 869
void ipv6_icmp_error(struct sock *sk, struct sk_buff *skb, int err, __be16 port,
		     u32 info, u8 *payload);
void ipv6_local_error(struct sock *sk, int err, struct flowi6 *fl6, u32 info);
void ipv6_local_rxpmtu(struct sock *sk, struct flowi6 *fl6, u32 mtu);

int inet6_release(struct socket *sock);
int inet6_bind(struct socket *sock, struct sockaddr *uaddr, int addr_len);
int inet6_getname(struct socket *sock, struct sockaddr *uaddr, int *uaddr_len,
		  int peer);
int inet6_ioctl(struct socket *sock, unsigned int cmd, unsigned long arg);

int inet6_hash_connect(struct inet_timewait_death_row *death_row,
870 871
			      struct sock *sk);

L
Linus Torvalds 已提交
872 873 874
/*
 * reassembly.c
 */
875 876
extern const struct proto_ops inet6_stream_ops;
extern const struct proto_ops inet6_dgram_ops;
877

878 879 880
struct group_source_req;
struct group_filter;

881 882 883 884 885
int ip6_mc_source(int add, int omode, struct sock *sk,
		  struct group_source_req *pgsr);
int ip6_mc_msfilter(struct sock *sk, struct group_filter *gsf);
int ip6_mc_msfget(struct sock *sk, struct group_filter *gsf,
		  struct group_filter __user *optval, int __user *optlen);
886 887

#ifdef CONFIG_PROC_FS
888 889 890 891 892 893 894 895 896 897 898 899 900 901
int ac6_proc_init(struct net *net);
void ac6_proc_exit(struct net *net);
int raw6_proc_init(void);
void raw6_proc_exit(void);
int tcp6_proc_init(struct net *net);
void tcp6_proc_exit(struct net *net);
int udp6_proc_init(struct net *net);
void udp6_proc_exit(struct net *net);
int udplite6_proc_init(void);
void udplite6_proc_exit(void);
int ipv6_misc_proc_init(void);
void ipv6_misc_proc_exit(void);
int snmp6_register_dev(struct inet6_dev *idev);
int snmp6_unregister_dev(struct inet6_dev *idev);
902

903
#else
904 905 906 907
static inline int ac6_proc_init(struct net *net) { return 0; }
static inline void ac6_proc_exit(struct net *net) { }
static inline int snmp6_register_dev(struct inet6_dev *idev) { return 0; }
static inline int snmp6_unregister_dev(struct inet6_dev *idev) { return 0; }
908
#endif
L
Linus Torvalds 已提交
909

910
#ifdef CONFIG_SYSCTL
911
extern struct ctl_table ipv6_route_table_template[];
L
Linus Torvalds 已提交
912

913 914 915 916
struct ctl_table *ipv6_icmp_sysctl_init(struct net *net);
struct ctl_table *ipv6_route_sysctl_init(struct net *net);
int ipv6_sysctl_register(void);
void ipv6_sysctl_unregister(void);
917
#endif
L
Linus Torvalds 已提交
918

919
#endif /* _NET_IPV6_H */