ipv6.h 25.5 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
/*
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */

#ifndef _NET_IPV6_H
#define _NET_IPV6_H

#include <linux/ipv6.h>
#include <linux/hardirq.h>
E
Eric Dumazet 已提交
18
#include <linux/jhash.h>
19
#include <net/if_inet6.h>
L
Linus Torvalds 已提交
20 21
#include <net/ndisc.h>
#include <net/flow.h>
22
#include <net/flow_keys.h>
L
Linus Torvalds 已提交
23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38
#include <net/snmp.h>

#define SIN6_LEN_RFC2133	24

#define IPV6_MAXPLEN		65535

/*
 *	NextHeader field of IPv6 header
 */

#define NEXTHDR_HOP		0	/* Hop-by-hop option header. */
#define NEXTHDR_TCP		6	/* TCP segment. */
#define NEXTHDR_UDP		17	/* UDP message. */
#define NEXTHDR_IPV6		41	/* IPv6 in IPv6 */
#define NEXTHDR_ROUTING		43	/* Routing header. */
#define NEXTHDR_FRAGMENT	44	/* Fragmentation/reassembly header. */
X
xeb@mail.ru 已提交
39
#define NEXTHDR_GRE		47	/* GRE header. */
L
Linus Torvalds 已提交
40 41 42 43 44
#define NEXTHDR_ESP		50	/* Encapsulating security payload. */
#define NEXTHDR_AUTH		51	/* Authentication header. */
#define NEXTHDR_ICMP		58	/* ICMP for IPv6. */
#define NEXTHDR_NONE		59	/* No next header */
#define NEXTHDR_DEST		60	/* Destination options header. */
J
Joe Stringer 已提交
45
#define NEXTHDR_SCTP		132	/* SCTP message. */
46
#define NEXTHDR_MOBILITY	135	/* Mobility header. */
L
Linus Torvalds 已提交
47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92

#define NEXTHDR_MAX		255



#define IPV6_DEFAULT_HOPLIMIT   64
#define IPV6_DEFAULT_MCASTHOPS	1

/*
 *	Addr type
 *	
 *	type	-	unicast | multicast
 *	scope	-	local	| site	    | global
 *	v4	-	compat
 *	v4mapped
 *	any
 *	loopback
 */

#define IPV6_ADDR_ANY		0x0000U

#define IPV6_ADDR_UNICAST      	0x0001U	
#define IPV6_ADDR_MULTICAST    	0x0002U	

#define IPV6_ADDR_LOOPBACK	0x0010U
#define IPV6_ADDR_LINKLOCAL	0x0020U
#define IPV6_ADDR_SITELOCAL	0x0040U

#define IPV6_ADDR_COMPATv4	0x0080U

#define IPV6_ADDR_SCOPE_MASK	0x00f0U

#define IPV6_ADDR_MAPPED	0x1000U

/*
 *	Addr scopes
 */
#define IPV6_ADDR_MC_SCOPE(a)	\
	((a)->s6_addr[1] & 0x0f)	/* nonstandard */
#define __IPV6_ADDR_SCOPE_INVALID	-1
#define IPV6_ADDR_SCOPE_NODELOCAL	0x01
#define IPV6_ADDR_SCOPE_LINKLOCAL	0x02
#define IPV6_ADDR_SCOPE_SITELOCAL	0x05
#define IPV6_ADDR_SCOPE_ORGLOCAL	0x08
#define IPV6_ADDR_SCOPE_GLOBAL		0x0e

93 94 95 96 97 98 99 100 101 102
/*
 *	Addr flags
 */
#define IPV6_ADDR_MC_FLAG_TRANSIENT(a)	\
	((a)->s6_addr[1] & 0x10)
#define IPV6_ADDR_MC_FLAG_PREFIX(a)	\
	((a)->s6_addr[1] & 0x20)
#define IPV6_ADDR_MC_FLAG_RENDEZVOUS(a)	\
	((a)->s6_addr[1] & 0x40)

L
Linus Torvalds 已提交
103 104 105 106 107
/*
 *	fragmentation header
 */

struct frag_hdr {
A
Al Viro 已提交
108 109 110 111
	__u8	nexthdr;
	__u8	reserved;
	__be16	frag_off;
	__be32	identification;
L
Linus Torvalds 已提交
112 113
};

114 115
#define	IP6_MF		0x0001
#define	IP6_OFFSET	0xFFF8
L
Linus Torvalds 已提交
116

117 118 119
/*
 * Evaluates to @mark when the fwmark_reflect sysctl of @net is non-zero,
 * and to 0 otherwise.
 */
#define IP6_REPLY_MARK(net, mark) \
	((net)->ipv6.sysctl.fwmark_reflect ? (mark) : 0)

L
Linus Torvalds 已提交
120 121 122 123
#include <net/sock.h>

/* sysctls */
extern int sysctl_mld_max_msf;
124
extern int sysctl_mld_qrv;
125

126
/*
 * Increment counter @field of the @statname MIB.
 *
 * The namespace-wide copy ((net)->mib.<statname>_statistics) is always
 * updated; the per-device copy ((idev)->stats.<statname>) only when @idev
 * is non-NULL. @modifier is token-pasted onto SNMP_INC_STATS to select
 * the variant to call. @idev is evaluated exactly once.
 */
#define _DEVINC(net, statname, modifier, idev, field)			\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_INC_STATS##modifier((_idev)->stats.statname, (field)); \
	SNMP_INC_STATS##modifier((net)->mib.statname##_statistics, (field));\
})
133

134 135 136 137 138 139 140 141 142
/*
 * Increment counter @field of the @statname MIB.
 *
 * per device counters are atomic_long_t: the device copy
 * ((idev)->stats.<statname>dev) is bumped with SNMP_INC_STATS_ATOMIC_LONG
 * and skipped when @idev is NULL. The namespace copy
 * ((net)->mib.<statname>_statistics) goes through SNMP_INC_STATS<modifier>.
 */
#define _DEVINCATOMIC(net, statname, modifier, idev, field)		\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_INC_STATS_ATOMIC_LONG((_idev)->stats.statname##dev, (field)); \
	SNMP_INC_STATS##modifier((net)->mib.statname##_statistics, (field));\
})

143 144 145 146 147 148 149 150 151
/*
 * Increment counter @field of the @statname MIB.
 *
 * per device and per net counters are atomic_long_t: both the device copy
 * ((idev)->stats.<statname>dev, skipped when @idev is NULL) and the
 * namespace copy ((net)->mib.<statname>_statistics) are bumped with
 * SNMP_INC_STATS_ATOMIC_LONG.
 */
#define _DEVINC_ATOMIC_ATOMIC(net, statname, idev, field)		\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_INC_STATS_ATOMIC_LONG((_idev)->stats.statname##dev, (field)); \
	SNMP_INC_STATS_ATOMIC_LONG((net)->mib.statname##_statistics, (field));\
})

152
/*
 * Add @val to counter @field of the @statname MIB.
 *
 * The namespace-wide copy ((net)->mib.<statname>_statistics) is always
 * updated; the per-device copy ((idev)->stats.<statname>) only when @idev
 * is non-NULL. @modifier is token-pasted onto SNMP_ADD_STATS to select
 * the variant to call. @idev is evaluated exactly once.
 */
#define _DEVADD(net, statname, modifier, idev, field, val)		\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_ADD_STATS##modifier((_idev)->stats.statname, (field), (val)); \
	SNMP_ADD_STATS##modifier((net)->mib.statname##_statistics, (field), (val));\
})

160 161 162 163 164 165 166 167
/*
 * Apply SNMP_UPD_PO_STATS<modifier> with @field and @val to the @statname
 * MIB: always to the namespace copy ((net)->mib.<statname>_statistics) and,
 * when @idev is non-NULL, to the device copy ((idev)->stats.<statname>).
 *
 * NOTE(review): unlike the sibling macros, @field is forwarded without
 * parentheses - presumably SNMP_UPD_PO_STATS token-pastes it; confirm
 * before "fixing" this.
 */
#define _DEVUPD(net, statname, modifier, idev, field, val)		\
({									\
	struct inet6_dev *_idev = (idev);				\
	if (likely(_idev != NULL))					\
		SNMP_UPD_PO_STATS##modifier((_idev)->stats.statname, field, (val)); \
	SNMP_UPD_PO_STATS##modifier((net)->mib.statname##_statistics, field, (val));\
})

168 169
/* MIBs */

170
/*
 * Front-ends over the _DEV* helpers.
 *
 * IP6_*     update the "ipv6" MIB through the 64 / 64_BH SNMP variants.
 * ICMP6_*   update the "icmpv6" MIB; the device copy is atomic.
 * ICMP6MSG* update the "icmpv6msg" MIB; both copies are atomic. The OUT
 *           variants use slot (field) + 256, the IN variant uses slot
 *           (field) directly.
 */
#define IP6_INC_STATS(net, idev,field)		\
		_DEVINC(net, ipv6, 64, idev, field)
#define IP6_INC_STATS_BH(net, idev,field)	\
		_DEVINC(net, ipv6, 64_BH, idev, field)
#define IP6_ADD_STATS(net, idev,field,val)	\
		_DEVADD(net, ipv6, 64, idev, field, val)
#define IP6_ADD_STATS_BH(net, idev,field,val)	\
		_DEVADD(net, ipv6, 64_BH, idev, field, val)
#define IP6_UPD_PO_STATS(net, idev,field,val)   \
		_DEVUPD(net, ipv6, 64, idev, field, val)
#define IP6_UPD_PO_STATS_BH(net, idev,field,val)   \
		_DEVUPD(net, ipv6, 64_BH, idev, field, val)
#define ICMP6_INC_STATS(net, idev, field)	\
		_DEVINCATOMIC(net, icmpv6, , idev, field)
#define ICMP6_INC_STATS_BH(net, idev, field)	\
		_DEVINCATOMIC(net, icmpv6, _BH, idev, field)

/*
 * @field is parenthesized before the offset is added so that an argument
 * such as "a ? b : c" is offset as a whole rather than only its last operand.
 */
#define ICMP6MSGOUT_INC_STATS(net, idev, field)		\
	_DEVINC_ATOMIC_ATOMIC(net, icmpv6msg, idev, (field) + 256)
#define ICMP6MSGOUT_INC_STATS_BH(net, idev, field)	\
	_DEVINC_ATOMIC_ATOMIC(net, icmpv6msg, idev, (field) + 256)
#define ICMP6MSGIN_INC_STATS_BH(net, idev, field)	\
	_DEVINC_ATOMIC_ATOMIC(net, icmpv6msg, idev, field)
193

E
Eric Dumazet 已提交
194
/*
 * Node of a singly linked chain (see @next) that pairs a socket with an
 * integer selector and an optional per-socket destructor callback.
 */
struct ip6_ra_chain {
	struct ip6_ra_chain	*next;
	struct sock		*sk;
	int			sel;
	void			(*destructor)(struct sock *);
};

extern struct ip6_ra_chain	*ip6_ra_chain;
extern rwlock_t ip6_ra_lock;

/*
   This structure is prepared by protocol, when parsing
   ancillary data and passed to IPv6.
 */

E
Eric Dumazet 已提交
209
struct ipv6_txoptions {
L
Linus Torvalds 已提交
210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225
	/* Length of this structure */
	int			tot_len;

	/* length of extension headers   */

	__u16			opt_flen;	/* after fragment hdr */
	__u16			opt_nflen;	/* before fragment hdr */

	struct ipv6_opt_hdr	*hopopt;
	struct ipv6_opt_hdr	*dst0opt;
	struct ipv6_rt_hdr	*srcrt;	/* Routing Header */
	struct ipv6_opt_hdr	*dst1opt;

	/* Option buffer, as read by IPV6_PKTOPTIONS, starts here. */
};

E
Eric Dumazet 已提交
226
struct ip6_flowlabel {
227
	struct ip6_flowlabel __rcu *next;
A
Al Viro 已提交
228
	__be32			label;
229
	atomic_t		users;
L
Linus Torvalds 已提交
230 231 232
	struct in6_addr		dst;
	struct ipv6_txoptions	*opt;
	unsigned long		linger;
233
	struct rcu_head		rcu;
L
Linus Torvalds 已提交
234
	u8			share;
235 236 237 238
	union {
		struct pid *pid;
		kuid_t uid;
	} owner;
L
Linus Torvalds 已提交
239 240
	unsigned long		lastuse;
	unsigned long		expires;
241
	struct net		*fl_net;
L
Linus Torvalds 已提交
242 243
};

244 245
#define IPV6_FLOWINFO_MASK	cpu_to_be32(0x0FFFFFFF)
#define IPV6_FLOWLABEL_MASK	cpu_to_be32(0x000FFFFF)
246
#define IPV6_TCLASS_MASK (IPV6_FLOWINFO_MASK & ~IPV6_FLOWLABEL_MASK)
247
#define IPV6_TCLASS_SHIFT	20
L
Linus Torvalds 已提交
248

E
Eric Dumazet 已提交
249
struct ipv6_fl_socklist {
250 251 252
	struct ipv6_fl_socklist	__rcu	*next;
	struct ip6_flowlabel		*fl;
	struct rcu_head			rcu;
L
Linus Torvalds 已提交
253 254
};

255 256 257 258 259 260
struct ip6_flowlabel *fl6_sock_lookup(struct sock *sk, __be32 label);
struct ipv6_txoptions *fl6_merge_options(struct ipv6_txoptions *opt_space,
					 struct ip6_flowlabel *fl,
					 struct ipv6_txoptions *fopt);
void fl6_free_socklist(struct sock *sk);
int ipv6_flowlabel_opt(struct sock *sk, char __user *optval, int optlen);
261 262
int ipv6_flowlabel_opt_get(struct sock *sk, struct in6_flowlabel_req *freq,
			   int flags);
263 264
int ip6_flowlabel_init(void);
void ip6_flowlabel_cleanup(void);
L
Linus Torvalds 已提交
265 266 267 268 269 270 271

/* Drop one reference from @fl's users counter; a NULL @fl is a no-op. */
static inline void fl6_sock_release(struct ip6_flowlabel *fl)
{
	if (!fl)
		return;

	atomic_dec(&fl->users);
}

272
void icmpv6_notify(struct sk_buff *skb, u8 type, u8 code, __be32 info);
273

274 275 276
int icmpv6_push_pending_frames(struct sock *sk, struct flowi6 *fl6,
			       struct icmp6hdr *thdr, int len);

277
int ip6_ra_control(struct sock *sk, int sel);
L
Linus Torvalds 已提交
278

279
int ipv6_parse_hopopts(struct sk_buff *skb);
L
Linus Torvalds 已提交
280

281 282 283 284 285 286 287
struct ipv6_txoptions *ipv6_dup_options(struct sock *sk,
					struct ipv6_txoptions *opt);
struct ipv6_txoptions *ipv6_renew_options(struct sock *sk,
					  struct ipv6_txoptions *opt,
					  int newtype,
					  struct ipv6_opt_hdr __user *newopt,
					  int newoptlen);
288 289
struct ipv6_txoptions *ipv6_fixup_options(struct ipv6_txoptions *opt_space,
					  struct ipv6_txoptions *opt);
L
Linus Torvalds 已提交
290

291
bool ipv6_opt_accepted(const struct sock *sk, const struct sk_buff *skb);
292

293 294 295 296 297 298 299 300 301
/*
 * Tell whether router advertisements are accepted on @idev.
 *
 * With forwarding enabled, RAs are only accepted in the special hybrid
 * mode (accept_ra == 2); without forwarding any non-zero accept_ra
 * enables them.
 */
static inline bool ipv6_accept_ra(struct inet6_dev *idev)
{
	if (idev->cnf.forwarding)
		return idev->cnf.accept_ra == 2;

	return idev->cnf.accept_ra;
}

302 303 304
#if IS_ENABLED(CONFIG_IPV6)
/* Return sum_frag_mem_limit() for the IPv6 fragment state of @net. */
static inline int ip6_frag_mem(struct net *net)
{
	return sum_frag_mem_limit(&net->ipv6.frags);
}
#endif
L
Linus Torvalds 已提交
308

309 310
#define IPV6_FRAG_HIGH_THRESH	(4 * 1024*1024)	/* 4194304 */
#define IPV6_FRAG_LOW_THRESH	(3 * 1024*1024)	/* 3145728 */
311
#define IPV6_FRAG_TIMEOUT	(60 * HZ)	/* 60 seconds */
L
Linus Torvalds 已提交
312

313
int __ipv6_addr_type(const struct in6_addr *addr);
314 315 316 317
/* Return the low 16 bits of __ipv6_addr_type(@addr). */
static inline int ipv6_addr_type(const struct in6_addr *addr)
{
	const int full_type = __ipv6_addr_type(addr);

	return full_type & 0xffff;
}
L
Linus Torvalds 已提交
318 319 320

static inline int ipv6_addr_scope(const struct in6_addr *addr)
{
321 322 323 324 325
	return __ipv6_addr_type(addr) & IPV6_ADDR_SCOPE_MASK;
}

static inline int __ipv6_addr_src_scope(int type)
{
E
Eric Dumazet 已提交
326
	return (type == IPV6_ADDR_ANY) ? __IPV6_ADDR_SCOPE_INVALID : (type >> 16);
327 328 329 330 331
}

/* Source scope of @addr: __ipv6_addr_src_scope() of its full type word. */
static inline int ipv6_addr_src_scope(const struct in6_addr *addr)
{
	return __ipv6_addr_src_scope(__ipv6_addr_type(addr));
}

334 335 336 337 338 339 340 341 342 343 344 345
/*
 * Decide from an address type word whether a scope id is required.
 *
 * True for any type with IPV6_ADDR_LINKLOCAL set, and for multicast
 * types that also carry IPV6_ADDR_LOOPBACK or IPV6_ADDR_LINKLOCAL.
 */
static inline bool __ipv6_addr_needs_scope_id(int type)
{
	if (type & IPV6_ADDR_LINKLOCAL)
		return true;

	if (!(type & IPV6_ADDR_MULTICAST))
		return false;

	return (type & (IPV6_ADDR_LOOPBACK | IPV6_ADDR_LINKLOCAL)) != 0;
}

/* Return @iface when @addr's type needs a scope id, 0 otherwise. */
static inline __u32 ipv6_iface_scope_id(const struct in6_addr *addr, int iface)
{
	if (!__ipv6_addr_needs_scope_id(__ipv6_addr_type(addr)))
		return 0;

	return iface;
}

L
Linus Torvalds 已提交
346 347
/*
 * Byte-wise comparison of two addresses.
 * Returns the memcmp() result: 0 when equal, otherwise negative or
 * positive according to the first differing byte.
 */
static inline int ipv6_addr_cmp(const struct in6_addr *a1, const struct in6_addr *a2)
{
	return memcmp(a1, a2, sizeof(struct in6_addr));
}

351
static inline bool
352 353 354
ipv6_masked_addr_cmp(const struct in6_addr *a1, const struct in6_addr *m,
		     const struct in6_addr *a2)
{
355 356 357 358 359 360 361 362
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	const unsigned long *ul1 = (const unsigned long *)a1;
	const unsigned long *ulm = (const unsigned long *)m;
	const unsigned long *ul2 = (const unsigned long *)a2;

	return !!(((ul1[0] ^ ul2[0]) & ulm[0]) |
		  ((ul1[1] ^ ul2[1]) & ulm[1]));
#else
E
Eric Dumazet 已提交
363 364 365 366
	return !!(((a1->s6_addr32[0] ^ a2->s6_addr32[0]) & m->s6_addr32[0]) |
		  ((a1->s6_addr32[1] ^ a2->s6_addr32[1]) & m->s6_addr32[1]) |
		  ((a1->s6_addr32[2] ^ a2->s6_addr32[2]) & m->s6_addr32[2]) |
		  ((a1->s6_addr32[3] ^ a2->s6_addr32[3]) & m->s6_addr32[3]));
367
#endif
368 369
}

L
Linus Torvalds 已提交
370 371 372 373 374 375 376 377
/*
 * Store the first @plen bits of @addr in @pfx and clear the rest.
 *
 * @pfx is zeroed, the whole leading bytes are copied, and a trailing
 * partial byte (if any) is masked to its top (@plen % 8) bits.
 */
static inline void ipv6_addr_prefix(struct in6_addr *pfx,
				    const struct in6_addr *addr,
				    int plen)
{
	/* caller must guarantee 0 <= plen <= 128 */
	int o = plen >> 3,
	    b = plen & 0x7;

	memset(pfx->s6_addr, 0, sizeof(pfx->s6_addr));
	memcpy(pfx->s6_addr, addr, o);
	if (b != 0)
		pfx->s6_addr[o] = addr->s6_addr[o] & (0xff00 >> b);
}

384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403
/*
 * Write two consecutive 32-bit words: addr[0] = @wh, addr[1] = @wl.
 *
 * On 64-bit builds with efficient unaligned access, and only when both
 * values are compile-time constants, the pair is emitted as a single
 * 64-bit store; the word placed in the upper half depends on the
 * endianness so that the memory layout matches the two-store fallback.
 */
static inline void __ipv6_addr_set_half(__be32 *addr,
					__be32 wh, __be32 wl)
{
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
#if defined(__BIG_ENDIAN)
	if (__builtin_constant_p(wh) && __builtin_constant_p(wl)) {
		*(__force u64 *)addr = ((__force u64)(wh) << 32 | (__force u64)(wl));
		return;
	}
#elif defined(__LITTLE_ENDIAN)
	if (__builtin_constant_p(wl) && __builtin_constant_p(wh)) {
		*(__force u64 *)addr = ((__force u64)(wl) << 32 | (__force u64)(wh));
		return;
	}
#endif
#endif
	/* Generic path: two plain 32-bit stores. */
	addr[0] = wh;
	addr[1] = wl;
}

L
Linus Torvalds 已提交
404
/*
 * Fill @addr from four 32-bit words: @w1..@w4 land in s6_addr32[0..3],
 * written as two halves through __ipv6_addr_set_half().
 */
static inline void ipv6_addr_set(struct in6_addr *addr,
				     __be32 w1, __be32 w2,
				     __be32 w3, __be32 w4)
{
	__ipv6_addr_set_half(&addr->s6_addr32[0], w1, w2);
	__ipv6_addr_set_half(&addr->s6_addr32[2], w3, w4);
}

E
Eric Dumazet 已提交
412 413
static inline bool ipv6_addr_equal(const struct in6_addr *a1,
				   const struct in6_addr *a2)
L
Linus Torvalds 已提交
414
{
415 416 417 418 419 420
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	const unsigned long *ul1 = (const unsigned long *)a1;
	const unsigned long *ul2 = (const unsigned long *)a2;

	return ((ul1[0] ^ ul2[0]) | (ul1[1] ^ ul2[1])) == 0UL;
#else
E
Eric Dumazet 已提交
421 422 423 424
	return ((a1->s6_addr32[0] ^ a2->s6_addr32[0]) |
		(a1->s6_addr32[1] ^ a2->s6_addr32[1]) |
		(a1->s6_addr32[2] ^ a2->s6_addr32[2]) |
		(a1->s6_addr32[3] ^ a2->s6_addr32[3])) == 0;
425
#endif
L
Linus Torvalds 已提交
426 427
}

428 429 430 431 432
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
static inline bool __ipv6_prefix_equal64_half(const __be64 *a1,
					      const __be64 *a2,
					      unsigned int len)
{
433
	if (len && ((*a1 ^ *a2) & cpu_to_be64((~0UL) << (64 - len))))
434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452
		return false;
	return true;
}

static inline bool ipv6_prefix_equal(const struct in6_addr *addr1,
				     const struct in6_addr *addr2,
				     unsigned int prefixlen)
{
	const __be64 *a1 = (const __be64 *)addr1;
	const __be64 *a2 = (const __be64 *)addr2;

	if (prefixlen >= 64) {
		if (a1[0] ^ a2[0])
			return false;
		return __ipv6_prefix_equal64_half(a1 + 1, a2 + 1, prefixlen - 64);
	}
	return __ipv6_prefix_equal64_half(a1, a2, prefixlen);
}
#else
453 454 455
static inline bool ipv6_prefix_equal(const struct in6_addr *addr1,
				     const struct in6_addr *addr2,
				     unsigned int prefixlen)
L
Linus Torvalds 已提交
456
{
457 458
	const __be32 *a1 = addr1->s6_addr32;
	const __be32 *a2 = addr2->s6_addr32;
459
	unsigned int pdw, pbi;
L
Linus Torvalds 已提交
460 461 462 463

	/* check complete u32 in prefix */
	pdw = prefixlen >> 5;
	if (pdw && memcmp(a1, a2, pdw << 2))
E
Eric Dumazet 已提交
464
		return false;
L
Linus Torvalds 已提交
465 466 467 468

	/* check incomplete u32 in prefix */
	pbi = prefixlen & 0x1f;
	if (pbi && ((a1[pdw] ^ a2[pdw]) & htonl((0xffffffff) << (32 - pbi))))
E
Eric Dumazet 已提交
469
		return false;
L
Linus Torvalds 已提交
470

E
Eric Dumazet 已提交
471
	return true;
L
Linus Torvalds 已提交
472
}
473
#endif
L
Linus Torvalds 已提交
474

475 476
struct inet_frag_queue;

477 478 479
/*
 * Defragmentation user ids. Each CONNTRACK id is followed by a
 * double-underscore marker set to that id + USHRT_MAX, so the next id
 * starts after a range of USHRT_MAX + 1 values.
 */
enum ip6_defrag_users {
	IP6_DEFRAG_LOCAL_DELIVER,
	IP6_DEFRAG_CONNTRACK_IN,
	__IP6_DEFRAG_CONNTRACK_IN	= IP6_DEFRAG_CONNTRACK_IN + USHRT_MAX,
	IP6_DEFRAG_CONNTRACK_OUT,
	__IP6_DEFRAG_CONNTRACK_OUT	= IP6_DEFRAG_CONNTRACK_OUT + USHRT_MAX,
	IP6_DEFRAG_CONNTRACK_BRIDGE_IN,
	__IP6_DEFRAG_CONNTRACK_BRIDGE_IN = IP6_DEFRAG_CONNTRACK_BRIDGE_IN + USHRT_MAX,
};

487 488
struct ip6_create_arg {
	__be32 id;
489
	u32 user;
490 491
	const struct in6_addr *src;
	const struct in6_addr *dst;
492
	u8 ecn;
493 494
};

495 496
void ip6_frag_init(struct inet_frag_queue *q, const void *a);
bool ip6_frag_match(const struct inet_frag_queue *q, const void *a);
497

498 499 500 501 502 503 504 505 506 507 508 509 510 511
/*
 *	Equivalent of ipv4 struct ip
 */
struct frag_queue {
	struct inet_frag_queue	q;

	__be32			id;		/* fragment id		*/
	u32			user;
	struct in6_addr		saddr;
	struct in6_addr		daddr;

	int			iif;
	unsigned int		csum;
	__u16			nhoffset;
512
	u8			ecn;
513 514 515 516 517
};

void ip6_expire_frag_queue(struct net *net, struct frag_queue *fq,
			   struct inet_frags *frags);

E
Eric Dumazet 已提交
518
static inline bool ipv6_addr_any(const struct in6_addr *a)
L
Linus Torvalds 已提交
519
{
520 521 522 523 524
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	const unsigned long *ul = (const unsigned long *)a;

	return (ul[0] | ul[1]) == 0UL;
#else
E
Eric Dumazet 已提交
525 526
	return (a->s6_addr32[0] | a->s6_addr32[1] |
		a->s6_addr32[2] | a->s6_addr32[3]) == 0;
527
#endif
L
Linus Torvalds 已提交
528 529
}

E
Eric Dumazet 已提交
530 531 532 533 534 535 536 537 538 539 540 541 542
static inline u32 ipv6_addr_hash(const struct in6_addr *a)
{
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	const unsigned long *ul = (const unsigned long *)a;
	unsigned long x = ul[0] ^ ul[1];

	return (u32)(x ^ (x >> 32));
#else
	return (__force u32)(a->s6_addr32[0] ^ a->s6_addr32[1] ^
			     a->s6_addr32[2] ^ a->s6_addr32[3]);
#endif
}

E
Eric Dumazet 已提交
543
/* more secured version of ipv6_addr_hash() */
544
static inline u32 __ipv6_addr_jhash(const struct in6_addr *a, const u32 initval)
E
Eric Dumazet 已提交
545 546 547 548 549 550
{
	u32 v = (__force u32)a->s6_addr32[0] ^ (__force u32)a->s6_addr32[1];

	return jhash_3words(v,
			    (__force u32)a->s6_addr32[2],
			    (__force u32)a->s6_addr32[3],
551
			    initval);
E
Eric Dumazet 已提交
552 553
}

E
Eric Dumazet 已提交
554
static inline bool ipv6_addr_loopback(const struct in6_addr *a)
555
{
556
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
557
	const __be64 *be = (const __be64 *)a;
558

559
	return (be[0] | (be[1] ^ cpu_to_be64(1))) == 0UL;
560
#else
E
Eric Dumazet 已提交
561
	return (a->s6_addr32[0] | a->s6_addr32[1] |
562
		a->s6_addr32[2] | (a->s6_addr32[3] ^ cpu_to_be32(1))) == 0;
563
#endif
564 565
}

566 567 568 569
/*
 * Note that we must __force cast these to unsigned long to make sparse happy,
 * since all of the endian-annotated types are fixed size regardless of arch.
 */
E
Eric Dumazet 已提交
570
static inline bool ipv6_addr_v4mapped(const struct in6_addr *a)
B
Brian Haley 已提交
571
{
572 573
	return (
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
574
		*(unsigned long *)a |
575
#else
576
		(__force unsigned long)(a->s6_addr32[0] | a->s6_addr32[1]) |
577
#endif
578 579
		(__force unsigned long)(a->s6_addr32[2] ^
					cpu_to_be32(0x0000ffff))) == 0UL;
B
Brian Haley 已提交
580 581
}

582 583 584 585
/*
 * Check for a RFC 4843 ORCHID address
 * (Overlay Routable Cryptographic Hash Identifiers)
 */
E
Eric Dumazet 已提交
586
static inline bool ipv6_addr_orchid(const struct in6_addr *a)
587
{
E
Eric Dumazet 已提交
588
	return (a->s6_addr32[0] & htonl(0xfffffff0)) == htonl(0x20010010);
589 590
}

591 592 593 594 595
static inline bool ipv6_addr_is_multicast(const struct in6_addr *addr)
{
	return (addr->s6_addr32[0] & htonl(0xFF000000)) == htonl(0xFF000000);
}

596 597 598 599 600 601 602 603 604
/*
 * Build in @v4mapped the address whose words are 0, 0, 0x0000FFFF (in
 * network byte order) and @addr.
 */
static inline void ipv6_addr_set_v4mapped(const __be32 addr,
					  struct in6_addr *v4mapped)
{
	const __be32 marker = htonl(0x0000FFFF);

	ipv6_addr_set(v4mapped, 0, 0, marker, addr);
}

605 606 607 608
/*
 * find the first different bit between two addresses
 * length of address must be a multiple of 32bits
 */
609
static inline int __ipv6_addr_diff32(const void *token1, const void *token2, int addrlen)
610
{
611
	const __be32 *a1 = token1, *a2 = token2;
612 613 614 615 616
	int i;

	addrlen >>= 2;

	for (i = 0; i < addrlen; i++) {
617 618
		__be32 xb = a1[i] ^ a2[i];
		if (xb)
619
			return i * 32 + 31 - __fls(ntohl(xb));
620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637
	}

	/*
	 *	we should *never* get to this point since that 
	 *	would mean the addrs are equal
	 *
	 *	However, we do get to it 8) And exacly, when
	 *	addresses are equal 8)
	 *
	 *	ip route add 1111::/128 via ...
	 *	ip route add 1111::/64 via ...
	 *	and we are here.
	 *
	 *	Ideally, this function should stop comparison
	 *	at prefix length. It does not, but it is still OK,
	 *	if returned value is greater than prefix length.
	 *					--ANK (980803)
	 */
E
Eric Dumazet 已提交
638
	return addrlen << 5;
639 640
}

641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
/*
 * 64-bit-word variant of the first-different-bit search.
 * @addrlen is in bytes; only whole 64-bit words are examined. Returns the
 * index (from the most significant bit) of the first differing bit, or
 * the number of bits examined when no difference is found.
 */
static inline int __ipv6_addr_diff64(const void *token1, const void *token2, int addrlen)
{
	const __be64 *lhs = token1;
	const __be64 *rhs = token2;
	const int nwords = addrlen >> 3;
	int idx = 0;

	while (idx < nwords) {
		__be64 delta = lhs[idx] ^ rhs[idx];

		if (delta)
			return idx * 64 + 63 - __fls(be64_to_cpu(delta));
		idx++;
	}

	return nwords << 6;
}
#endif

/*
 * Find the first differing bit of two @addrlen-byte tokens.
 * The 64-bit helper is chosen only when it is compiled in and @addrlen is
 * a compile-time constant multiple of 8; every other case uses the
 * 32-bit helper.
 */
static inline int __ipv6_addr_diff(const void *token1, const void *token2, int addrlen)
{
#if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64
	if (__builtin_constant_p(addrlen) && (addrlen & 7) == 0)
		return __ipv6_addr_diff64(token1, token2, addrlen);
#endif

	return __ipv6_addr_diff32(token1, token2, addrlen);
}

668 669 670 671 672
/*
 * First differing bit of two full addresses: __ipv6_addr_diff() over
 * sizeof(struct in6_addr) bytes. The length is passed as a literal sizeof
 * so the callee's __builtin_constant_p() test can see a constant.
 */
static inline int ipv6_addr_diff(const struct in6_addr *a1, const struct in6_addr *a2)
{
	return __ipv6_addr_diff(a1, a2, sizeof(struct in6_addr));
}

673
int ip6_dst_hoplimit(struct dst_entry *dst);
674

675 676 677 678 679 680 681 682 683 684 685 686 687 688
/*
 * Pick the hop limit for a flow.
 *
 * Multicast destinations use np->mcast_hops, all others np->hop_limit.
 * A negative socket value falls back to ip6_dst_hoplimit(@dst).
 */
static inline int ip6_sk_dst_hoplimit(struct ipv6_pinfo *np, struct flowi6 *fl6,
				      struct dst_entry *dst)
{
	int hlimit = ipv6_addr_is_multicast(&fl6->daddr) ? np->mcast_hops
							  : np->hop_limit;

	return (hlimit < 0) ? ip6_dst_hoplimit(dst) : hlimit;
}

689
#if IS_ENABLED(CONFIG_IPV6)
/*
 * Set sk->sk_txhash from a flow_keys record built out of the hashed
 * source address (np->saddr), the hashed destination address
 * (sk->sk_v6_daddr) and the socket's source and destination ports.
 */
static inline void ip6_set_txhash(struct sock *sk)
{
	struct inet_sock *inet = inet_sk(sk);
	struct ipv6_pinfo *np = inet6_sk(sk);
	struct flow_keys keys;

	keys.src = (__force __be32)ipv6_addr_hash(&np->saddr);
	keys.dst = (__force __be32)ipv6_addr_hash(&sk->sk_v6_daddr);
	keys.port16[0] = inet->inet_sport;
	keys.port16[1] = inet->inet_dport;

	sk->sk_txhash = flow_hash_from_keys(&keys);
}

/*
 * Return the flow label to use for @skb.
 *
 * A non-zero @flowlabel is returned unchanged. Otherwise, when @autolabel
 * is set or the auto_flowlabels sysctl of @net is enabled, a label is
 * derived from the skb hash; if neither is enabled the (zero) @flowlabel
 * is returned.
 */
static inline __be32 ip6_make_flowlabel(struct net *net, struct sk_buff *skb,
					__be32 flowlabel, bool autolabel)
{
	if (!flowlabel && (autolabel || net->ipv6.sysctl.auto_flowlabels)) {
		/* host-order value; only cast to __be32 when masking below */
		u32 hash;

		hash = skb_get_hash(skb);

		/* Since this is being sent on the wire obfuscate hash a bit
		 * to minimize possibility that any useful information to an
		 * attacker is leaked. Only lower 20 bits are relevant.
		 */
		hash ^= hash >> 12;

		flowlabel = (__force __be32)hash & IPV6_FLOWLABEL_MASK;
	}

	return flowlabel;
}
#else
/* Stubs for builds without IPv6: no tx hash, flow label passed through. */
static inline void ip6_set_txhash(struct sock *sk) { }
static inline __be32 ip6_make_flowlabel(struct net *net, struct sk_buff *skb,
					__be32 flowlabel, bool autolabel)
{
	return flowlabel;
}
#endif

732

733 734 735 736 737 738
/*
 *	Header manipulation
 */

/*
 * Write the first 32 bits of @hdr: the constant 0x60000000 OR-ed with
 * @tclass shifted left by 20 (converted to network byte order), combined
 * with the already big-endian @flowlabel.
 */
static inline void ip6_flow_hdr(struct ipv6hdr *hdr, unsigned int tclass,
				__be32 flowlabel)
{
	*(__be32 *)hdr = htonl(0x60000000 | (tclass << 20)) | flowlabel;
}

742 743 744 745 746
static inline __be32 ip6_flowinfo(const struct ipv6hdr *hdr)
{
	return *(__be32 *)hdr & IPV6_FLOWINFO_MASK;
}

F
Florent Fourcot 已提交
747 748 749 750 751
static inline __be32 ip6_flowlabel(const struct ipv6hdr *hdr)
{
	return *(__be32 *)hdr & IPV6_FLOWLABEL_MASK;
}

752 753 754 755
/*
 * Extract the traffic class from a big-endian flowinfo word: keep the
 * IPV6_TCLASS_MASK bits, convert to host order and shift right by
 * IPV6_TCLASS_SHIFT.
 */
static inline u8 ip6_tclass(__be32 flowinfo)
{
	const __be32 tclass_bits = flowinfo & IPV6_TCLASS_MASK;

	return ntohl(tclass_bits) >> IPV6_TCLASS_SHIFT;
}
L
Linus Torvalds 已提交
756 757 758 759 760 761 762 763
/*
 *	Prototypes exported by ipv6
 */

/*
 *	rcv function (called from netdevice level)
 */

764 765
int ipv6_rcv(struct sk_buff *skb, struct net_device *dev,
	     struct packet_type *pt, struct net_device *orig_dev);
L
Linus Torvalds 已提交
766

767
int ip6_rcv_finish(struct sk_buff *skb);
768

L
Linus Torvalds 已提交
769 770 771
/*
 *	upper-layer output functions
 */
772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789
int ip6_xmit(struct sock *sk, struct sk_buff *skb, struct flowi6 *fl6,
	     struct ipv6_txoptions *opt, int tclass);

int ip6_find_1stfragopt(struct sk_buff *skb, u8 **nexthdr);

int ip6_append_data(struct sock *sk,
		    int getfrag(void *from, char *to, int offset, int len,
				int odd, struct sk_buff *skb),
		    void *from, int length, int transhdrlen, int hlimit,
		    int tclass, struct ipv6_txoptions *opt, struct flowi6 *fl6,
		    struct rt6_info *rt, unsigned int flags, int dontfrag);

int ip6_push_pending_frames(struct sock *sk);

void ip6_flush_pending_frames(struct sock *sk);

int ip6_dst_lookup(struct sock *sk, struct dst_entry **dst, struct flowi6 *fl6);
struct dst_entry *ip6_dst_lookup_flow(struct sock *sk, struct flowi6 *fl6,
790
				      const struct in6_addr *final_dst);
791
struct dst_entry *ip6_sk_dst_lookup_flow(struct sock *sk, struct flowi6 *fl6,
792
					 const struct in6_addr *final_dst);
793 794
struct dst_entry *ip6_blackhole_route(struct net *net,
				      struct dst_entry *orig_dst);
L
Linus Torvalds 已提交
795 796 797 798 799

/*
 *	skb processing functions
 */

800
int ip6_output(struct sock *sk, struct sk_buff *skb);
801 802 803
int ip6_forward(struct sk_buff *skb);
int ip6_input(struct sk_buff *skb);
int ip6_mc_input(struct sk_buff *skb);
L
Linus Torvalds 已提交
804

805 806
int __ip6_local_out(struct sk_buff *skb);
int ip6_local_out(struct sk_buff *skb);
H
Herbert Xu 已提交
807

L
Linus Torvalds 已提交
808 809 810 811
/*
 *	Extension header (options) processing
 */

812 813 814 815
void ipv6_push_nfrag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt,
			  u8 *proto, struct in6_addr **daddr_p);
void ipv6_push_frag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt,
			 u8 *proto);
L
Linus Torvalds 已提交
816

817 818
int ipv6_skip_exthdr(const struct sk_buff *, int start, u8 *nexthdrp,
		     __be16 *frag_offp);
L
Linus Torvalds 已提交
819

820
bool ipv6_ext_hdr(u8 nexthdr);
L
Linus Torvalds 已提交
821

822
/* Single-bit IP6_FH_F_* flag values (bits 0..2). */
enum {
	IP6_FH_F_FRAG		= (1 << 0),
	IP6_FH_F_AUTH		= (1 << 1),
	IP6_FH_F_SKIP_RH	= (1 << 2),
};

/* find specified header and get offset to it */
829 830
int ipv6_find_hdr(const struct sk_buff *skb, unsigned int *offset, int target,
		  unsigned short *fragoff, int *fragflg);
831

832
int ipv6_find_tlv(struct sk_buff *skb, int offset, int type);
833

834 835 836
struct in6_addr *fl6_update_dst(struct flowi6 *fl6,
				const struct ipv6_txoptions *opt,
				struct in6_addr *orig);
837

L
Linus Torvalds 已提交
838 839 840 841
/*
 *	socket options (ipv6_sockglue.c)
 */

842 843 844 845 846 847 848 849 850 851
int ipv6_setsockopt(struct sock *sk, int level, int optname,
		    char __user *optval, unsigned int optlen);
int ipv6_getsockopt(struct sock *sk, int level, int optname,
		    char __user *optval, int __user *optlen);
int compat_ipv6_setsockopt(struct sock *sk, int level, int optname,
			   char __user *optval, unsigned int optlen);
int compat_ipv6_getsockopt(struct sock *sk, int level, int optname,
			   char __user *optval, int __user *optlen);

int ip6_datagram_connect(struct sock *sk, struct sockaddr *addr, int addr_len);
852 853
int ip6_datagram_connect_v6_only(struct sock *sk, struct sockaddr *addr,
				 int addr_len);
854

855 856 857 858
int ipv6_recv_error(struct sock *sk, struct msghdr *msg, int len,
		    int *addr_len);
int ipv6_recv_rxpmtu(struct sock *sk, struct msghdr *msg, int len,
		     int *addr_len);
859 860 861 862 863 864 865 866 867 868 869 870
void ipv6_icmp_error(struct sock *sk, struct sk_buff *skb, int err, __be16 port,
		     u32 info, u8 *payload);
void ipv6_local_error(struct sock *sk, int err, struct flowi6 *fl6, u32 info);
void ipv6_local_rxpmtu(struct sock *sk, struct flowi6 *fl6, u32 mtu);

int inet6_release(struct socket *sock);
int inet6_bind(struct socket *sock, struct sockaddr *uaddr, int addr_len);
int inet6_getname(struct socket *sock, struct sockaddr *uaddr, int *uaddr_len,
		  int peer);
int inet6_ioctl(struct socket *sock, unsigned int cmd, unsigned long arg);

int inet6_hash_connect(struct inet_timewait_death_row *death_row,
871 872
			      struct sock *sk);

L
Linus Torvalds 已提交
873 874 875
/*
 * reassembly.c
 */
876 877
extern const struct proto_ops inet6_stream_ops;
extern const struct proto_ops inet6_dgram_ops;
878

879 880 881
struct group_source_req;
struct group_filter;

882 883 884 885 886
int ip6_mc_source(int add, int omode, struct sock *sk,
		  struct group_source_req *pgsr);
int ip6_mc_msfilter(struct sock *sk, struct group_filter *gsf);
int ip6_mc_msfget(struct sock *sk, struct group_filter *gsf,
		  struct group_filter __user *optval, int __user *optlen);
887 888

#ifdef CONFIG_PROC_FS
int ac6_proc_init(struct net *net);
void ac6_proc_exit(struct net *net);
int raw6_proc_init(void);
void raw6_proc_exit(void);
int tcp6_proc_init(struct net *net);
void tcp6_proc_exit(struct net *net);
int udp6_proc_init(struct net *net);
void udp6_proc_exit(struct net *net);
int udplite6_proc_init(void);
void udplite6_proc_exit(void);
int ipv6_misc_proc_init(void);
void ipv6_misc_proc_exit(void);
int snmp6_register_dev(struct inet6_dev *idev);
int snmp6_unregister_dev(struct inet6_dev *idev);

#else
/* Without CONFIG_PROC_FS these hooks do nothing; the int ones return 0. */
static inline int ac6_proc_init(struct net *net) { return 0; }
static inline void ac6_proc_exit(struct net *net) { }
static inline int snmp6_register_dev(struct inet6_dev *idev) { return 0; }
static inline int snmp6_unregister_dev(struct inet6_dev *idev) { return 0; }
#endif
L
Linus Torvalds 已提交
910

911
#ifdef CONFIG_SYSCTL
912
extern struct ctl_table ipv6_route_table_template[];
L
Linus Torvalds 已提交
913

914 915 916 917
struct ctl_table *ipv6_icmp_sysctl_init(struct net *net);
struct ctl_table *ipv6_route_sysctl_init(struct net *net);
int ipv6_sysctl_register(void);
void ipv6_sysctl_unregister(void);
918
#endif
L
Linus Torvalds 已提交
919

920
#endif /* _NET_IPV6_H */