/* (C) 1999-2001 Paul `Rusty' Russell
 * (C) 2002-2004 Netfilter Core Team <coreteam@netfilter.org>
 * (C) 2006-2010 Patrick McHardy <kaber@trash.net>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */

#include <linux/types.h>
#include <linux/timer.h>
#include <linux/netfilter.h>
#include <linux/in.h>
#include <linux/icmp.h>
#include <linux/seq_file.h>
#include <net/ip.h>
#include <net/checksum.h>
#include <linux/netfilter_ipv4.h>
#include <net/netfilter/nf_conntrack_tuple.h>
#include <net/netfilter/nf_conntrack_l4proto.h>
#include <net/netfilter/nf_conntrack_core.h>
#include <net/netfilter/nf_conntrack_zones.h>
#include <net/netfilter/nf_log.h>

25
/* Default ICMP conntrack timeout (30 * HZ); icmp_init_net() copies it into
 * each namespace's nf_icmp_net.timeout. */
static unsigned int nf_ct_icmp_timeout __read_mostly = 30*HZ;
26

27 28 29 30 31
/* Return the ICMP conntrack state embedded in @net. */
static inline struct nf_icmp_net *icmp_pernet(struct net *net)
{
	struct nf_icmp_net *icmp_net = &net->ct.nf_ct_proto.icmp;

	return icmp_net;
}

32
static bool icmp_pkt_to_tuple(const struct sk_buff *skb, unsigned int dataoff,
33
			      struct net *net, struct nf_conntrack_tuple *tuple)
34
{
35 36
	const struct icmphdr *hp;
	struct icmphdr _hdr;
37 38 39

	hp = skb_header_pointer(skb, dataoff, sizeof(_hdr), &_hdr);
	if (hp == NULL)
40
		return false;
41 42 43 44 45

	tuple->dst.u.icmp.type = hp->type;
	tuple->src.u.icmp.id = hp->un.echo.id;
	tuple->dst.u.icmp.code = hp->code;

46
	return true;
47 48
}

49 50 51 52 53 54 55 56 57 58 59 60
/*
 * Maps an ICMP request/reply type to its counterpart.  Each entry is stored
 * as "counterpart + 1" so that the zero left in unlisted slots means
 * "no counterpart"; users subtract 1 after checking for non-zero.
 */
static const u_int8_t invmap[] = {
	/* echo */
	[ICMP_ECHO]		= ICMP_ECHOREPLY + 1,
	[ICMP_ECHOREPLY]	= ICMP_ECHO + 1,
	/* timestamp */
	[ICMP_TIMESTAMP]	= ICMP_TIMESTAMPREPLY + 1,
	[ICMP_TIMESTAMPREPLY]	= ICMP_TIMESTAMP + 1,
	/* information */
	[ICMP_INFO_REQUEST]	= ICMP_INFO_REPLY + 1,
	[ICMP_INFO_REPLY]	= ICMP_INFO_REQUEST + 1,
	/* address mask */
	[ICMP_ADDRESS]		= ICMP_ADDRESSREPLY + 1,
	[ICMP_ADDRESSREPLY]	= ICMP_ADDRESS + 1,
};

61 62
static bool icmp_invert_tuple(struct nf_conntrack_tuple *tuple,
			      const struct nf_conntrack_tuple *orig)
63
{
64 65
	if (orig->dst.u.icmp.type >= sizeof(invmap) ||
	    !invmap[orig->dst.u.icmp.type])
66
		return false;
67 68 69 70

	tuple->src.u.icmp.id = orig->src.u.icmp.id;
	tuple->dst.u.icmp.type = invmap[orig->dst.u.icmp.type] - 1;
	tuple->dst.u.icmp.code = orig->dst.u.icmp.code;
71
	return true;
72 73
}

74 75
static unsigned int *icmp_get_timeouts(struct net *net)
{
76
	return &icmp_pernet(net)->timeout;
77 78
}

79 80 81 82 83
/* Returns verdict for packet, or -1 for invalid. */
static int icmp_packet(struct nf_conn *ct,
		       const struct sk_buff *skb,
		       unsigned int dataoff,
		       enum ip_conntrack_info ctinfo,
84
		       u_int8_t pf,
85
		       unsigned int *timeout)
86
{
87 88 89
	/* Do not immediately delete the connection after the first
	   successful reply to avoid excessive conntrackd traffic
	   and also to handle correctly ICMP echo reply duplicates. */
90
	nf_ct_refresh_acct(ct, ctinfo, skb, *timeout);
91 92 93 94 95

	return NF_ACCEPT;
}

/* Called when a new connection for this protocol found. */
96
static bool icmp_new(struct nf_conn *ct, const struct sk_buff *skb,
97
		     unsigned int dataoff, unsigned int *timeouts)
98
{
99 100 101 102 103 104
	static const u_int8_t valid_new[] = {
		[ICMP_ECHO] = 1,
		[ICMP_TIMESTAMP] = 1,
		[ICMP_INFO_REQUEST] = 1,
		[ICMP_ADDRESS] = 1
	};
105

106 107
	if (ct->tuplehash[0].tuple.dst.u.icmp.type >= sizeof(valid_new) ||
	    !valid_new[ct->tuplehash[0].tuple.dst.u.icmp.type]) {
108
		/* Can't create a new ICMP `conn' with this. */
109
		pr_debug("icmp: can't create new conn with type %u\n",
110
			 ct->tuplehash[0].tuple.dst.u.icmp.type);
111
		nf_ct_dump_tuple_ip(&ct->tuplehash[0].tuple);
112
		return false;
113
	}
114
	return true;
115 116 117 118
}

/* Returns conntrack if it dealt with ICMP, and filled in skb fields */
static int
119
icmp_error_message(struct net *net, struct nf_conn *tmpl, struct sk_buff *skb,
120
		 unsigned int hooknum)
121 122
{
	struct nf_conntrack_tuple innertuple, origtuple;
123 124
	const struct nf_conntrack_l4proto *innerproto;
	const struct nf_conntrack_tuple_hash *h;
125
	const struct nf_conntrack_zone *zone;
126
	enum ip_conntrack_info ctinfo;
127
	struct nf_conntrack_zone tmp;
128

129
	WARN_ON(skb_nfct(skb));
130
	zone = nf_ct_zone_tmpl(tmpl, skb, &tmp);
131

132 133 134 135
	/* Are they talking about one of our connections? */
	if (!nf_ct_get_tuplepr(skb,
			       skb_network_offset(skb) + ip_hdrlen(skb)
						       + sizeof(struct icmphdr),
136
			       PF_INET, net, &origtuple)) {
137
		pr_debug("icmp_error_message: failed to get tuple\n");
138 139 140
		return -NF_ACCEPT;
	}

141
	/* rcu_read_lock()ed by nf_hook_thresh */
142
	innerproto = __nf_ct_l4proto_find(PF_INET, origtuple.dst.protonum);
143

144 145 146
	/* Ordinarily, we'd expect the inverted tupleproto, but it's
	   been preserved inside the ICMP. */
	if (!nf_ct_invert_tuple(&innertuple, &origtuple,
147
				&nf_conntrack_l3proto_ipv4, innerproto)) {
148
		pr_debug("icmp_error_message: no match\n");
149 150 151
		return -NF_ACCEPT;
	}

152
	ctinfo = IP_CT_RELATED;
153

154
	h = nf_conntrack_find_get(net, zone, &innertuple);
155
	if (!h) {
156 157
		pr_debug("icmp_error_message: no match\n");
		return -NF_ACCEPT;
158 159
	}

160
	if (NF_CT_DIRECTION(h) == IP_CT_DIR_REPLY)
161
		ctinfo += IP_CT_IS_REPLY;
162

163
	/* Update skb to refer to this connection */
164
	nf_ct_set(skb, nf_ct_tuplehash_to_ctrack(h), ctinfo);
165
	return NF_ACCEPT;
166 167 168 169
}

/* Small and modified version of icmp_rcv */
static int
170 171
icmp_error(struct net *net, struct nf_conn *tmpl,
	   struct sk_buff *skb, unsigned int dataoff,
172
	   u8 pf, unsigned int hooknum)
173
{
174 175
	const struct icmphdr *icmph;
	struct icmphdr _ih;
176 177

	/* Not enough header? */
178
	icmph = skb_header_pointer(skb, ip_hdrlen(skb), sizeof(_ih), &_ih);
179
	if (icmph == NULL) {
180
		if (LOG_INVALID(net, IPPROTO_ICMP))
181 182
			nf_log_packet(net, PF_INET, 0, skb, NULL, NULL,
				      NULL, "nf_ct_icmp: short packet ");
183 184 185 186
		return -NF_ACCEPT;
	}

	/* See ip_conntrack_proto_tcp.c */
187
	if (net->ct.sysctl_checksum && hooknum == NF_INET_PRE_ROUTING &&
188
	    nf_ip_checksum(skb, hooknum, dataoff, 0)) {
189
		if (LOG_INVALID(net, IPPROTO_ICMP))
190
			nf_log_packet(net, PF_INET, 0, skb, NULL, NULL, NULL,
191 192 193 194 195 196 197 198 199 200 201
				      "nf_ct_icmp: bad HW ICMP checksum ");
		return -NF_ACCEPT;
	}

	/*
	 *	18 is the highest 'known' ICMP type. Anything else is a mystery
	 *
	 *	RFC 1122: 3.2.2  Unknown ICMP messages types MUST be silently
	 *		  discarded.
	 */
	if (icmph->type > NR_ICMP_TYPES) {
202
		if (LOG_INVALID(net, IPPROTO_ICMP))
203
			nf_log_packet(net, PF_INET, 0, skb, NULL, NULL, NULL,
204 205 206 207 208
				      "nf_ct_icmp: invalid ICMP type ");
		return -NF_ACCEPT;
	}

	/* Need to track icmp error message? */
209 210 211 212 213
	if (icmph->type != ICMP_DEST_UNREACH &&
	    icmph->type != ICMP_SOURCE_QUENCH &&
	    icmph->type != ICMP_TIME_EXCEEDED &&
	    icmph->type != ICMP_PARAMETERPROB &&
	    icmph->type != ICMP_REDIRECT)
214 215
		return NF_ACCEPT;

216
	return icmp_error_message(net, tmpl, skb, hooknum);
217 218
}

D
Duan Jiong 已提交
219
#if IS_ENABLED(CONFIG_NF_CT_NETLINK)
220 221 222 223

#include <linux/netfilter/nfnetlink.h>
#include <linux/netfilter/nfnetlink_conntrack.h>

224
static int icmp_tuple_to_nlattr(struct sk_buff *skb,
225 226
				const struct nf_conntrack_tuple *t)
{
227 228 229 230
	if (nla_put_be16(skb, CTA_PROTO_ICMP_ID, t->src.u.icmp.id) ||
	    nla_put_u8(skb, CTA_PROTO_ICMP_TYPE, t->dst.u.icmp.type) ||
	    nla_put_u8(skb, CTA_PROTO_ICMP_CODE, t->dst.u.icmp.code))
		goto nla_put_failure;
231 232
	return 0;

233
nla_put_failure:
234 235 236
	return -1;
}

237 238 239 240
/* Netlink attribute types for the ICMP part of a conntrack tuple. */
static const struct nla_policy icmp_nla_policy[CTA_PROTO_MAX+1] = {
	[CTA_PROTO_ICMP_TYPE]	= { .type = NLA_U8 },
	[CTA_PROTO_ICMP_CODE]	= { .type = NLA_U8 },
	[CTA_PROTO_ICMP_ID]	= { .type = NLA_U16 },
};

243
static int icmp_nlattr_to_tuple(struct nlattr *tb[],
244 245
				struct nf_conntrack_tuple *tuple)
{
246 247 248
	if (!tb[CTA_PROTO_ICMP_TYPE] ||
	    !tb[CTA_PROTO_ICMP_CODE] ||
	    !tb[CTA_PROTO_ICMP_ID])
249 250
		return -EINVAL;

251 252 253
	tuple->dst.u.icmp.type = nla_get_u8(tb[CTA_PROTO_ICMP_TYPE]);
	tuple->dst.u.icmp.code = nla_get_u8(tb[CTA_PROTO_ICMP_CODE]);
	tuple->src.u.icmp.id = nla_get_be16(tb[CTA_PROTO_ICMP_ID]);
254

255 256
	if (tuple->dst.u.icmp.type >= sizeof(invmap) ||
	    !invmap[tuple->dst.u.icmp.type])
257 258 259 260
		return -EINVAL;

	return 0;
}
261 262 263 264 265

/* Return nla_policy_len() of icmp_nla_policy over all CTA_PROTO_MAX + 1 slots. */
static int icmp_nlattr_tuple_size(void)
{
	int len = nla_policy_len(icmp_nla_policy, CTA_PROTO_MAX + 1);

	return len;
}
266 267
#endif

268 269 270 271 272
#if IS_ENABLED(CONFIG_NF_CT_NETLINK_TIMEOUT)

#include <linux/netfilter/nfnetlink.h>
#include <linux/netfilter/nfnetlink_cttimeout.h>

273 274
static int icmp_timeout_nlattr_to_obj(struct nlattr *tb[],
				      struct net *net, void *data)
275 276
{
	unsigned int *timeout = data;
277
	struct nf_icmp_net *in = icmp_pernet(net);
278 279 280 281 282 283

	if (tb[CTA_TIMEOUT_ICMP_TIMEOUT]) {
		*timeout =
			ntohl(nla_get_be32(tb[CTA_TIMEOUT_ICMP_TIMEOUT])) * HZ;
	} else {
		/* Set default ICMP timeout. */
284
		*timeout = in->timeout;
285 286 287 288 289 290 291 292 293
	}
	return 0;
}

static int
icmp_timeout_obj_to_nlattr(struct sk_buff *skb, const void *data)
{
	const unsigned int *timeout = data;

294 295
	if (nla_put_be32(skb, CTA_TIMEOUT_ICMP_TIMEOUT, htonl(*timeout / HZ)))
		goto nla_put_failure;
296 297 298 299 300 301 302 303 304 305 306 307
	return 0;

nla_put_failure:
	return -ENOSPC;
}

/* Netlink attribute policy for ICMP timeouts: one 32-bit timeout value. */
static const struct nla_policy
icmp_timeout_nla_policy[CTA_TIMEOUT_ICMP_MAX+1] = {
	[CTA_TIMEOUT_ICMP_TIMEOUT]	= { .type = NLA_U32 },
};
#endif /* CONFIG_NF_CT_NETLINK_TIMEOUT */

308 309 310 311 312 313
#ifdef CONFIG_SYSCTL
static struct ctl_table icmp_sysctl_table[] = {
	{
		.procname	= "nf_conntrack_icmp_timeout",
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
A
Alexey Dobriyan 已提交
314
		.proc_handler	= proc_dointvec_jiffies,
315
	},
316
	{ }
317 318 319
};
#endif /* CONFIG_SYSCTL */

320 321
/*
 * Give @pn its own copy of icmp_sysctl_table whose first entry points at
 * @in->timeout.
 *
 * Without CONFIG_SYSCTL this does nothing.
 * Returns 0 on success, -ENOMEM if the table could not be duplicated.
 */
static int icmp_kmemdup_sysctl_table(struct nf_proto_net *pn,
				     struct nf_icmp_net *in)
{
#ifdef CONFIG_SYSCTL
	pn->ctl_table = kmemdup(icmp_sysctl_table,
				sizeof(icmp_sysctl_table),
				GFP_KERNEL);
	if (!pn->ctl_table)
		return -ENOMEM;

	pn->ctl_table[0].data = &in->timeout;
#endif
	return 0;
}

/*
 * Initialise the ICMP conntrack state of @net: set the timeout to the
 * default nf_ct_icmp_timeout and set up the sysctl table.  @proto is not
 * used.
 *
 * Returns the result of icmp_kmemdup_sysctl_table().
 */
static int icmp_init_net(struct net *net, u_int16_t proto)
{
	struct nf_icmp_net *in = icmp_pernet(net);
	struct nf_proto_net *pn = &in->pn;

	in->timeout = nf_ct_icmp_timeout;

	return icmp_kmemdup_sysctl_table(pn, in);
}

345 346 347 348 349
static struct nf_proto_net *icmp_get_net_proto(struct net *net)
{
	return &net->ct.nf_ct_proto.icmp.pn;
}

350
/*
 * Layer-4 conntrack descriptor for ICMP (IPPROTO_ICMP) over PF_INET, wiring
 * up the handlers defined in this file.  The netlink tuple and timeout
 * callbacks are only present when the matching config options are enabled.
 */
struct nf_conntrack_l4proto nf_conntrack_l4proto_icmp __read_mostly =
{
	.l3proto		= PF_INET,
	.l4proto		= IPPROTO_ICMP,
	.pkt_to_tuple		= icmp_pkt_to_tuple,
	.invert_tuple		= icmp_invert_tuple,
	.packet			= icmp_packet,
	.get_timeouts		= icmp_get_timeouts,
	.new			= icmp_new,
	.error			= icmp_error,
	.destroy		= NULL,
	.me			= NULL,
#if IS_ENABLED(CONFIG_NF_CT_NETLINK)
	.tuple_to_nlattr	= icmp_tuple_to_nlattr,
	.nlattr_tuple_size	= icmp_nlattr_tuple_size,
	.nlattr_to_tuple	= icmp_nlattr_to_tuple,
	.nla_policy		= icmp_nla_policy,
#endif
#if IS_ENABLED(CONFIG_NF_CT_NETLINK_TIMEOUT)
	.ctnl_timeout		= {
		.nlattr_to_obj	= icmp_timeout_nlattr_to_obj,
		.obj_to_nlattr	= icmp_timeout_obj_to_nlattr,
		.nlattr_max	= CTA_TIMEOUT_ICMP_MAX,
		.obj_size	= sizeof(unsigned int),
		.nla_policy	= icmp_timeout_nla_policy,
	},
#endif /* CONFIG_NF_CT_NETLINK_TIMEOUT */
	.init_net		= icmp_init_net,
	.get_net_proto		= icmp_get_net_proto,
};