nf_conntrack_proto_icmp.c 11.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18
/* (C) 1999-2001 Paul `Rusty' Russell
 * (C) 2002-2004 Netfilter Core Team <coreteam@netfilter.org>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */

#include <linux/types.h>
#include <linux/timer.h>
#include <linux/netfilter.h>
#include <linux/in.h>
#include <linux/icmp.h>
#include <linux/seq_file.h>
#include <net/ip.h>
#include <net/checksum.h>
#include <linux/netfilter_ipv4.h>
#include <net/netfilter/nf_conntrack_tuple.h>
19
#include <net/netfilter/nf_conntrack_l4proto.h>
20
#include <net/netfilter/nf_conntrack_core.h>
21
#include <net/netfilter/nf_conntrack_zones.h>
22
#include <net/netfilter/nf_log.h>
23

24
/*
 * Default ICMP conntrack timeout, in jiffies (30 * HZ).  icmp_init_net()
 * copies it into the per-namespace ICMP state.
 */
static unsigned int nf_ct_icmp_timeout __read_mostly = 30 * HZ;
25

26 27 28 29 30
/* Return the ICMP conntrack state embedded in network namespace @net. */
static inline struct nf_icmp_net *icmp_pernet(struct net *net)
{
	struct nf_icmp_net *icmp_net = &net->ct.nf_ct_proto.icmp;

	return icmp_net;
}

31 32
static bool icmp_pkt_to_tuple(const struct sk_buff *skb, unsigned int dataoff,
			      struct nf_conntrack_tuple *tuple)
33
{
34 35
	const struct icmphdr *hp;
	struct icmphdr _hdr;
36 37 38

	hp = skb_header_pointer(skb, dataoff, sizeof(_hdr), &_hdr);
	if (hp == NULL)
39
		return false;
40 41 42 43 44

	tuple->dst.u.icmp.type = hp->type;
	tuple->src.u.icmp.id = hp->un.echo.id;
	tuple->dst.u.icmp.code = hp->code;

45
	return true;
46 47
}

48 49 50 51 52 53 54 55 56 57 58 59
/*
 * Request <-> reply pairing of ICMP types, indexed by ICMP type.
 * Each listed slot stores the counterpart type plus one, so a slot that
 * is not listed (implicitly zero) means "this type has no counterpart".
 */
static const u_int8_t invmap[] = {
	[ICMP_ECHOREPLY]	= ICMP_ECHO + 1,
	[ICMP_ECHO]		= ICMP_ECHOREPLY + 1,
	[ICMP_TIMESTAMPREPLY]	= ICMP_TIMESTAMP + 1,
	[ICMP_TIMESTAMP]	= ICMP_TIMESTAMPREPLY + 1,
	[ICMP_INFO_REPLY]	= ICMP_INFO_REQUEST + 1,
	[ICMP_INFO_REQUEST]	= ICMP_INFO_REPLY + 1,
	[ICMP_ADDRESSREPLY]	= ICMP_ADDRESS + 1,
	[ICMP_ADDRESS]		= ICMP_ADDRESSREPLY + 1,
};

60 61
static bool icmp_invert_tuple(struct nf_conntrack_tuple *tuple,
			      const struct nf_conntrack_tuple *orig)
62
{
63 64
	if (orig->dst.u.icmp.type >= sizeof(invmap) ||
	    !invmap[orig->dst.u.icmp.type])
65
		return false;
66 67 68 69

	tuple->src.u.icmp.id = orig->src.u.icmp.id;
	tuple->dst.u.icmp.type = invmap[orig->dst.u.icmp.type] - 1;
	tuple->dst.u.icmp.code = orig->dst.u.icmp.code;
70
	return true;
71 72 73 74 75 76 77 78 79 80 81 82
}

/*
 * Write the per-protocol part of @tuple (type, code, id) to seq_file @s.
 * The id is converted with ntohs() before printing.  Returns whatever
 * seq_printf() returns.
 */
static int icmp_print_tuple(struct seq_file *s,
			    const struct nf_conntrack_tuple *tuple)
{
	const unsigned int type = tuple->dst.u.icmp.type;
	const unsigned int code = tuple->dst.u.icmp.code;
	const unsigned int id = ntohs(tuple->src.u.icmp.id);

	return seq_printf(s, "type=%u code=%u id=%u ", type, code, id);
}

83 84
static unsigned int *icmp_get_timeouts(struct net *net)
{
85
	return &icmp_pernet(net)->timeout;
86 87
}

88 89 90 91 92
/* Returns verdict for packet, or -1 for invalid. */
static int icmp_packet(struct nf_conn *ct,
		       const struct sk_buff *skb,
		       unsigned int dataoff,
		       enum ip_conntrack_info ctinfo,
93
		       u_int8_t pf,
94 95
		       unsigned int hooknum,
		       unsigned int *timeout)
96
{
97 98 99
	/* Do not immediately delete the connection after the first
	   successful reply to avoid excessive conntrackd traffic
	   and also to handle correctly ICMP echo reply duplicates. */
100
	nf_ct_refresh_acct(ct, ctinfo, skb, *timeout);
101 102 103 104 105

	return NF_ACCEPT;
}

/* Called when a new connection for this protocol found. */
106
static bool icmp_new(struct nf_conn *ct, const struct sk_buff *skb,
107
		     unsigned int dataoff, unsigned int *timeouts)
108
{
109 110 111 112 113 114
	static const u_int8_t valid_new[] = {
		[ICMP_ECHO] = 1,
		[ICMP_TIMESTAMP] = 1,
		[ICMP_INFO_REQUEST] = 1,
		[ICMP_ADDRESS] = 1
	};
115

116 117
	if (ct->tuplehash[0].tuple.dst.u.icmp.type >= sizeof(valid_new) ||
	    !valid_new[ct->tuplehash[0].tuple.dst.u.icmp.type]) {
118
		/* Can't create a new ICMP `conn' with this. */
119
		pr_debug("icmp: can't create new conn with type %u\n",
120
			 ct->tuplehash[0].tuple.dst.u.icmp.type);
121
		nf_ct_dump_tuple_ip(&ct->tuplehash[0].tuple);
122
		return false;
123
	}
124
	return true;
125 126 127 128
}

/* Returns conntrack if it dealt with ICMP, and filled in skb fields */
static int
129
icmp_error_message(struct net *net, struct nf_conn *tmpl, struct sk_buff *skb,
130 131
		 enum ip_conntrack_info *ctinfo,
		 unsigned int hooknum)
132 133
{
	struct nf_conntrack_tuple innertuple, origtuple;
134 135
	const struct nf_conntrack_l4proto *innerproto;
	const struct nf_conntrack_tuple_hash *h;
136
	u16 zone = tmpl ? nf_ct_zone(tmpl) : NF_CT_DEFAULT_ZONE;
137 138 139

	NF_CT_ASSERT(skb->nfct == NULL);

140 141 142 143 144 145
	/* Are they talking about one of our connections? */
	if (!nf_ct_get_tuplepr(skb,
			       skb_network_offset(skb) + ip_hdrlen(skb)
						       + sizeof(struct icmphdr),
			       PF_INET, &origtuple)) {
		pr_debug("icmp_error_message: failed to get tuple\n");
146 147 148
		return -NF_ACCEPT;
	}

149
	/* rcu_read_lock()ed by nf_hook_slow */
150
	innerproto = __nf_ct_l4proto_find(PF_INET, origtuple.dst.protonum);
151

152 153 154
	/* Ordinarily, we'd expect the inverted tupleproto, but it's
	   been preserved inside the ICMP. */
	if (!nf_ct_invert_tuple(&innertuple, &origtuple,
155
				&nf_conntrack_l3proto_ipv4, innerproto)) {
156
		pr_debug("icmp_error_message: no match\n");
157 158 159 160 161
		return -NF_ACCEPT;
	}

	*ctinfo = IP_CT_RELATED;

162
	h = nf_conntrack_find_get(net, zone, &innertuple);
163
	if (!h) {
164 165
		pr_debug("icmp_error_message: no match\n");
		return -NF_ACCEPT;
166 167
	}

168 169 170
	if (NF_CT_DIRECTION(h) == IP_CT_DIR_REPLY)
		*ctinfo += IP_CT_IS_REPLY;

171 172 173
	/* Update skb to refer to this connection */
	skb->nfct = &nf_ct_tuplehash_to_ctrack(h)->ct_general;
	skb->nfctinfo = *ctinfo;
174
	return NF_ACCEPT;
175 176 177 178
}

/* Small and modified version of icmp_rcv */
static int
179 180
icmp_error(struct net *net, struct nf_conn *tmpl,
	   struct sk_buff *skb, unsigned int dataoff,
181
	   enum ip_conntrack_info *ctinfo, u_int8_t pf, unsigned int hooknum)
182
{
183 184
	const struct icmphdr *icmph;
	struct icmphdr _ih;
185 186

	/* Not enough header? */
187
	icmph = skb_header_pointer(skb, ip_hdrlen(skb), sizeof(_ih), &_ih);
188
	if (icmph == NULL) {
189
		if (LOG_INVALID(net, IPPROTO_ICMP))
190 191 192 193 194 195
			nf_log_packet(PF_INET, 0, skb, NULL, NULL, NULL,
				      "nf_ct_icmp: short packet ");
		return -NF_ACCEPT;
	}

	/* See ip_conntrack_proto_tcp.c */
196
	if (net->ct.sysctl_checksum && hooknum == NF_INET_PRE_ROUTING &&
197
	    nf_ip_checksum(skb, hooknum, dataoff, 0)) {
198
		if (LOG_INVALID(net, IPPROTO_ICMP))
199 200 201 202 203 204 205 206 207 208 209 210
			nf_log_packet(PF_INET, 0, skb, NULL, NULL, NULL,
				      "nf_ct_icmp: bad HW ICMP checksum ");
		return -NF_ACCEPT;
	}

	/*
	 *	18 is the highest 'known' ICMP type. Anything else is a mystery
	 *
	 *	RFC 1122: 3.2.2  Unknown ICMP messages types MUST be silently
	 *		  discarded.
	 */
	if (icmph->type > NR_ICMP_TYPES) {
211
		if (LOG_INVALID(net, IPPROTO_ICMP))
212 213 214 215 216 217
			nf_log_packet(PF_INET, 0, skb, NULL, NULL, NULL,
				      "nf_ct_icmp: invalid ICMP type ");
		return -NF_ACCEPT;
	}

	/* Need to track icmp error message? */
218 219 220 221 222
	if (icmph->type != ICMP_DEST_UNREACH &&
	    icmph->type != ICMP_SOURCE_QUENCH &&
	    icmph->type != ICMP_TIME_EXCEEDED &&
	    icmph->type != ICMP_PARAMETERPROB &&
	    icmph->type != ICMP_REDIRECT)
223 224
		return NF_ACCEPT;

225
	return icmp_error_message(net, tmpl, skb, ctinfo, hooknum);
226 227
}

228
#if defined(CONFIG_NF_CT_NETLINK) || defined(CONFIG_NF_CT_NETLINK_MODULE)
229 230 231 232

#include <linux/netfilter/nfnetlink.h>
#include <linux/netfilter/nfnetlink_conntrack.h>

233
static int icmp_tuple_to_nlattr(struct sk_buff *skb,
234 235
				const struct nf_conntrack_tuple *t)
{
236 237 238 239
	if (nla_put_be16(skb, CTA_PROTO_ICMP_ID, t->src.u.icmp.id) ||
	    nla_put_u8(skb, CTA_PROTO_ICMP_TYPE, t->dst.u.icmp.type) ||
	    nla_put_u8(skb, CTA_PROTO_ICMP_CODE, t->dst.u.icmp.code))
		goto nla_put_failure;
240 241
	return 0;

242
nla_put_failure:
243 244 245
	return -1;
}

246 247 248 249
/* Netlink attribute types accepted for the ICMP part of a tuple. */
static const struct nla_policy icmp_nla_policy[CTA_PROTO_MAX+1] = {
	[CTA_PROTO_ICMP_ID]	= { .type = NLA_U16 },
	[CTA_PROTO_ICMP_TYPE]	= { .type = NLA_U8 },
	[CTA_PROTO_ICMP_CODE]	= { .type = NLA_U8 },
};

252
static int icmp_nlattr_to_tuple(struct nlattr *tb[],
253 254
				struct nf_conntrack_tuple *tuple)
{
255 256 257
	if (!tb[CTA_PROTO_ICMP_TYPE] ||
	    !tb[CTA_PROTO_ICMP_CODE] ||
	    !tb[CTA_PROTO_ICMP_ID])
258 259
		return -EINVAL;

260 261 262
	tuple->dst.u.icmp.type = nla_get_u8(tb[CTA_PROTO_ICMP_TYPE]);
	tuple->dst.u.icmp.code = nla_get_u8(tb[CTA_PROTO_ICMP_CODE]);
	tuple->src.u.icmp.id = nla_get_be16(tb[CTA_PROTO_ICMP_ID]);
263

264 265
	if (tuple->dst.u.icmp.type >= sizeof(invmap) ||
	    !invmap[tuple->dst.u.icmp.type])
266 267 268 269
		return -EINVAL;

	return 0;
}
270 271 272 273 274

/* Return nla_policy_len() computed over every entry of icmp_nla_policy[]. */
static int icmp_nlattr_tuple_size(void)
{
	const int policy_entries = CTA_PROTO_MAX + 1;

	return nla_policy_len(icmp_nla_policy, policy_entries);
}
275 276
#endif

277 278 279 280 281
#if IS_ENABLED(CONFIG_NF_CT_NETLINK_TIMEOUT)

#include <linux/netfilter/nfnetlink.h>
#include <linux/netfilter/nfnetlink_cttimeout.h>

282 283
static int icmp_timeout_nlattr_to_obj(struct nlattr *tb[],
				      struct net *net, void *data)
284 285
{
	unsigned int *timeout = data;
286
	struct nf_icmp_net *in = icmp_pernet(net);
287 288 289 290 291 292

	if (tb[CTA_TIMEOUT_ICMP_TIMEOUT]) {
		*timeout =
			ntohl(nla_get_be32(tb[CTA_TIMEOUT_ICMP_TIMEOUT])) * HZ;
	} else {
		/* Set default ICMP timeout. */
293
		*timeout = in->timeout;
294 295 296 297 298 299 300 301 302
	}
	return 0;
}

static int
icmp_timeout_obj_to_nlattr(struct sk_buff *skb, const void *data)
{
	const unsigned int *timeout = data;

303 304
	if (nla_put_be32(skb, CTA_TIMEOUT_ICMP_TIMEOUT, htonl(*timeout / HZ)))
		goto nla_put_failure;
305 306 307 308 309 310 311 312 313 314 315 316
	return 0;

nla_put_failure:
	return -ENOSPC;
}

/* Netlink attribute policy for the ICMP timeout object: one u32 value. */
static const struct nla_policy
icmp_timeout_nla_policy[CTA_TIMEOUT_ICMP_MAX + 1] = {
	[CTA_TIMEOUT_ICMP_TIMEOUT] = {
		.type = NLA_U32,
	},
};
#endif /* CONFIG_NF_CT_NETLINK_TIMEOUT */

317 318 319 320 321 322
#ifdef CONFIG_SYSCTL
static struct ctl_table icmp_sysctl_table[] = {
	{
		.procname	= "nf_conntrack_icmp_timeout",
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
A
Alexey Dobriyan 已提交
323
		.proc_handler	= proc_dointvec_jiffies,
324
	},
325
	{ }
326
};
327 328 329 330 331 332
#ifdef CONFIG_NF_CONNTRACK_PROC_COMPAT
static struct ctl_table icmp_compat_sysctl_table[] = {
	{
		.procname	= "ip_conntrack_icmp_timeout",
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
A
Alexey Dobriyan 已提交
333
		.proc_handler	= proc_dointvec_jiffies,
334
	},
335
	{ }
336 337
};
#endif /* CONFIG_NF_CONNTRACK_PROC_COMPAT */
338 339
#endif /* CONFIG_SYSCTL */

340
/*
 * Initialise the ICMP conntrack state of network namespace @net.
 *
 * The per-namespace timeout is seeded from nf_ct_icmp_timeout.  With
 * CONFIG_SYSCTL, private copies of the sysctl table(s) are allocated and
 * their first entry is pointed at that timeout.
 *
 * Returns 0 on success or -ENOMEM when a table copy cannot be allocated;
 * in the latter case no table copy is left allocated.  @proto is not
 * used here.
 */
static int icmp_init_net(struct net *net, u_int16_t proto)
{
	struct nf_icmp_net *icmp_net = icmp_pernet(net);
	/*
	 * NOTE(review): this cast presumably relies on struct nf_proto_net
	 * being the first member of struct nf_icmp_net - confirm against
	 * the struct definition.
	 */
	struct nf_proto_net *proto_net = (struct nf_proto_net *)icmp_net;

	icmp_net->timeout = nf_ct_icmp_timeout;

#ifdef CONFIG_SYSCTL
	proto_net->ctl_table = kmemdup(icmp_sysctl_table,
				       sizeof(icmp_sysctl_table),
				       GFP_KERNEL);
	if (proto_net->ctl_table == NULL)
		return -ENOMEM;
	proto_net->ctl_table[0].data = &icmp_net->timeout;

#ifdef CONFIG_NF_CONNTRACK_PROC_COMPAT
	proto_net->ctl_compat_table = kmemdup(icmp_compat_sysctl_table,
					      sizeof(icmp_compat_sysctl_table),
					      GFP_KERNEL);
	if (proto_net->ctl_compat_table == NULL) {
		/* Undo the first allocation so nothing is leaked. */
		kfree(proto_net->ctl_table);
		proto_net->ctl_table = NULL;
		return -ENOMEM;
	}
	proto_net->ctl_compat_table[0].data = &icmp_net->timeout;
#endif /* CONFIG_NF_CONNTRACK_PROC_COMPAT */
#endif /* CONFIG_SYSCTL */

	return 0;
}

368
/*
 * Layer-4 conntrack protocol descriptor for ICMP over PF_INET.  It wires
 * the handlers defined in this file into the generic conntrack core; the
 * netlink and timeout-netlink callbacks are only present when the
 * corresponding config options are enabled.
 */
struct nf_conntrack_l4proto nf_conntrack_l4proto_icmp __read_mostly = {
	/* Identity */
	.l3proto		= PF_INET,
	.l4proto		= IPPROTO_ICMP,
	.name			= "icmp",

	/* Tuple handling */
	.pkt_to_tuple		= icmp_pkt_to_tuple,
	.invert_tuple		= icmp_invert_tuple,
	.print_tuple		= icmp_print_tuple,

	/* Packet processing */
	.packet			= icmp_packet,
	.get_timeouts		= icmp_get_timeouts,
	.new			= icmp_new,
	.error			= icmp_error,
	.destroy		= NULL,
	.me			= NULL,

#if defined(CONFIG_NF_CT_NETLINK) || defined(CONFIG_NF_CT_NETLINK_MODULE)
	.tuple_to_nlattr	= icmp_tuple_to_nlattr,
	.nlattr_tuple_size	= icmp_nlattr_tuple_size,
	.nlattr_to_tuple	= icmp_nlattr_to_tuple,
	.nla_policy		= icmp_nla_policy,
#endif

#if IS_ENABLED(CONFIG_NF_CT_NETLINK_TIMEOUT)
	.ctnl_timeout		= {
		.nlattr_to_obj	= icmp_timeout_nlattr_to_obj,
		.obj_to_nlattr	= icmp_timeout_obj_to_nlattr,
		.nlattr_max	= CTA_TIMEOUT_ICMP_MAX,
		.obj_size	= sizeof(unsigned int),
		.nla_policy	= icmp_timeout_nla_policy,
	},
#endif /* CONFIG_NF_CT_NETLINK_TIMEOUT */

	.init_net		= icmp_init_net,
};