nf_conntrack_proto_icmp.c 10.8 KB
Newer Older
1 2
/* (C) 1999-2001 Paul `Rusty' Russell
 * (C) 2002-2004 Netfilter Core Team <coreteam@netfilter.org>
 * (C) 2006-2010 Patrick McHardy <kaber@trash.net>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */

#include <linux/types.h>
#include <linux/timer.h>
#include <linux/netfilter.h>
#include <linux/in.h>
#include <linux/icmp.h>
#include <linux/seq_file.h>
#include <net/ip.h>
#include <net/checksum.h>
#include <linux/netfilter_ipv4.h>
#include <net/netfilter/nf_conntrack_tuple.h>
20
#include <net/netfilter/nf_conntrack_l4proto.h>
21
#include <net/netfilter/nf_conntrack_core.h>
22
#include <net/netfilter/nf_conntrack_zones.h>
23
#include <net/netfilter/nf_log.h>
24

25
/* Initial value copied into each namespace's ICMP timeout by icmp_init_net(). */
static unsigned int nf_ct_icmp_timeout __read_mostly = 30 * HZ;
26

27 28 29 30 31
/* Return the ICMP conntrack state embedded in @net. */
static inline struct nf_icmp_net *icmp_pernet(struct net *net)
{
	struct nf_icmp_net *in = &net->ct.nf_ct_proto.icmp;

	return in;
}

32
static bool icmp_pkt_to_tuple(const struct sk_buff *skb, unsigned int dataoff,
33
			      struct net *net, struct nf_conntrack_tuple *tuple)
34
{
35 36
	const struct icmphdr *hp;
	struct icmphdr _hdr;
37 38 39

	hp = skb_header_pointer(skb, dataoff, sizeof(_hdr), &_hdr);
	if (hp == NULL)
40
		return false;
41 42 43 44 45

	tuple->dst.u.icmp.type = hp->type;
	tuple->src.u.icmp.id = hp->un.echo.id;
	tuple->dst.u.icmp.code = hp->code;

46
	return true;
47 48
}

49 50 51 52 53 54 55 56 57 58 59 60
/*
 * Maps an ICMP type to its counterpart type, stored as (counterpart + 1).
 * Slots without an initializer are 0, which users of the table treat as
 * "no counterpart".
 */
static const u_int8_t invmap[] = {
	/* request -> reply */
	[ICMP_ECHO]		= ICMP_ECHOREPLY + 1,
	[ICMP_TIMESTAMP]	= ICMP_TIMESTAMPREPLY + 1,
	[ICMP_INFO_REQUEST]	= ICMP_INFO_REPLY + 1,
	[ICMP_ADDRESS]		= ICMP_ADDRESSREPLY + 1,
	/* reply -> request */
	[ICMP_ECHOREPLY]	= ICMP_ECHO + 1,
	[ICMP_TIMESTAMPREPLY]	= ICMP_TIMESTAMP + 1,
	[ICMP_INFO_REPLY]	= ICMP_INFO_REQUEST + 1,
	[ICMP_ADDRESSREPLY]	= ICMP_ADDRESS + 1,
};

61 62
static bool icmp_invert_tuple(struct nf_conntrack_tuple *tuple,
			      const struct nf_conntrack_tuple *orig)
63
{
64 65
	if (orig->dst.u.icmp.type >= sizeof(invmap) ||
	    !invmap[orig->dst.u.icmp.type])
66
		return false;
67 68 69 70

	tuple->src.u.icmp.id = orig->src.u.icmp.id;
	tuple->dst.u.icmp.type = invmap[orig->dst.u.icmp.type] - 1;
	tuple->dst.u.icmp.code = orig->dst.u.icmp.code;
71
	return true;
72 73 74
}

/* Print out the per-protocol part of the tuple. */
75
static void icmp_print_tuple(struct seq_file *s,
76 77
			    const struct nf_conntrack_tuple *tuple)
{
78 79 80 81
	seq_printf(s, "type=%u code=%u id=%u ",
		   tuple->dst.u.icmp.type,
		   tuple->dst.u.icmp.code,
		   ntohs(tuple->src.u.icmp.id));
82 83
}

84 85
static unsigned int *icmp_get_timeouts(struct net *net)
{
86
	return &icmp_pernet(net)->timeout;
87 88
}

89 90 91 92 93
/* Returns verdict for packet, or -1 for invalid. */
static int icmp_packet(struct nf_conn *ct,
		       const struct sk_buff *skb,
		       unsigned int dataoff,
		       enum ip_conntrack_info ctinfo,
94
		       u_int8_t pf,
95 96
		       unsigned int hooknum,
		       unsigned int *timeout)
97
{
98 99 100
	/* Do not immediately delete the connection after the first
	   successful reply to avoid excessive conntrackd traffic
	   and also to handle correctly ICMP echo reply duplicates. */
101
	nf_ct_refresh_acct(ct, ctinfo, skb, *timeout);
102 103 104 105 106

	return NF_ACCEPT;
}

/* Called when a new connection for this protocol found. */
107
static bool icmp_new(struct nf_conn *ct, const struct sk_buff *skb,
108
		     unsigned int dataoff, unsigned int *timeouts)
109
{
110 111 112 113 114 115
	static const u_int8_t valid_new[] = {
		[ICMP_ECHO] = 1,
		[ICMP_TIMESTAMP] = 1,
		[ICMP_INFO_REQUEST] = 1,
		[ICMP_ADDRESS] = 1
	};
116

117 118
	if (ct->tuplehash[0].tuple.dst.u.icmp.type >= sizeof(valid_new) ||
	    !valid_new[ct->tuplehash[0].tuple.dst.u.icmp.type]) {
119
		/* Can't create a new ICMP `conn' with this. */
120
		pr_debug("icmp: can't create new conn with type %u\n",
121
			 ct->tuplehash[0].tuple.dst.u.icmp.type);
122
		nf_ct_dump_tuple_ip(&ct->tuplehash[0].tuple);
123
		return false;
124
	}
125
	return true;
126 127 128 129
}

/* Returns conntrack if it dealt with ICMP, and filled in skb fields */
static int
130
icmp_error_message(struct net *net, struct nf_conn *tmpl, struct sk_buff *skb,
131 132
		 enum ip_conntrack_info *ctinfo,
		 unsigned int hooknum)
133 134
{
	struct nf_conntrack_tuple innertuple, origtuple;
135 136
	const struct nf_conntrack_l4proto *innerproto;
	const struct nf_conntrack_tuple_hash *h;
137
	const struct nf_conntrack_zone *zone;
138
	struct nf_conntrack_zone tmp;
139 140

	NF_CT_ASSERT(skb->nfct == NULL);
141
	zone = nf_ct_zone_tmpl(tmpl, skb, &tmp);
142

143 144 145 146
	/* Are they talking about one of our connections? */
	if (!nf_ct_get_tuplepr(skb,
			       skb_network_offset(skb) + ip_hdrlen(skb)
						       + sizeof(struct icmphdr),
147
			       PF_INET, net, &origtuple)) {
148
		pr_debug("icmp_error_message: failed to get tuple\n");
149 150 151
		return -NF_ACCEPT;
	}

152
	/* rcu_read_lock()ed by nf_hook_slow */
153
	innerproto = __nf_ct_l4proto_find(PF_INET, origtuple.dst.protonum);
154

155 156 157
	/* Ordinarily, we'd expect the inverted tupleproto, but it's
	   been preserved inside the ICMP. */
	if (!nf_ct_invert_tuple(&innertuple, &origtuple,
158
				&nf_conntrack_l3proto_ipv4, innerproto)) {
159
		pr_debug("icmp_error_message: no match\n");
160 161 162 163 164
		return -NF_ACCEPT;
	}

	*ctinfo = IP_CT_RELATED;

165
	h = nf_conntrack_find_get(net, zone, &innertuple);
166
	if (!h) {
167 168
		pr_debug("icmp_error_message: no match\n");
		return -NF_ACCEPT;
169 170
	}

171 172 173
	if (NF_CT_DIRECTION(h) == IP_CT_DIR_REPLY)
		*ctinfo += IP_CT_IS_REPLY;

174 175 176
	/* Update skb to refer to this connection */
	skb->nfct = &nf_ct_tuplehash_to_ctrack(h)->ct_general;
	skb->nfctinfo = *ctinfo;
177
	return NF_ACCEPT;
178 179 180 181
}

/* Small and modified version of icmp_rcv */
static int
182 183
icmp_error(struct net *net, struct nf_conn *tmpl,
	   struct sk_buff *skb, unsigned int dataoff,
184
	   enum ip_conntrack_info *ctinfo, u_int8_t pf, unsigned int hooknum)
185
{
186 187
	const struct icmphdr *icmph;
	struct icmphdr _ih;
188 189

	/* Not enough header? */
190
	icmph = skb_header_pointer(skb, ip_hdrlen(skb), sizeof(_ih), &_ih);
191
	if (icmph == NULL) {
192
		if (LOG_INVALID(net, IPPROTO_ICMP))
193 194
			nf_log_packet(net, PF_INET, 0, skb, NULL, NULL,
				      NULL, "nf_ct_icmp: short packet ");
195 196 197 198
		return -NF_ACCEPT;
	}

	/* See ip_conntrack_proto_tcp.c */
199
	if (net->ct.sysctl_checksum && hooknum == NF_INET_PRE_ROUTING &&
200
	    nf_ip_checksum(skb, hooknum, dataoff, 0)) {
201
		if (LOG_INVALID(net, IPPROTO_ICMP))
202
			nf_log_packet(net, PF_INET, 0, skb, NULL, NULL, NULL,
203 204 205 206 207 208 209 210 211 212 213
				      "nf_ct_icmp: bad HW ICMP checksum ");
		return -NF_ACCEPT;
	}

	/*
	 *	18 is the highest 'known' ICMP type. Anything else is a mystery
	 *
	 *	RFC 1122: 3.2.2  Unknown ICMP messages types MUST be silently
	 *		  discarded.
	 */
	if (icmph->type > NR_ICMP_TYPES) {
214
		if (LOG_INVALID(net, IPPROTO_ICMP))
215
			nf_log_packet(net, PF_INET, 0, skb, NULL, NULL, NULL,
216 217 218 219 220
				      "nf_ct_icmp: invalid ICMP type ");
		return -NF_ACCEPT;
	}

	/* Need to track icmp error message? */
221 222 223 224 225
	if (icmph->type != ICMP_DEST_UNREACH &&
	    icmph->type != ICMP_SOURCE_QUENCH &&
	    icmph->type != ICMP_TIME_EXCEEDED &&
	    icmph->type != ICMP_PARAMETERPROB &&
	    icmph->type != ICMP_REDIRECT)
226 227
		return NF_ACCEPT;

228
	return icmp_error_message(net, tmpl, skb, ctinfo, hooknum);
229 230
}

D
Duan Jiong 已提交
231
#if IS_ENABLED(CONFIG_NF_CT_NETLINK)
232 233 234 235

#include <linux/netfilter/nfnetlink.h>
#include <linux/netfilter/nfnetlink_conntrack.h>

236
static int icmp_tuple_to_nlattr(struct sk_buff *skb,
237 238
				const struct nf_conntrack_tuple *t)
{
239 240 241 242
	if (nla_put_be16(skb, CTA_PROTO_ICMP_ID, t->src.u.icmp.id) ||
	    nla_put_u8(skb, CTA_PROTO_ICMP_TYPE, t->dst.u.icmp.type) ||
	    nla_put_u8(skb, CTA_PROTO_ICMP_CODE, t->dst.u.icmp.code))
		goto nla_put_failure;
243 244
	return 0;

245
nla_put_failure:
246 247 248
	return -1;
}

249 250 251 252
/* Netlink attribute types for the ICMP part of a conntrack tuple. */
static const struct nla_policy icmp_nla_policy[CTA_PROTO_MAX + 1] = {
	[CTA_PROTO_ICMP_ID]	= { .type = NLA_U16 },
	[CTA_PROTO_ICMP_TYPE]	= { .type = NLA_U8 },
	[CTA_PROTO_ICMP_CODE]	= { .type = NLA_U8 },
};

255
static int icmp_nlattr_to_tuple(struct nlattr *tb[],
256 257
				struct nf_conntrack_tuple *tuple)
{
258 259 260
	if (!tb[CTA_PROTO_ICMP_TYPE] ||
	    !tb[CTA_PROTO_ICMP_CODE] ||
	    !tb[CTA_PROTO_ICMP_ID])
261 262
		return -EINVAL;

263 264 265
	tuple->dst.u.icmp.type = nla_get_u8(tb[CTA_PROTO_ICMP_TYPE]);
	tuple->dst.u.icmp.code = nla_get_u8(tb[CTA_PROTO_ICMP_CODE]);
	tuple->src.u.icmp.id = nla_get_be16(tb[CTA_PROTO_ICMP_ID]);
266

267 268
	if (tuple->dst.u.icmp.type >= sizeof(invmap) ||
	    !invmap[tuple->dst.u.icmp.type])
269 270 271 272
		return -EINVAL;

	return 0;
}
273 274 275 276 277

/* Return nla_policy_len() of icmp_nla_policy over all CTA_PROTO_* slots. */
static int icmp_nlattr_tuple_size(void)
{
	const int nr_attrs = CTA_PROTO_MAX + 1;

	return nla_policy_len(icmp_nla_policy, nr_attrs);
}
278 279
#endif

280 281 282 283 284
#if IS_ENABLED(CONFIG_NF_CT_NETLINK_TIMEOUT)

#include <linux/netfilter/nfnetlink.h>
#include <linux/netfilter/nfnetlink_cttimeout.h>

285 286
static int icmp_timeout_nlattr_to_obj(struct nlattr *tb[],
				      struct net *net, void *data)
287 288
{
	unsigned int *timeout = data;
289
	struct nf_icmp_net *in = icmp_pernet(net);
290 291 292 293 294 295

	if (tb[CTA_TIMEOUT_ICMP_TIMEOUT]) {
		*timeout =
			ntohl(nla_get_be32(tb[CTA_TIMEOUT_ICMP_TIMEOUT])) * HZ;
	} else {
		/* Set default ICMP timeout. */
296
		*timeout = in->timeout;
297 298 299 300 301 302 303 304 305
	}
	return 0;
}

static int
icmp_timeout_obj_to_nlattr(struct sk_buff *skb, const void *data)
{
	const unsigned int *timeout = data;

306 307
	if (nla_put_be32(skb, CTA_TIMEOUT_ICMP_TIMEOUT, htonl(*timeout / HZ)))
		goto nla_put_failure;
308 309 310 311 312 313 314 315 316 317 318 319
	return 0;

nla_put_failure:
	return -ENOSPC;
}

/* Netlink attribute type for the single ICMP timeout attribute. */
static const struct nla_policy
icmp_timeout_nla_policy[CTA_TIMEOUT_ICMP_MAX + 1] = {
	[CTA_TIMEOUT_ICMP_TIMEOUT] = { .type = NLA_U32 },
};
#endif /* CONFIG_NF_CT_NETLINK_TIMEOUT */

320 321 322 323 324 325
#ifdef CONFIG_SYSCTL
static struct ctl_table icmp_sysctl_table[] = {
	{
		.procname	= "nf_conntrack_icmp_timeout",
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
A
Alexey Dobriyan 已提交
326
		.proc_handler	= proc_dointvec_jiffies,
327
	},
328
	{ }
329 330 331
};
#endif /* CONFIG_SYSCTL */

332 333
/*
 * With CONFIG_SYSCTL, duplicate icmp_sysctl_table into @pn->ctl_table and
 * point its first entry at @in->timeout.  Returns -ENOMEM when the copy
 * cannot be allocated, 0 otherwise (including when CONFIG_SYSCTL is off).
 */
static int icmp_kmemdup_sysctl_table(struct nf_proto_net *pn,
				     struct nf_icmp_net *in)
{
#ifdef CONFIG_SYSCTL
	struct ctl_table *table;

	table = kmemdup(icmp_sysctl_table, sizeof(icmp_sysctl_table),
			GFP_KERNEL);
	/* Stored before the check so a failed copy leaves NULL behind. */
	pn->ctl_table = table;
	if (table == NULL)
		return -ENOMEM;

	table[0].data = &in->timeout;
#endif
	return 0;
}

/*
 * Initialise the ICMP conntrack state of @net: seed the timeout from
 * nf_ct_icmp_timeout, then set up the sysctl table copy.  Returns the
 * result of icmp_kmemdup_sysctl_table().  @proto is not used.
 */
static int icmp_init_net(struct net *net, u_int16_t proto)
{
	struct nf_icmp_net *in = &net->ct.nf_ct_proto.icmp;

	in->timeout = nf_ct_icmp_timeout;

	return icmp_kmemdup_sysctl_table(&in->pn, in);
}

357 358 359 360 361
static struct nf_proto_net *icmp_get_net_proto(struct net *net)
{
	return &net->ct.nf_ct_proto.icmp.pn;
}

362
/* L4 protocol descriptor wiring the ICMP handlers of this file together. */
struct nf_conntrack_l4proto nf_conntrack_l4proto_icmp __read_mostly =
{
	/* Identification */
	.l3proto		= PF_INET,
	.l4proto		= IPPROTO_ICMP,
	.name			= "icmp",

	/* Tuple handling and packet processing */
	.pkt_to_tuple		= icmp_pkt_to_tuple,
	.invert_tuple		= icmp_invert_tuple,
	.print_tuple		= icmp_print_tuple,
	.packet			= icmp_packet,
	.get_timeouts		= icmp_get_timeouts,
	.new			= icmp_new,
	.error			= icmp_error,
	.destroy		= NULL,
	.me			= NULL,

#if IS_ENABLED(CONFIG_NF_CT_NETLINK)
	/* Netlink (de)serialisation of the ICMP tuple part */
	.tuple_to_nlattr	= icmp_tuple_to_nlattr,
	.nlattr_tuple_size	= icmp_nlattr_tuple_size,
	.nlattr_to_tuple	= icmp_nlattr_to_tuple,
	.nla_policy		= icmp_nla_policy,
#endif

#if IS_ENABLED(CONFIG_NF_CT_NETLINK_TIMEOUT)
	/* Netlink (de)serialisation of the timeout object */
	.ctnl_timeout		= {
		.nlattr_to_obj	= icmp_timeout_nlattr_to_obj,
		.obj_to_nlattr	= icmp_timeout_obj_to_nlattr,
		.nlattr_max	= CTA_TIMEOUT_ICMP_MAX,
		.obj_size	= sizeof(unsigned int),
		.nla_policy	= icmp_timeout_nla_policy,
	},
#endif /* CONFIG_NF_CT_NETLINK_TIMEOUT */

	/* Per-namespace setup */
	.init_net		= icmp_init_net,
	.get_net_proto		= icmp_get_net_proto,
};