offload.c 8.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49
/*
 * Copyright (C) 2016 Netronome Systems, Inc.
 *
 * This software is dual licensed under the GNU General Public License Version 2,
 * June 1991 as shown in the file COPYING in the top-level directory of this
 * source tree or the BSD 2-Clause License provided below.  You have the
 * option to license this software under the complete terms of either license.
 *
 * The BSD 2-Clause License:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      1. Redistributions of source code must retain the above
 *         copyright notice, this list of conditions and the following
 *         disclaimer.
 *
 *      2. Redistributions in binary form must reproduce the above
 *         copyright notice, this list of conditions and the following
 *         disclaimer in the documentation and/or other materials
 *         provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

/*
 * nfp_net_offload.c
 * Netronome network device driver: TC offload functions for PF and VF
 */

#include <linux/kernel.h>
#include <linux/netdevice.h>
#include <linux/pci.h>
#include <linux/jiffies.h>
#include <linux/timer.h>
#include <linux/list.h>

#include <net/pkt_cls.h>
#include <net/tc_act/tc_gact.h>
#include <net/tc_act/tc_mirred.h>

50 51 52
#include "main.h"
#include "../nfp_net_ctrl.h"
#include "../nfp_net.h"
53

54 55 56
void nfp_net_filter_stats_timer(unsigned long data)
{
	struct nfp_net *nn = (void *)data;
57
	struct nfp_net_bpf_priv *priv;
58 59
	struct nfp_stat_pair latest;

60 61 62
	priv = nn->app_priv;

	spin_lock_bh(&priv->rx_filter_lock);
63

64
	if (nn->dp.ctrl & NFP_NET_CFG_CTRL_BPF)
65
		mod_timer(&priv->rx_filter_stats_timer,
66 67
			  jiffies + NFP_NET_STAT_POLL_IVL);

68
	spin_unlock_bh(&priv->rx_filter_lock);
69 70 71 72

	latest.pkts = nn_readq(nn, NFP_NET_CFG_STATS_APP1_FRAMES);
	latest.bytes = nn_readq(nn, NFP_NET_CFG_STATS_APP1_BYTES);

73 74
	if (latest.pkts != priv->rx_filter.pkts)
		priv->rx_filter_change = jiffies;
75

76
	priv->rx_filter = latest;
77 78 79 80
}

static void nfp_net_bpf_stats_reset(struct nfp_net *nn)
{
81 82 83 84 85 86
	struct nfp_net_bpf_priv *priv = nn->app_priv;

	priv->rx_filter.pkts = nn_readq(nn, NFP_NET_CFG_STATS_APP1_FRAMES);
	priv->rx_filter.bytes = nn_readq(nn, NFP_NET_CFG_STATS_APP1_BYTES);
	priv->rx_filter_prev = priv->rx_filter;
	priv->rx_filter_change = jiffies;
87 88 89 90 91
}

static int
nfp_net_bpf_stats_update(struct nfp_net *nn, struct tc_cls_bpf_offload *cls_bpf)
{
92
	struct nfp_net_bpf_priv *priv = nn->app_priv;
93 94
	u64 bytes, pkts;

95 96
	pkts = priv->rx_filter.pkts - priv->rx_filter_prev.pkts;
	bytes = priv->rx_filter.bytes - priv->rx_filter_prev.bytes;
97 98
	bytes -= pkts * ETH_HLEN;

99
	priv->rx_filter_prev = priv->rx_filter;
100

101
	tcf_exts_stats_update(cls_bpf->exts,
102
			      bytes, pkts, priv->rx_filter_change);
103 104 105 106

	return 0;
}

107 108 109 110 111 112
static int
nfp_net_bpf_get_act(struct nfp_net *nn, struct tc_cls_bpf_offload *cls_bpf)
{
	const struct tc_action *a;
	LIST_HEAD(actions);

113 114 115
	if (!cls_bpf->exts)
		return NN_ACT_XDP;

116
	/* TC direct action */
117
	if (cls_bpf->exts_integrated) {
118
		if (!tcf_exts_has_actions(cls_bpf->exts))
119 120
			return NN_ACT_DIRECT;

121
		return -EOPNOTSUPP;
122
	}
123 124

	/* TC legacy mode */
125
	if (!tcf_exts_has_one_action(cls_bpf->exts))
126
		return -EOPNOTSUPP;
127 128 129 130 131

	tcf_exts_to_list(cls_bpf->exts, &actions);
	list_for_each_entry(a, &actions, list) {
		if (is_tcf_gact_shot(a))
			return NN_ACT_TC_DROP;
132

133
		if (is_tcf_mirred_egress_redirect(a) &&
134
		    tcf_mirred_ifindex(a) == nn->dp.netdev->ifindex)
135
			return NN_ACT_TC_REDIR;
136 137
	}

138
	return -EOPNOTSUPP;
139 140 141 142 143 144 145 146 147 148 149 150 151 152
}

/* Validate an offload request and JIT the program into a DMA buffer.
 * @nn:		NFP Net device the program is being offloaded to
 * @cls_bpf:	offload request carrying the program
 * @res:	filled in by nfp_bpf_jit()
 * @code:	on success points at the coherent buffer holding the image
 * @dma_addr:	on success holds the DMA address of that buffer
 * @max_instr:	maximum number of instructions; the buffer is sized as
 *		@max_instr * sizeof(u64)
 *
 * On success the caller owns the buffer and has to release it with
 * dma_free_coherent() using the same size.  If the JIT fails the buffer is
 * freed here.
 *
 * Return: 0 on success, -EOPNOTSUPP for unsupported configurations, -ENOMEM
 * when the buffer cannot be allocated, or the error from nfp_bpf_jit().
 */
static int
nfp_net_bpf_offload_prepare(struct nfp_net *nn,
			    struct tc_cls_bpf_offload *cls_bpf,
			    struct nfp_bpf_result *res,
			    void **code, dma_addr_t *dma_addr, u16 max_instr)
{
	unsigned int buf_len = max_instr * sizeof(u64);
	enum nfp_bpf_action_type act_type;
	u16 prog_start, prog_done;
	unsigned int mtu_limit;
	int err;

	if (!IS_ENABLED(CONFIG_BPF_SYSCALL))
		return -EOPNOTSUPP;

	err = nfp_net_bpf_get_act(nn, cls_bpf);
	if (err < 0)
		return err;
	act_type = err;

	/* NOTE(review): a register value of 0 makes this expression wrap to
	 * a very large unsigned number, so the check below would pass -
	 * confirm the FW never reports 0 here.
	 */
	mtu_limit = nn_readb(nn, NFP_NET_CFG_BPF_INL_MTU) * 64 - 32;
	if (mtu_limit < nn->dp.netdev->mtu) {
		nn_info(nn, "BPF offload not supported with MTU larger than HW packet split boundary\n");
		return -EOPNOTSUPP;
	}

	prog_start = nn_readw(nn, NFP_NET_CFG_BPF_START);
	prog_done = nn_readw(nn, NFP_NET_CFG_BPF_DONE);

	*code = dma_zalloc_coherent(nn->dp.dev, buf_len, dma_addr, GFP_KERNEL);
	if (!*code)
		return -ENOMEM;

	err = nfp_bpf_jit(cls_bpf->prog, *code, act_type, prog_start,
			  prog_done, max_instr, res);
	/* Nobody will use the buffer if translation failed, drop it */
	if (err)
		dma_free_coherent(nn->dp.dev, buf_len, *code, *dma_addr);

	return err;
}

/* Hand a JITed program to the firmware and enable BPF processing.
 * @nn:		NFP Net device to load the program on
 * @tc_flags:	TC classifier flags; TCA_CLS_FLAGS_SKIP_SW is recorded in
 *		nn->dp.bpf_offload_skip_sw
 * @code:	coherent buffer holding the program image
 * @dma_addr:	DMA address of @code
 * @code_sz:	size of the buffer in bytes, used when freeing it
 * @n_instr:	number of instructions, written to NFP_NET_CFG_BPF_SIZE
 * @dense_mode:	when true NFP_NET_CFG_BPF_CFG_8CTX is ORed into the address
 *		given to the firmware
 *
 * The buffer is always freed before returning.  Firmware command failures
 * are only logged - the function returns void and carries on regardless.
 * Finally the statistics are re-baselined and the stats timer is armed.
 */
static void
nfp_net_bpf_load_and_start(struct nfp_net *nn, u32 tc_flags,
			   void *code, dma_addr_t dma_addr,
			   unsigned int code_sz, unsigned int n_instr,
			   bool dense_mode)
{
	struct nfp_net_bpf_priv *priv = nn->app_priv;
	u64 fw_addr = dma_addr;
	int rc;

	nn->dp.bpf_offload_skip_sw = (tc_flags & TCA_CLS_FLAGS_SKIP_SW) != 0;

	if (dense_mode)
		fw_addr |= NFP_NET_CFG_BPF_CFG_8CTX;

	nn_writew(nn, NFP_NET_CFG_BPF_SIZE, n_instr);
	nn_writeq(nn, NFP_NET_CFG_BPF_ADDR, fw_addr);

	/* Step 1: have the firmware load the JITed image */
	rc = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_BPF);
	if (rc)
		nn_err(nn, "FW command error while loading BPF: %d\n", rc);

	/* Step 2: start passing packets through the BPF function */
	nn->dp.ctrl |= NFP_NET_CFG_CTRL_BPF;
	nn_writel(nn, NFP_NET_CFG_CTRL, nn->dp.ctrl);
	rc = nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_GEN);
	if (rc)
		nn_err(nn, "FW command error while enabling BPF: %d\n", rc);

	/* The host copy of the image is released once both commands ran */
	dma_free_coherent(nn->dp.dev, code_sz, code, dma_addr);

	nfp_net_bpf_stats_reset(nn);
	mod_timer(&priv->rx_filter_stats_timer,
		  jiffies + NFP_NET_STAT_POLL_IVL);
}

static int nfp_net_bpf_stop(struct nfp_net *nn)
{
225 226
	struct nfp_net_bpf_priv *priv = nn->app_priv;

227
	if (!(nn->dp.ctrl & NFP_NET_CFG_CTRL_BPF))
228 229
		return 0;

230
	spin_lock_bh(&priv->rx_filter_lock);
231
	nn->dp.ctrl &= ~NFP_NET_CFG_CTRL_BPF;
232
	spin_unlock_bh(&priv->rx_filter_lock);
233
	nn_writel(nn, NFP_NET_CFG_CTRL, nn->dp.ctrl);
234

235
	del_timer_sync(&priv->rx_filter_stats_timer);
236
	nn->dp.bpf_offload_skip_sw = 0;
237 238 239 240

	return nfp_net_reconfig(nn, NFP_NET_CFG_UPDATE_GEN);
}

241
int nfp_net_bpf_offload(struct nfp_net *nn, struct tc_cls_bpf_offload *cls_bpf)
242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259
{
	struct nfp_bpf_result res;
	dma_addr_t dma_addr;
	u16 max_instr;
	void *code;
	int err;

	max_instr = nn_readw(nn, NFP_NET_CFG_BPF_MAX_LEN);

	switch (cls_bpf->command) {
	case TC_CLSBPF_REPLACE:
		/* There is nothing stopping us from implementing seamless
		 * replace but the simple method of loading I adopted in
		 * the firmware does not handle atomic replace (i.e. we have to
		 * stop the BPF offload and re-enable it).  Leaking-in a few
		 * frames which didn't have BPF applied in the hardware should
		 * be fine if software fallback is available, though.
		 */
260
		if (nn->dp.bpf_offload_skip_sw)
261 262 263 264 265 266 267 268 269 270 271 272 273 274
			return -EBUSY;

		err = nfp_net_bpf_offload_prepare(nn, cls_bpf, &res, &code,
						  &dma_addr, max_instr);
		if (err)
			return err;

		nfp_net_bpf_stop(nn);
		nfp_net_bpf_load_and_start(nn, cls_bpf->gen_flags, code,
					   dma_addr, max_instr * sizeof(u64),
					   res.n_instr, res.dense_mode);
		return 0;

	case TC_CLSBPF_ADD:
275
		if (nn->dp.ctrl & NFP_NET_CFG_CTRL_BPF)
276 277 278 279 280 281 282 283 284 285 286 287 288 289 290
			return -EBUSY;

		err = nfp_net_bpf_offload_prepare(nn, cls_bpf, &res, &code,
						  &dma_addr, max_instr);
		if (err)
			return err;

		nfp_net_bpf_load_and_start(nn, cls_bpf->gen_flags, code,
					   dma_addr, max_instr * sizeof(u64),
					   res.n_instr, res.dense_mode);
		return 0;

	case TC_CLSBPF_DESTROY:
		return nfp_net_bpf_stop(nn);

291 292 293
	case TC_CLSBPF_STATS:
		return nfp_net_bpf_stats_update(nn, cls_bpf);

294
	default:
295
		return -EOPNOTSUPP;
296 297
	}
}