/*
 * Intel I/OAT DMA Linux driver
 * Copyright(c) 2004 - 2009 Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * The full GNU General Public License is included in this distribution in
 * the file called "COPYING".
 *
 */

/*
 * This driver supports an Intel I/OAT DMA engine, which does asynchronous
 * copy operations.
 */

#include <linux/init.h>
#include <linux/module.h>
30
#include <linux/slab.h>
31 32 33 34
#include <linux/pci.h>
#include <linux/interrupt.h>
#include <linux/dmaengine.h>
#include <linux/delay.h>
35
#include <linux/dma-mapping.h>
36
#include <linux/workqueue.h>
37
#include <linux/prefetch.h>
38
#include <linux/i7300_idle.h>
D
Dan Williams 已提交
39 40 41
#include "dma.h"
#include "registers.h"
#include "hw.h"
42

43 44
#include "../dmaengine.h"

45
int ioat_pending_level = 4;
46 47 48 49
module_param(ioat_pending_level, int, 0644);
MODULE_PARM_DESC(ioat_pending_level,
		 "high-water mark for pushing ioat descriptors (default: 4)");

/* forward declarations of helpers that are defined further down */
static void ioat1_cleanup(struct ioat_dma_chan *ioat);
static void ioat1_dma_start_null_desc(struct ioat_dma_chan *ioat);

/**
 * ioat_dma_do_interrupt - handler used for single vector interrupt mode
 * @irq: interrupt id
 * @data: interrupt data
 */
static irqreturn_t ioat_dma_do_interrupt(int irq, void *data)
{
	struct ioatdma_device *instance = data;
62
	struct ioat_chan_common *chan;
63 64 65 66 67 68 69 70 71 72 73 74 75 76 77
	unsigned long attnstatus;
	int bit;
	u8 intrctrl;

	intrctrl = readb(instance->reg_base + IOAT_INTRCTRL_OFFSET);

	if (!(intrctrl & IOAT_INTRCTRL_MASTER_INT_EN))
		return IRQ_NONE;

	if (!(intrctrl & IOAT_INTRCTRL_INT_STATUS)) {
		writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
		return IRQ_NONE;
	}

	attnstatus = readl(instance->reg_base + IOAT_ATTNSTATUS_OFFSET);
78
	for_each_set_bit(bit, &attnstatus, BITS_PER_LONG) {
79 80
		chan = ioat_chan_by_index(instance, bit);
		tasklet_schedule(&chan->cleanup_task);
81 82 83 84 85 86 87 88 89 90 91 92 93
	}

	writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
	return IRQ_HANDLED;
}

/**
 * ioat_dma_do_interrupt_msix - handler used for vector-per-channel interrupt mode
 * @irq: interrupt id
 * @data: interrupt data
 */
static irqreturn_t ioat_dma_do_interrupt_msix(int irq, void *data)
{
94
	struct ioat_chan_common *chan = data;
95

96
	tasklet_schedule(&chan->cleanup_task);
97 98 99 100

	return IRQ_HANDLED;
}

101
/* common channel initialization */
102
void ioat_init_channel(struct ioatdma_device *device, struct ioat_chan_common *chan, int idx)
103 104
{
	struct dma_device *dma = &device->common;
105 106
	struct dma_chan *c = &chan->common;
	unsigned long data = (unsigned long) c;
107 108 109 110 111

	chan->device = device;
	chan->reg_base = device->reg_base + (0x80 * (idx + 1));
	spin_lock_init(&chan->cleanup_lock);
	chan->common.device = dma;
112
	dma_cookie_init(&chan->common);
113 114
	list_add_tail(&chan->common.device_node, &dma->channels);
	device->idx[idx] = chan;
115
	init_timer(&chan->timer);
116 117 118
	chan->timer.function = device->timer_fn;
	chan->timer.data = data;
	tasklet_init(&chan->cleanup_task, device->cleanup_fn, data);
119 120 121
	tasklet_disable(&chan->cleanup_task);
}

122
/**
123
 * ioat1_dma_enumerate_channels - find and initialize the device's channels
124 125
 * @device: the device to be enumerated
 */
126
static int ioat1_enumerate_channels(struct ioatdma_device *device)
127 128 129 130
{
	u8 xfercap_scale;
	u32 xfercap;
	int i;
131
	struct ioat_dma_chan *ioat;
132
	struct device *dev = &device->pdev->dev;
133
	struct dma_device *dma = &device->common;
134

135 136
	INIT_LIST_HEAD(&dma->channels);
	dma->chancnt = readb(device->reg_base + IOAT_CHANCNT_OFFSET);
137 138 139 140 141 142
	dma->chancnt &= 0x1f; /* bits [4:0] valid */
	if (dma->chancnt > ARRAY_SIZE(device->idx)) {
		dev_warn(dev, "(%d) exceeds max supported channels (%zu)\n",
			 dma->chancnt, ARRAY_SIZE(device->idx));
		dma->chancnt = ARRAY_SIZE(device->idx);
	}
143
	xfercap_scale = readb(device->reg_base + IOAT_XFERCAP_OFFSET);
144
	xfercap_scale &= 0x1f; /* bits [4:0] valid */
145
	xfercap = (xfercap_scale == 0 ? -1 : (1UL << xfercap_scale));
D
Dan Williams 已提交
146
	dev_dbg(dev, "%s: xfercap = %d\n", __func__, xfercap);
147

148
#ifdef  CONFIG_I7300_IDLE_IOAT_CHANNEL
149 150
	if (i7300_idle_platform_probe(NULL, NULL, 1) == 0)
		dma->chancnt--;
A
Andy Henroid 已提交
151
#endif
152
	for (i = 0; i < dma->chancnt; i++) {
153
		ioat = devm_kzalloc(dev, sizeof(*ioat), GFP_KERNEL);
154
		if (!ioat)
155 156
			break;

157
		ioat_init_channel(device, &ioat->base, i);
158 159 160 161
		ioat->xfercap = xfercap;
		spin_lock_init(&ioat->desc_lock);
		INIT_LIST_HEAD(&ioat->free_desc);
		INIT_LIST_HEAD(&ioat->used_desc);
162
	}
163 164
	dma->chancnt = i;
	return i;
165 166
}

S
Shannon Nelson 已提交
167 168 169 170 171
/**
 * ioat_dma_memcpy_issue_pending - push potentially unrecognized appended
 *                                 descriptors to hw
 * @chan: DMA channel handle
 */
172
static inline void
173
__ioat1_dma_memcpy_issue_pending(struct ioat_dma_chan *ioat)
S
Shannon Nelson 已提交
174
{
175 176
	void __iomem *reg_base = ioat->base.reg_base;

D
Dan Williams 已提交
177 178
	dev_dbg(to_dev(&ioat->base), "%s: pending: %d\n",
		__func__, ioat->pending);
179 180
	ioat->pending = 0;
	writeb(IOAT_CHANCMD_APPEND, reg_base + IOAT1_CHANCMD_OFFSET);
S
Shannon Nelson 已提交
181 182 183 184
}

static void ioat1_dma_memcpy_issue_pending(struct dma_chan *chan)
{
185
	struct ioat_dma_chan *ioat = to_ioat_chan(chan);
S
Shannon Nelson 已提交
186

187 188 189 190
	if (ioat->pending > 0) {
		spin_lock_bh(&ioat->desc_lock);
		__ioat1_dma_memcpy_issue_pending(ioat);
		spin_unlock_bh(&ioat->desc_lock);
S
Shannon Nelson 已提交
191 192 193
	}
}

194
/**
195
 * ioat1_reset_channel - restart a channel
196
 * @ioat: IOAT DMA channel handle
197
 */
198
static void ioat1_reset_channel(struct ioat_dma_chan *ioat)
199
{
200 201
	struct ioat_chan_common *chan = &ioat->base;
	void __iomem *reg_base = chan->reg_base;
202 203
	u32 chansts, chanerr;

204
	dev_warn(to_dev(chan), "reset\n");
205
	chanerr = readl(reg_base + IOAT_CHANERR_OFFSET);
206
	chansts = *chan->completion & IOAT_CHANSTS_STATUS;
207
	if (chanerr) {
208
		dev_err(to_dev(chan),
209
			"chan%d, CHANSTS = 0x%08x CHANERR = 0x%04x, clearing\n",
210 211
			chan_num(chan), chansts, chanerr);
		writel(chanerr, reg_base + IOAT_CHANERR_OFFSET);
212 213 214 215 216 217 218 219 220 221
	}

	/*
	 * whack it upside the head with a reset
	 * and wait for things to settle out.
	 * force the pending count to a really big negative
	 * to make sure no one forces an issue_pending
	 * while we're waiting.
	 */

222
	ioat->pending = INT_MIN;
223
	writeb(IOAT_CHANCMD_RESET,
224
	       reg_base + IOAT_CHANCMD_OFFSET(chan->device->version));
225 226
	set_bit(IOAT_RESET_PENDING, &chan->state);
	mod_timer(&chan->timer, jiffies + RESET_DELAY);
227 228
}

229
static dma_cookie_t ioat1_tx_submit(struct dma_async_tx_descriptor *tx)
230
{
231 232
	struct dma_chan *c = tx->chan;
	struct ioat_dma_chan *ioat = to_ioat_chan(c);
233
	struct ioat_desc_sw *desc = tx_to_ioat_desc(tx);
234
	struct ioat_chan_common *chan = &ioat->base;
235 236
	struct ioat_desc_sw *first;
	struct ioat_desc_sw *chain_tail;
237 238
	dma_cookie_t cookie;

239
	spin_lock_bh(&ioat->desc_lock);
240
	/* cookie incr and addition to used_list must be atomic */
241
	cookie = dma_cookie_assign(tx);
D
Dan Williams 已提交
242
	dev_dbg(to_dev(&ioat->base), "%s: cookie: %d\n", __func__, cookie);
243 244

	/* write address into NextDescriptor field of last desc in chain */
D
Dan Williams 已提交
245
	first = to_ioat_desc(desc->tx_list.next);
246
	chain_tail = to_ioat_desc(ioat->used_desc.prev);
247 248 249
	/* make descriptor updates globally visible before chaining */
	wmb();
	chain_tail->hw->next = first->txd.phys;
D
Dan Williams 已提交
250
	list_splice_tail_init(&desc->tx_list, &ioat->used_desc);
D
Dan Williams 已提交
251 252
	dump_desc_dbg(ioat, chain_tail);
	dump_desc_dbg(ioat, first);
253

254 255 256
	if (!test_and_set_bit(IOAT_COMPLETION_PENDING, &chan->state))
		mod_timer(&chan->timer, jiffies + COMPLETION_TIMEOUT);

D
Dan Williams 已提交
257
	ioat->active += desc->hw->tx_cnt;
D
Dan Williams 已提交
258
	ioat->pending += desc->hw->tx_cnt;
259 260 261
	if (ioat->pending >= ioat_pending_level)
		__ioat1_dma_memcpy_issue_pending(ioat);
	spin_unlock_bh(&ioat->desc_lock);
262

263 264 265 266 267
	return cookie;
}

/**
 * ioat_dma_alloc_descriptor - allocate and return a sw and hw descriptor pair
268
 * @ioat: the channel supplying the memory pool for the descriptors
269 270
 * @flags: allocation flags
 */
271
static struct ioat_desc_sw *
272
ioat_dma_alloc_descriptor(struct ioat_dma_chan *ioat, gfp_t flags)
273 274 275
{
	struct ioat_dma_descriptor *desc;
	struct ioat_desc_sw *desc_sw;
276
	struct ioatdma_device *ioatdma_device;
277 278
	dma_addr_t phys;

279
	ioatdma_device = ioat->base.device;
280
	desc = pci_pool_alloc(ioatdma_device->dma_pool, flags, &phys);
281 282 283 284 285
	if (unlikely(!desc))
		return NULL;

	desc_sw = kzalloc(sizeof(*desc_sw), flags);
	if (unlikely(!desc_sw)) {
286
		pci_pool_free(ioatdma_device->dma_pool, desc, phys);
287 288 289 290
		return NULL;
	}

	memset(desc, 0, sizeof(*desc));
291

D
Dan Williams 已提交
292
	INIT_LIST_HEAD(&desc_sw->tx_list);
293 294
	dma_async_tx_descriptor_init(&desc_sw->txd, &ioat->base.common);
	desc_sw->txd.tx_submit = ioat1_tx_submit;
295
	desc_sw->hw = desc;
296
	desc_sw->txd.phys = phys;
D
Dan Williams 已提交
297
	set_desc_id(desc_sw, -1);
298 299 300 301

	return desc_sw;
}

302 303 304
static int ioat_initial_desc_count = 256;
module_param(ioat_initial_desc_count, int, 0644);
MODULE_PARM_DESC(ioat_initial_desc_count,
305
		 "ioat1: initial descriptors per channel (default: 256)");
306
/**
307
 * ioat1_dma_alloc_chan_resources - returns the number of allocated descriptors
308 309
 * @chan: the channel to be filled out
 */
310
static int ioat1_dma_alloc_chan_resources(struct dma_chan *c)
311
{
312 313
	struct ioat_dma_chan *ioat = to_ioat_chan(c);
	struct ioat_chan_common *chan = &ioat->base;
S
Shannon Nelson 已提交
314
	struct ioat_desc_sw *desc;
315 316 317 318
	u32 chanerr;
	int i;
	LIST_HEAD(tmp_list);

319
	/* have we already been set up? */
320 321
	if (!list_empty(&ioat->free_desc))
		return ioat->desccount;
322

323
	/* Setup register to interrupt and write completion status on error */
324
	writew(IOAT_CHANCTRL_RUN, chan->reg_base + IOAT_CHANCTRL_OFFSET);
325

326
	chanerr = readl(chan->reg_base + IOAT_CHANERR_OFFSET);
327
	if (chanerr) {
328 329
		dev_err(to_dev(chan), "CHANERR = %x, clearing\n", chanerr);
		writel(chanerr, chan->reg_base + IOAT_CHANERR_OFFSET);
330 331 332
	}

	/* Allocate descriptors */
333
	for (i = 0; i < ioat_initial_desc_count; i++) {
334
		desc = ioat_dma_alloc_descriptor(ioat, GFP_KERNEL);
335
		if (!desc) {
336
			dev_err(to_dev(chan), "Only %d initial descriptors\n", i);
337 338
			break;
		}
D
Dan Williams 已提交
339
		set_desc_id(desc, i);
340 341
		list_add_tail(&desc->node, &tmp_list);
	}
342 343 344 345
	spin_lock_bh(&ioat->desc_lock);
	ioat->desccount = i;
	list_splice(&tmp_list, &ioat->free_desc);
	spin_unlock_bh(&ioat->desc_lock);
346 347 348

	/* allocate a completion writeback area */
	/* doing 2 32bit writes to mmio since 1 64b write doesn't work */
349 350 351 352
	chan->completion = pci_pool_alloc(chan->device->completion_pool,
					  GFP_KERNEL, &chan->completion_dma);
	memset(chan->completion, 0, sizeof(*chan->completion));
	writel(((u64) chan->completion_dma) & 0x00000000FFFFFFFF,
353
	       chan->reg_base + IOAT_CHANCMP_OFFSET_LOW);
354
	writel(((u64) chan->completion_dma) >> 32,
355 356 357
	       chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH);

	tasklet_enable(&chan->cleanup_task);
358
	ioat1_dma_start_null_desc(ioat);  /* give chain to dma device */
D
Dan Williams 已提交
359 360
	dev_dbg(to_dev(chan), "%s: allocated %d descriptors\n",
		__func__, ioat->desccount);
361
	return ioat->desccount;
362 363
}

364
/**
365
 * ioat1_dma_free_chan_resources - release all the descriptors
366 367
 * @chan: the channel to be cleaned
 */
368
static void ioat1_dma_free_chan_resources(struct dma_chan *c)
369
{
370 371 372
	struct ioat_dma_chan *ioat = to_ioat_chan(c);
	struct ioat_chan_common *chan = &ioat->base;
	struct ioatdma_device *ioatdma_device = chan->device;
373 374 375
	struct ioat_desc_sw *desc, *_desc;
	int in_use_descs = 0;

376 377 378
	/* Before freeing channel resources first check
	 * if they have been previously allocated for this channel.
	 */
379
	if (ioat->desccount == 0)
380 381
		return;

382
	tasklet_disable(&chan->cleanup_task);
383
	del_timer_sync(&chan->timer);
384
	ioat1_cleanup(ioat);
385

386 387 388
	/* Delay 100ms after reset to allow internal DMA logic to quiesce
	 * before removing DMA descriptor resources.
	 */
389
	writeb(IOAT_CHANCMD_RESET,
390
	       chan->reg_base + IOAT_CHANCMD_OFFSET(chan->device->version));
391
	mdelay(100);
392

393
	spin_lock_bh(&ioat->desc_lock);
D
Dan Williams 已提交
394 395 396 397
	list_for_each_entry_safe(desc, _desc, &ioat->used_desc, node) {
		dev_dbg(to_dev(chan), "%s: freeing %d from used list\n",
			__func__, desc_id(desc));
		dump_desc_dbg(ioat, desc);
398 399 400 401 402 403 404 405 406
		in_use_descs++;
		list_del(&desc->node);
		pci_pool_free(ioatdma_device->dma_pool, desc->hw,
			      desc->txd.phys);
		kfree(desc);
	}
	list_for_each_entry_safe(desc, _desc,
				 &ioat->free_desc, node) {
		list_del(&desc->node);
407
		pci_pool_free(ioatdma_device->dma_pool, desc->hw,
408
			      desc->txd.phys);
409 410
		kfree(desc);
	}
411
	spin_unlock_bh(&ioat->desc_lock);
412

413
	pci_pool_free(ioatdma_device->completion_pool,
414 415
		      chan->completion,
		      chan->completion_dma);
416 417 418

	/* one is ok since we left it on there on purpose */
	if (in_use_descs > 1)
419
		dev_err(to_dev(chan), "Freeing %d in use descriptors!\n",
420 421
			in_use_descs - 1);

422 423
	chan->last_completion = 0;
	chan->completion_dma = 0;
424 425
	ioat->pending = 0;
	ioat->desccount = 0;
426
}
427

428
/**
429 430
 * ioat1_dma_get_next_descriptor - return the next available descriptor
 * @ioat: IOAT DMA channel handle
431 432 433 434 435
 *
 * Gets the next descriptor from the chain, and must be called with the
 * channel's desc_lock held.  Allocates more descriptors if the channel
 * has run out.
 */
436
static struct ioat_desc_sw *
437
ioat1_dma_get_next_descriptor(struct ioat_dma_chan *ioat)
438
{
S
Shannon Nelson 已提交
439
	struct ioat_desc_sw *new;
440

441 442
	if (!list_empty(&ioat->free_desc)) {
		new = to_ioat_desc(ioat->free_desc.next);
443 444 445
		list_del(&new->node);
	} else {
		/* try to get another desc */
446
		new = ioat_dma_alloc_descriptor(ioat, GFP_ATOMIC);
S
Shannon Nelson 已提交
447
		if (!new) {
448
			dev_err(to_dev(&ioat->base), "alloc failed\n");
S
Shannon Nelson 已提交
449 450
			return NULL;
		}
451
	}
D
Dan Williams 已提交
452 453
	dev_dbg(to_dev(&ioat->base), "%s: allocated: %d\n",
		__func__, desc_id(new));
454 455
	prefetch(new->hw);
	return new;
456 457
}

458
static struct dma_async_tx_descriptor *
459
ioat1_dma_prep_memcpy(struct dma_chan *c, dma_addr_t dma_dest,
460
		      dma_addr_t dma_src, size_t len, unsigned long flags)
461
{
462
	struct ioat_dma_chan *ioat = to_ioat_chan(c);
463 464 465 466 467 468 469 470
	struct ioat_desc_sw *desc;
	size_t copy;
	LIST_HEAD(chain);
	dma_addr_t src = dma_src;
	dma_addr_t dest = dma_dest;
	size_t total_len = len;
	struct ioat_dma_descriptor *hw = NULL;
	int tx_cnt = 0;
471

472
	spin_lock_bh(&ioat->desc_lock);
473
	desc = ioat1_dma_get_next_descriptor(ioat);
474 475 476
	do {
		if (!desc)
			break;
477

478
		tx_cnt++;
479
		copy = min_t(size_t, len, ioat->xfercap);
480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495

		hw = desc->hw;
		hw->size = copy;
		hw->ctl = 0;
		hw->src_addr = src;
		hw->dst_addr = dest;

		list_add_tail(&desc->node, &chain);

		len -= copy;
		dest += copy;
		src += copy;
		if (len) {
			struct ioat_desc_sw *next;

			async_tx_ack(&desc->txd);
496
			next = ioat1_dma_get_next_descriptor(ioat);
497
			hw->next = next ? next->txd.phys : 0;
D
Dan Williams 已提交
498
			dump_desc_dbg(ioat, desc);
499 500 501 502 503 504
			desc = next;
		} else
			hw->next = 0;
	} while (len);

	if (!desc) {
505 506 507
		struct ioat_chan_common *chan = &ioat->base;

		dev_err(to_dev(chan),
508
			"chan%d - get_next_desc failed\n", chan_num(chan));
509 510
		list_splice(&chain, &ioat->free_desc);
		spin_unlock_bh(&ioat->desc_lock);
S
Shannon Nelson 已提交
511
		return NULL;
512
	}
513
	spin_unlock_bh(&ioat->desc_lock);
514 515 516

	desc->txd.flags = flags;
	desc->len = total_len;
D
Dan Williams 已提交
517
	list_splice(&chain, &desc->tx_list);
518 519
	hw->ctl_f.int_en = !!(flags & DMA_PREP_INTERRUPT);
	hw->ctl_f.compl_write = 1;
D
Dan Williams 已提交
520
	hw->tx_cnt = tx_cnt;
D
Dan Williams 已提交
521
	dump_desc_dbg(ioat, desc);
522 523

	return &desc->txd;
524 525
}

526
static void ioat1_cleanup_event(unsigned long data)
527
{
528
	struct ioat_dma_chan *ioat = to_ioat_chan((void *) data);
529

530 531
	ioat1_cleanup(ioat);
	writew(IOAT_CHANCTRL_RUN, ioat->base.reg_base + IOAT_CHANCTRL_OFFSET);
532 533
}

534
dma_addr_t ioat_get_current_completion(struct ioat_chan_common *chan)
535
{
536
	dma_addr_t phys_complete;
537
	u64 completion;
538

539
	completion = *chan->completion;
540
	phys_complete = ioat_chansts_to_addr(completion);
541

D
Dan Williams 已提交
542 543 544
	dev_dbg(to_dev(chan), "%s: phys_complete: %#llx\n", __func__,
		(unsigned long long) phys_complete);

545 546
	if (is_ioat_halted(completion)) {
		u32 chanerr = readl(chan->reg_base + IOAT_CHANERR_OFFSET);
547
		dev_err(to_dev(chan), "Channel halted, chanerr = %x\n",
548
			chanerr);
549 550 551 552

		/* TODO do something to salvage the situation */
	}

553 554 555
	return phys_complete;
}

556
bool ioat_cleanup_preamble(struct ioat_chan_common *chan,
557
			   dma_addr_t *phys_complete)
558
{
559 560 561 562 563
	*phys_complete = ioat_get_current_completion(chan);
	if (*phys_complete == chan->last_completion)
		return false;
	clear_bit(IOAT_COMPLETION_ACK, &chan->state);
	mod_timer(&chan->timer, jiffies + COMPLETION_TIMEOUT);
564

565 566
	return true;
}
567

568
static void __cleanup(struct ioat_dma_chan *ioat, dma_addr_t phys_complete)
569 570 571 572
{
	struct ioat_chan_common *chan = &ioat->base;
	struct list_head *_desc, *n;
	struct dma_async_tx_descriptor *tx;
573

574 575
	dev_dbg(to_dev(chan), "%s: phys_complete: %llx\n",
		 __func__, (unsigned long long) phys_complete);
576 577 578 579 580
	list_for_each_safe(_desc, n, &ioat->used_desc) {
		struct ioat_desc_sw *desc;

		prefetch(n);
		desc = list_entry(_desc, typeof(*desc), node);
581 582 583 584 585 586
		tx = &desc->txd;
		/*
		 * Incoming DMA requests may use multiple descriptors,
		 * due to exceeding xfercap, perhaps. If so, only the
		 * last one will have a cookie, and require unmapping.
		 */
D
Dan Williams 已提交
587
		dump_desc_dbg(ioat, desc);
588
		if (tx->cookie) {
589
			dma_cookie_complete(tx);
590
			dma_descriptor_unmap(tx);
D
Dan Williams 已提交
591
			ioat->active -= desc->hw->tx_cnt;
592 593 594
			if (tx->callback) {
				tx->callback(tx->callback_param);
				tx->callback = NULL;
595
			}
596
		}
597

598 599 600 601 602 603 604 605 606 607
		if (tx->phys != phys_complete) {
			/*
			 * a completed entry, but not the last, so clean
			 * up if the client is done with the descriptor
			 */
			if (async_tx_test_ack(tx))
				list_move_tail(&desc->node, &ioat->free_desc);
		} else {
			/*
			 * last used desc. Do not remove, so we can
608
			 * append from it.
609
			 */
610 611 612 613 614 615 616 617 618 619

			/* if nothing else is pending, cancel the
			 * completion timeout
			 */
			if (n == &ioat->used_desc) {
				dev_dbg(to_dev(chan),
					"%s cancel completion timeout\n",
					__func__);
				clear_bit(IOAT_COMPLETION_PENDING, &chan->state);
			}
620

621
			/* TODO check status bits? */
622 623 624 625
			break;
		}
	}

626 627 628 629 630 631 632 633 634 635 636 637 638 639
	chan->last_completion = phys_complete;
}

/**
 * ioat1_cleanup - cleanup up finished descriptors
 * @chan: ioat channel to be cleaned up
 *
 * To prevent lock contention we defer cleanup when the locks are
 * contended with a terminal timeout that forces cleanup and catches
 * completion notification errors.
 */
static void ioat1_cleanup(struct ioat_dma_chan *ioat)
{
	struct ioat_chan_common *chan = &ioat->base;
640
	dma_addr_t phys_complete;
641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658

	prefetch(chan->completion);

	if (!spin_trylock_bh(&chan->cleanup_lock))
		return;

	if (!ioat_cleanup_preamble(chan, &phys_complete)) {
		spin_unlock_bh(&chan->cleanup_lock);
		return;
	}

	if (!spin_trylock_bh(&ioat->desc_lock)) {
		spin_unlock_bh(&chan->cleanup_lock);
		return;
	}

	__cleanup(ioat, phys_complete);

659
	spin_unlock_bh(&ioat->desc_lock);
660 661
	spin_unlock_bh(&chan->cleanup_lock);
}
662

663 664
static void ioat1_timer_event(unsigned long data)
{
665
	struct ioat_dma_chan *ioat = to_ioat_chan((void *) data);
666
	struct ioat_chan_common *chan = &ioat->base;
667

668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685
	dev_dbg(to_dev(chan), "%s: state: %lx\n", __func__, chan->state);

	spin_lock_bh(&chan->cleanup_lock);
	if (test_and_clear_bit(IOAT_RESET_PENDING, &chan->state)) {
		struct ioat_desc_sw *desc;

		spin_lock_bh(&ioat->desc_lock);

		/* restart active descriptors */
		desc = to_ioat_desc(ioat->used_desc.prev);
		ioat_set_chainaddr(ioat, desc->txd.phys);
		ioat_start(chan);

		ioat->pending = 0;
		set_bit(IOAT_COMPLETION_PENDING, &chan->state);
		mod_timer(&chan->timer, jiffies + COMPLETION_TIMEOUT);
		spin_unlock_bh(&ioat->desc_lock);
	} else if (test_bit(IOAT_COMPLETION_PENDING, &chan->state)) {
686
		dma_addr_t phys_complete;
687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708

		spin_lock_bh(&ioat->desc_lock);
		/* if we haven't made progress and we have already
		 * acknowledged a pending completion once, then be more
		 * forceful with a restart
		 */
		if (ioat_cleanup_preamble(chan, &phys_complete))
			__cleanup(ioat, phys_complete);
		else if (test_bit(IOAT_COMPLETION_ACK, &chan->state))
			ioat1_reset_channel(ioat);
		else {
			u64 status = ioat_chansts(chan);

			/* manually update the last completion address */
			if (ioat_chansts_to_addr(status) != 0)
				*chan->completion = status;

			set_bit(IOAT_COMPLETION_ACK, &chan->state);
			mod_timer(&chan->timer, jiffies + COMPLETION_TIMEOUT);
		}
		spin_unlock_bh(&ioat->desc_lock);
	}
709
	spin_unlock_bh(&chan->cleanup_lock);
710 711
}

712
enum dma_status
713 714
ioat_dma_tx_status(struct dma_chan *c, dma_cookie_t cookie,
		   struct dma_tx_state *txstate)
715
{
716 717
	struct ioat_chan_common *chan = to_chan_common(c);
	struct ioatdma_device *device = chan->device;
718
	enum dma_status ret;
719

720 721 722
	ret = dma_cookie_status(c, cookie, txstate);
	if (ret == DMA_SUCCESS)
		return ret;
723

724
	device->cleanup_fn((unsigned long) c);
725

726
	return dma_cookie_status(c, cookie, txstate);
727 728
}

729
static void ioat1_dma_start_null_desc(struct ioat_dma_chan *ioat)
730
{
731
	struct ioat_chan_common *chan = &ioat->base;
732
	struct ioat_desc_sw *desc;
733
	struct ioat_dma_descriptor *hw;
734

735
	spin_lock_bh(&ioat->desc_lock);
736

737
	desc = ioat1_dma_get_next_descriptor(ioat);
738 739

	if (!desc) {
740
		dev_err(to_dev(chan),
741
			"Unable to start null desc - get next desc failed\n");
742
		spin_unlock_bh(&ioat->desc_lock);
743 744 745
		return;
	}

746 747 748 749 750
	hw = desc->hw;
	hw->ctl = 0;
	hw->ctl_f.null = 1;
	hw->ctl_f.int_en = 1;
	hw->ctl_f.compl_write = 1;
751
	/* set size to non-zero value (channel returns error when size is 0) */
752 753 754
	hw->size = NULL_DESC_BUFFER_SIZE;
	hw->src_addr = 0;
	hw->dst_addr = 0;
755
	async_tx_ack(&desc->txd);
756 757
	hw->next = 0;
	list_add_tail(&desc->node, &ioat->used_desc);
D
Dan Williams 已提交
758
	dump_desc_dbg(ioat, desc);
759

760 761
	ioat_set_chainaddr(ioat, desc->txd.phys);
	ioat_start(chan);
762
	spin_unlock_bh(&ioat->desc_lock);
763 764 765 766 767 768 769
}

/*
 * Size in bytes of the source and destination buffers that
 * ioat_dma_self_test() copies in one IOAT transaction to verify the
 * HW works.
 */
#define IOAT_TEST_SIZE 2000

/*
 * Completion callback of the self-test transaction: signals the
 * struct completion passed as @dma_async_param.
 */
static void ioat_dma_test_callback(void *dma_async_param)
{
	struct completion *done = dma_async_param;

	complete(done);
}

777 778 779 780
/**
 * ioat_dma_self_test - Perform a IOAT transaction to verify the HW works.
 * @device: device to be tested
 */
781
int ioat_dma_self_test(struct ioatdma_device *device)
782 783 784 785
{
	int i;
	u8 *src;
	u8 *dest;
786 787
	struct dma_device *dma = &device->common;
	struct device *dev = &device->pdev->dev;
788
	struct dma_chan *dma_chan;
S
Shannon Nelson 已提交
789
	struct dma_async_tx_descriptor *tx;
790
	dma_addr_t dma_dest, dma_src;
791 792
	dma_cookie_t cookie;
	int err = 0;
793
	struct completion cmp;
794
	unsigned long tmo;
795
	unsigned long flags;
796

797
	src = kzalloc(sizeof(u8) * IOAT_TEST_SIZE, GFP_KERNEL);
798 799
	if (!src)
		return -ENOMEM;
800
	dest = kzalloc(sizeof(u8) * IOAT_TEST_SIZE, GFP_KERNEL);
801 802 803 804 805 806 807 808 809 810
	if (!dest) {
		kfree(src);
		return -ENOMEM;
	}

	/* Fill in src buffer */
	for (i = 0; i < IOAT_TEST_SIZE; i++)
		src[i] = (u8)i;

	/* Start copy, using first DMA channel */
811
	dma_chan = container_of(dma->channels.next, struct dma_chan,
812
				device_node);
813 814
	if (dma->device_alloc_chan_resources(dma_chan) < 1) {
		dev_err(dev, "selftest cannot allocate chan resource\n");
815 816 817 818
		err = -ENODEV;
		goto out;
	}

819 820
	dma_src = dma_map_single(dev, src, IOAT_TEST_SIZE, DMA_TO_DEVICE);
	dma_dest = dma_map_single(dev, dest, IOAT_TEST_SIZE, DMA_FROM_DEVICE);
821
	flags = DMA_PREP_INTERRUPT;
822
	tx = device->common.device_prep_dma_memcpy(dma_chan, dma_dest, dma_src,
823
						   IOAT_TEST_SIZE, flags);
824
	if (!tx) {
825
		dev_err(dev, "Self-test prep failed, disabling\n");
826
		err = -ENODEV;
827
		goto unmap_dma;
828 829
	}

830
	async_tx_ack(tx);
831
	init_completion(&cmp);
832
	tx->callback = ioat_dma_test_callback;
833
	tx->callback_param = &cmp;
834
	cookie = tx->tx_submit(tx);
835
	if (cookie < 0) {
836
		dev_err(dev, "Self-test setup failed, disabling\n");
837
		err = -ENODEV;
838
		goto unmap_dma;
839
	}
840
	dma->device_issue_pending(dma_chan);
D
Dan Williams 已提交
841

842
	tmo = wait_for_completion_timeout(&cmp, msecs_to_jiffies(3000));
843

844
	if (tmo == 0 ||
845
	    dma->device_tx_status(dma_chan, cookie, NULL)
846
					!= DMA_SUCCESS) {
847
		dev_err(dev, "Self-test copy timed out, disabling\n");
848
		err = -ENODEV;
849
		goto unmap_dma;
850 851
	}
	if (memcmp(src, dest, IOAT_TEST_SIZE)) {
852
		dev_err(dev, "Self-test copy failed compare, disabling\n");
853 854 855 856
		err = -ENODEV;
		goto free_resources;
	}

857 858 859
unmap_dma:
	dma_unmap_single(dev, dma_src, IOAT_TEST_SIZE, DMA_TO_DEVICE);
	dma_unmap_single(dev, dma_dest, IOAT_TEST_SIZE, DMA_FROM_DEVICE);
860
free_resources:
861
	dma->device_free_chan_resources(dma_chan);
862 863 864 865 866 867
out:
	kfree(src);
	kfree(dest);
	return err;
}

868 869 870 871
static char ioat_interrupt_style[32] = "msix";
module_param_string(ioat_interrupt_style, ioat_interrupt_style,
		    sizeof(ioat_interrupt_style), 0644);
MODULE_PARM_DESC(ioat_interrupt_style,
872
		 "set ioat interrupt style: msix (default), msi, intx");
873 874 875 876 877

/**
 * ioat_dma_setup_interrupts - setup interrupt handler
 * @device: ioat device
 */
878
int ioat_dma_setup_interrupts(struct ioatdma_device *device)
879
{
880
	struct ioat_chan_common *chan;
881 882 883 884 885
	struct pci_dev *pdev = device->pdev;
	struct device *dev = &pdev->dev;
	struct msix_entry *msix;
	int i, j, msixcnt;
	int err = -EINVAL;
886 887 888 889 890 891 892 893
	u8 intrctrl = 0;

	if (!strcmp(ioat_interrupt_style, "msix"))
		goto msix;
	if (!strcmp(ioat_interrupt_style, "msi"))
		goto msi;
	if (!strcmp(ioat_interrupt_style, "intx"))
		goto intx;
894
	dev_err(dev, "invalid ioat_interrupt_style %s\n", ioat_interrupt_style);
895
	goto err_no_irq;
896 897 898 899 900 901 902

msix:
	/* The number of MSI-X vectors should equal the number of channels */
	msixcnt = device->common.chancnt;
	for (i = 0; i < msixcnt; i++)
		device->msix_entries[i].entry = i;

903
	err = pci_enable_msix(pdev, device->msix_entries, msixcnt);
904
	if (err)
905 906 907
		goto msi;

	for (i = 0; i < msixcnt; i++) {
908
		msix = &device->msix_entries[i];
909
		chan = ioat_chan_by_index(device, i);
910 911
		err = devm_request_irq(dev, msix->vector,
				       ioat_dma_do_interrupt_msix, 0,
912
				       "ioat-msix", chan);
913 914
		if (err) {
			for (j = 0; j < i; j++) {
915
				msix = &device->msix_entries[j];
916 917
				chan = ioat_chan_by_index(device, j);
				devm_free_irq(dev, msix->vector, chan);
918
			}
919
			goto msi;
920 921 922
		}
	}
	intrctrl |= IOAT_INTRCTRL_MSIX_VECTOR_CONTROL;
923
	device->irq_mode = IOAT_MSIX;
924 925 926
	goto done;

msi:
927
	err = pci_enable_msi(pdev);
928 929 930
	if (err)
		goto intx;

931 932
	err = devm_request_irq(dev, pdev->irq, ioat_dma_do_interrupt, 0,
			       "ioat-msi", device);
933
	if (err) {
934
		pci_disable_msi(pdev);
935 936
		goto intx;
	}
D
Dan Williams 已提交
937
	device->irq_mode = IOAT_MSI;
938 939 940
	goto done;

intx:
941 942
	err = devm_request_irq(dev, pdev->irq, ioat_dma_do_interrupt,
			       IRQF_SHARED, "ioat-intx", device);
943 944 945
	if (err)
		goto err_no_irq;

946
	device->irq_mode = IOAT_INTX;
947
done:
948 949
	if (device->intr_quirk)
		device->intr_quirk(device);
950 951 952 953 954 955 956
	intrctrl |= IOAT_INTRCTRL_MASTER_INT_EN;
	writeb(intrctrl, device->reg_base + IOAT_INTRCTRL_OFFSET);
	return 0;

err_no_irq:
	/* Disable all interrupt generation */
	writeb(0, device->reg_base + IOAT_INTRCTRL_OFFSET);
957
	device->irq_mode = IOAT_NOIRQ;
958 959
	dev_err(dev, "no usable interrupts\n");
	return err;
960
}
961
EXPORT_SYMBOL(ioat_dma_setup_interrupts);
962

963
static void ioat_disable_interrupts(struct ioatdma_device *device)
964 965 966 967 968
{
	/* Disable all interrupt generation */
	writeb(0, device->reg_base + IOAT_INTRCTRL_OFFSET);
}

969
int ioat_probe(struct ioatdma_device *device)
970
{
971 972 973
	int err = -ENODEV;
	struct dma_device *dma = &device->common;
	struct pci_dev *pdev = device->pdev;
974
	struct device *dev = &pdev->dev;
975 976 977

	/* DMA coherent memory pool for DMA descriptor allocations */
	device->dma_pool = pci_pool_create("dma_desc_pool", pdev,
978 979
					   sizeof(struct ioat_dma_descriptor),
					   64, 0);
980 981 982 983 984
	if (!device->dma_pool) {
		err = -ENOMEM;
		goto err_dma_pool;
	}

985 986 987
	device->completion_pool = pci_pool_create("completion_pool", pdev,
						  sizeof(u64), SMP_CACHE_BYTES,
						  SMP_CACHE_BYTES);
988

989 990 991 992 993
	if (!device->completion_pool) {
		err = -ENOMEM;
		goto err_completion_pool;
	}

994
	device->enumerate_channels(device);
995

996 997
	dma_cap_set(DMA_MEMCPY, dma->cap_mask);
	dma->dev = &pdev->dev;
998

999
	if (!dma->chancnt) {
1000
		dev_err(dev, "channel enumeration error\n");
1001 1002 1003
		goto err_setup_interrupts;
	}

1004
	err = ioat_dma_setup_interrupts(device);
1005
	if (err)
1006
		goto err_setup_interrupts;
1007

D
Dan Williams 已提交
1008
	err = device->self_test(device);
1009 1010 1011
	if (err)
		goto err_self_test;

1012
	return 0;
1013 1014

err_self_test:
1015
	ioat_disable_interrupts(device);
1016
err_setup_interrupts:
1017 1018 1019 1020
	pci_pool_destroy(device->completion_pool);
err_completion_pool:
	pci_pool_destroy(device->dma_pool);
err_dma_pool:
1021 1022 1023
	return err;
}

1024
int ioat_register(struct ioatdma_device *device)
1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050
{
	int err = dma_async_device_register(&device->common);

	if (err) {
		ioat_disable_interrupts(device);
		pci_pool_destroy(device->completion_pool);
		pci_pool_destroy(device->dma_pool);
	}

	return err;
}

/*
 * ioat1_intr_quirk - make the MSI enable bit of the PCI DMA control
 * register follow the MSI state of the PCI device
 */
static void ioat1_intr_quirk(struct ioatdma_device *device)
{
	struct pci_dev *pci = device->pdev;
	u32 ctrl;

	pci_read_config_dword(pci, IOAT_PCI_DMACTRL_OFFSET, &ctrl);

	/* start from "MSI off" and set the bit only when MSI is in use */
	ctrl &= ~IOAT_PCI_DMACTRL_MSI_EN;
	if (pci->msi_enabled)
		ctrl |= IOAT_PCI_DMACTRL_MSI_EN;

	pci_write_config_dword(pci, IOAT_PCI_DMACTRL_OFFSET, ctrl);
}

D
Dan Williams 已提交
1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070
static ssize_t ring_size_show(struct dma_chan *c, char *page)
{
	struct ioat_dma_chan *ioat = to_ioat_chan(c);

	return sprintf(page, "%d\n", ioat->desccount);
}
static struct ioat_sysfs_entry ring_size_attr = __ATTR_RO(ring_size);

static ssize_t ring_active_show(struct dma_chan *c, char *page)
{
	struct ioat_dma_chan *ioat = to_ioat_chan(c);

	return sprintf(page, "%d\n", ioat->active);
}
static struct ioat_sysfs_entry ring_active_attr = __ATTR_RO(ring_active);

static ssize_t cap_show(struct dma_chan *c, char *page)
{
	struct dma_device *dma = c->device;

1071
	return sprintf(page, "copy%s%s%s%s%s\n",
D
Dan Williams 已提交
1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112
		       dma_has_cap(DMA_PQ, dma->cap_mask) ? " pq" : "",
		       dma_has_cap(DMA_PQ_VAL, dma->cap_mask) ? " pq_val" : "",
		       dma_has_cap(DMA_XOR, dma->cap_mask) ? " xor" : "",
		       dma_has_cap(DMA_XOR_VAL, dma->cap_mask) ? " xor_val" : "",
		       dma_has_cap(DMA_INTERRUPT, dma->cap_mask) ? " intr" : "");

}
struct ioat_sysfs_entry ioat_cap_attr = __ATTR_RO(cap);

/*
 * sysfs "version": print device->version as "<high bits>.<low nibble>",
 * i.e. the value shifted right by four, a dot, then the low four bits.
 */
static ssize_t version_show(struct dma_chan *c, char *page)
{
	struct ioatdma_device *device = to_ioatdma_device(c->device);
	int major = device->version >> 4;
	int minor = device->version & 0xf;

	return sprintf(page, "%d.%d\n", major, minor);
}
struct ioat_sysfs_entry ioat_version_attr = __ATTR_RO(version);

/* NULL-terminated attribute list referenced by ioat1_ktype */
static struct attribute *ioat1_attrs[] = {
	&ring_size_attr.attr,		/* ring_size */
	&ring_active_attr.attr,		/* ring_active */
	&ioat_cap_attr.attr,		/* cap */
	&ioat_version_attr.attr,	/* version */
	NULL				/* end of list */
};

/*
 * ioat_attr_show - sysfs ->show dispatcher
 *
 * Recovers the ioat_sysfs_entry wrapping @attr and the channel wrapping
 * @kobj, then forwards to the entry's show callback.  Returns -EIO when the
 * entry has no show callback.
 */
static ssize_t
ioat_attr_show(struct kobject *kobj, struct attribute *attr, char *page)
{
	struct ioat_sysfs_entry *sysfs_entry =
		container_of(attr, struct ioat_sysfs_entry, attr);
	struct ioat_chan_common *ioat_chan =
		container_of(kobj, struct ioat_chan_common, kobj);

	if (sysfs_entry->show)
		return sysfs_entry->show(&ioat_chan->common, page);

	return -EIO;
}

1113
const struct sysfs_ops ioat_sysfs_ops = {
D
Dan Williams 已提交
1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156
	.show	= ioat_attr_show,
};

/* kobject type passed to ioat_kobject_add() by ioat1_dma_probe() */
static struct kobj_type ioat1_ktype = {
	.default_attrs	= ioat1_attrs,
	.sysfs_ops	= &ioat_sysfs_ops,
};

/**
 * ioat_kobject_add - add a "quickdata" kobject under every channel
 * @device: ioat device whose channels are walked
 * @type: kobject type to initialize each channel kobject with
 *
 * A failure for one channel is not fatal: a warning is logged, the kobject
 * reference is dropped and IOAT_KOBJ_INIT_FAIL is set in the channel state
 * so that ioat_kobject_del() skips that channel.
 */
void ioat_kobject_add(struct ioatdma_device *device, struct kobj_type *type)
{
	struct dma_device *dma = &device->common;
	struct dma_chan *c;

	list_for_each_entry(c, &dma->channels, device_node) {
		struct ioat_chan_common *chan = to_chan_common(c);
		int err = kobject_init_and_add(&chan->kobj, type,
					       &c->dev->device.kobj,
					       "quickdata");

		if (!err)
			continue;

		dev_warn(to_dev(chan),
			 "sysfs init error (%d), continuing...\n", err);
		kobject_put(&chan->kobj);
		set_bit(IOAT_KOBJ_INIT_FAIL, &chan->state);
	}
}

/**
 * ioat_kobject_del - remove the per-channel kobjects
 * @device: ioat device whose channels are walked
 *
 * Channels flagged with IOAT_KOBJ_INIT_FAIL are skipped; for all others the
 * kobject is deleted and its reference dropped.
 */
void ioat_kobject_del(struct ioatdma_device *device)
{
	struct dma_device *dma = &device->common;
	struct dma_chan *c;

	list_for_each_entry(c, &dma->channels, device_node) {
		struct ioat_chan_common *chan = to_chan_common(c);

		if (test_bit(IOAT_KOBJ_INIT_FAIL, &chan->state))
			continue;

		kobject_del(&chan->kobj);
		kobject_put(&chan->kobj);
	}
}

1157
int ioat1_dma_probe(struct ioatdma_device *device, int dca)
1158 1159 1160 1161 1162 1163
{
	struct pci_dev *pdev = device->pdev;
	struct dma_device *dma;
	int err;

	device->intr_quirk = ioat1_intr_quirk;
1164
	device->enumerate_channels = ioat1_enumerate_channels;
D
Dan Williams 已提交
1165
	device->self_test = ioat_dma_self_test;
1166 1167
	device->timer_fn = ioat1_timer_event;
	device->cleanup_fn = ioat1_cleanup_event;
1168 1169 1170
	dma = &device->common;
	dma->device_prep_dma_memcpy = ioat1_dma_prep_memcpy;
	dma->device_issue_pending = ioat1_dma_memcpy_issue_pending;
1171 1172
	dma->device_alloc_chan_resources = ioat1_dma_alloc_chan_resources;
	dma->device_free_chan_resources = ioat1_dma_free_chan_resources;
1173
	dma->device_tx_status = ioat_dma_tx_status;
1174 1175 1176 1177 1178 1179 1180 1181

	err = ioat_probe(device);
	if (err)
		return err;
	ioat_set_tcp_copy_break(4096);
	err = ioat_register(device);
	if (err)
		return err;
D
Dan Williams 已提交
1182 1183
	ioat_kobject_add(device, &ioat1_ktype);

1184 1185 1186 1187 1188 1189
	if (dca)
		device->dca = ioat_dca_init(pdev, device->reg_base);

	return err;
}

1190
void ioat_dma_remove(struct ioatdma_device *device)
1191
{
1192
	struct dma_device *dma = &device->common;
1193

1194
	ioat_disable_interrupts(device);
1195

D
Dan Williams 已提交
1196 1197
	ioat_kobject_del(device);

1198
	dma_async_device_unregister(dma);
1199

1200 1201
	pci_pool_destroy(device->dma_pool);
	pci_pool_destroy(device->completion_pool);
1202

1203
	INIT_LIST_HEAD(&dma->channels);
1204
}