mv_xor.c 34.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * offload engine driver for the Marvell XOR engine
 * Copyright (C) 2007, 2008, Marvell International Ltd.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 */

#include <linux/init.h>
16
#include <linux/slab.h>
17 18 19 20
#include <linux/delay.h>
#include <linux/dma-mapping.h>
#include <linux/spinlock.h>
#include <linux/interrupt.h>
21
#include <linux/of_device.h>
22 23
#include <linux/platform_device.h>
#include <linux/memory.h>
24
#include <linux/clk.h>
25 26 27
#include <linux/of.h>
#include <linux/of_irq.h>
#include <linux/irqdomain.h>
28
#include <linux/cpumask.h>
29
#include <linux/platform_data/dma-mv_xor.h>
30 31

#include "dmaengine.h"
32 33
#include "mv_xor.h"

34 35 36
enum mv_xor_type {
	XOR_ORION,
	XOR_ARMADA_38X,
37
	XOR_ARMADA_37XX,
38 39
};

40 41 42 43 44
enum mv_xor_mode {
	XOR_MODE_IN_REG,
	XOR_MODE_IN_DESC,
};

45 46 47
static void mv_xor_issue_pending(struct dma_chan *chan);

#define to_mv_xor_chan(chan)		\
48
	container_of(chan, struct mv_xor_chan, dmachan)
49 50 51 52

#define to_mv_xor_slot(tx)		\
	container_of(tx, struct mv_xor_desc_slot, async_tx)

53
#define mv_chan_to_devp(chan)           \
54
	((chan)->dmadev.dev)
55

56
static void mv_desc_init(struct mv_xor_desc_slot *desc,
57 58
			 dma_addr_t addr, u32 byte_count,
			 enum dma_ctrl_flags flags)
59 60 61
{
	struct mv_xor_desc *hw_desc = desc->hw_desc;

62
	hw_desc->status = XOR_DESC_DMA_OWNED;
63
	hw_desc->phy_next_desc = 0;
64 65 66
	/* Enable end-of-descriptor interrupts only for DMA_PREP_INTERRUPT */
	hw_desc->desc_command = (flags & DMA_PREP_INTERRUPT) ?
				XOR_DESC_EOD_INT_EN : 0;
67
	hw_desc->phy_dest_addr = addr;
68 69 70
	hw_desc->byte_count = byte_count;
}

71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88
static void mv_desc_set_mode(struct mv_xor_desc_slot *desc)
{
	struct mv_xor_desc *hw_desc = desc->hw_desc;

	switch (desc->type) {
	case DMA_XOR:
	case DMA_INTERRUPT:
		hw_desc->desc_command |= XOR_DESC_OPERATION_XOR;
		break;
	case DMA_MEMCPY:
		hw_desc->desc_command |= XOR_DESC_OPERATION_MEMCPY;
		break;
	default:
		BUG();
		return;
	}
}

89 90 91 92 93 94 95 96 97 98 99 100
static void mv_desc_set_next_desc(struct mv_xor_desc_slot *desc,
				  u32 next_desc_addr)
{
	struct mv_xor_desc *hw_desc = desc->hw_desc;
	BUG_ON(hw_desc->phy_next_desc);
	hw_desc->phy_next_desc = next_desc_addr;
}

static void mv_desc_set_src_addr(struct mv_xor_desc_slot *desc,
				 int index, dma_addr_t addr)
{
	struct mv_xor_desc *hw_desc = desc->hw_desc;
101
	hw_desc->phy_src_addr[mv_phy_src_idx(index)] = addr;
102 103 104 105 106 107
	if (desc->type == DMA_XOR)
		hw_desc->desc_command |= (1 << index);
}

static u32 mv_chan_get_current_desc(struct mv_xor_chan *chan)
{
108
	return readl_relaxed(XOR_CURR_DESC(chan));
109 110 111 112 113
}

static void mv_chan_set_next_descriptor(struct mv_xor_chan *chan,
					u32 next_desc_addr)
{
114
	writel_relaxed(next_desc_addr, XOR_NEXT_DESC(chan));
115 116 117 118
}

static void mv_chan_unmask_interrupts(struct mv_xor_chan *chan)
{
119
	u32 val = readl_relaxed(XOR_INTR_MASK(chan));
120
	val |= XOR_INTR_MASK_VALUE << (chan->idx * 16);
121
	writel_relaxed(val, XOR_INTR_MASK(chan));
122 123 124 125
}

static u32 mv_chan_get_intr_cause(struct mv_xor_chan *chan)
{
126
	u32 intr_cause = readl_relaxed(XOR_INTR_CAUSE(chan));
127 128 129 130
	intr_cause = (intr_cause >> (chan->idx * 16)) & 0xFFFF;
	return intr_cause;
}

131
static void mv_chan_clear_eoc_cause(struct mv_xor_chan *chan)
132
{
133 134 135 136
	u32 val;

	val = XOR_INT_END_OF_DESC | XOR_INT_END_OF_CHAIN | XOR_INT_STOPPED;
	val = ~(val << (chan->idx * 16));
137
	dev_dbg(mv_chan_to_devp(chan), "%s, val 0x%08x\n", __func__, val);
138
	writel_relaxed(val, XOR_INTR_CAUSE(chan));
139 140
}

141
static void mv_chan_clear_err_status(struct mv_xor_chan *chan)
142 143
{
	u32 val = 0xFFFF0000 >> (chan->idx * 16);
144
	writel_relaxed(val, XOR_INTR_CAUSE(chan));
145 146
}

147
static void mv_chan_set_mode(struct mv_xor_chan *chan,
148
			     u32 op_mode)
149
{
150
	u32 config = readl_relaxed(XOR_CONFIG(chan));
151

152 153 154
	config &= ~0x7;
	config |= op_mode;

155 156 157 158 159 160
#if defined(__BIG_ENDIAN)
	config |= XOR_DESCRIPTOR_SWAP;
#else
	config &= ~XOR_DESCRIPTOR_SWAP;
#endif

161
	writel_relaxed(config, XOR_CONFIG(chan));
162 163 164 165
}

static void mv_chan_activate(struct mv_xor_chan *chan)
{
166
	dev_dbg(mv_chan_to_devp(chan), " activate chan.\n");
167 168 169

	/* writel ensures all descriptors are flushed before activation */
	writel(BIT(0), XOR_ACTIVATION(chan));
170 171 172 173
}

static char mv_chan_is_busy(struct mv_xor_chan *chan)
{
174
	u32 state = readl_relaxed(XOR_ACTIVATION(chan));
175 176 177 178 179 180 181

	state = (state >> 4) & 0x3;

	return (state == 1) ? 1 : 0;
}

/*
182 183
 * mv_chan_start_new_chain - program the engine to operate on new
 * chain headed by sw_desc
184 185
 * Caller must hold &mv_chan->lock while calling this function
 */
186 187
static void mv_chan_start_new_chain(struct mv_xor_chan *mv_chan,
				    struct mv_xor_desc_slot *sw_desc)
188
{
189
	dev_dbg(mv_chan_to_devp(mv_chan), "%s %d: sw_desc %p\n",
190 191
		__func__, __LINE__, sw_desc);

192 193 194
	/* set the hardware chain */
	mv_chan_set_next_descriptor(mv_chan, sw_desc->async_tx.phys);

195
	mv_chan->pending++;
196
	mv_xor_issue_pending(&mv_chan->dmachan);
197 198 199
}

static dma_cookie_t
200 201 202
mv_desc_run_tx_complete_actions(struct mv_xor_desc_slot *desc,
				struct mv_xor_chan *mv_chan,
				dma_cookie_t cookie)
203 204 205 206 207 208 209 210 211 212 213 214 215
{
	BUG_ON(desc->async_tx.cookie < 0);

	if (desc->async_tx.cookie > 0) {
		cookie = desc->async_tx.cookie;

		/* call the callback (must not sleep or submit new
		 * operations to this channel)
		 */
		if (desc->async_tx.callback)
			desc->async_tx.callback(
				desc->async_tx.callback_param);

216
		dma_descriptor_unmap(&desc->async_tx);
217 218 219
	}

	/* run dependent operations */
220
	dma_run_dependencies(&desc->async_tx);
221 222 223 224 225

	return cookie;
}

static int
226
mv_chan_clean_completed_slots(struct mv_xor_chan *mv_chan)
227 228 229
{
	struct mv_xor_desc_slot *iter, *_iter;

230
	dev_dbg(mv_chan_to_devp(mv_chan), "%s %d\n", __func__, __LINE__);
231
	list_for_each_entry_safe(iter, _iter, &mv_chan->completed_slots,
232
				 node) {
233

234 235
		if (async_tx_test_ack(&iter->async_tx))
			list_move_tail(&iter->node, &mv_chan->free_slots);
236 237 238 239 240
	}
	return 0;
}

static int
241 242
mv_desc_clean_slot(struct mv_xor_desc_slot *desc,
		   struct mv_xor_chan *mv_chan)
243
{
244
	dev_dbg(mv_chan_to_devp(mv_chan), "%s %d: desc %p flags %d\n",
245
		__func__, __LINE__, desc, desc->async_tx.flags);
246

247 248 249
	/* the client is allowed to attach dependent operations
	 * until 'ack' is set
	 */
250
	if (!async_tx_test_ack(&desc->async_tx))
251
		/* move this slot to the completed_slots */
252 253 254
		list_move_tail(&desc->node, &mv_chan->completed_slots);
	else
		list_move_tail(&desc->node, &mv_chan->free_slots);
255 256 257 258

	return 0;
}

259
/* This function must be called with the mv_xor_chan spinlock held */
260
static void mv_chan_slot_cleanup(struct mv_xor_chan *mv_chan)
261 262 263 264 265
{
	struct mv_xor_desc_slot *iter, *_iter;
	dma_cookie_t cookie = 0;
	int busy = mv_chan_is_busy(mv_chan);
	u32 current_desc = mv_chan_get_current_desc(mv_chan);
266 267
	int current_cleaned = 0;
	struct mv_xor_desc *hw_desc;
268

269 270
	dev_dbg(mv_chan_to_devp(mv_chan), "%s %d\n", __func__, __LINE__);
	dev_dbg(mv_chan_to_devp(mv_chan), "current_desc %x\n", current_desc);
271
	mv_chan_clean_completed_slots(mv_chan);
272 273 274 275 276 277

	/* free completed slots from the chain starting with
	 * the oldest descriptor
	 */

	list_for_each_entry_safe(iter, _iter, &mv_chan->chain,
278
				 node) {
279

280 281 282
		/* clean finished descriptors */
		hw_desc = iter->hw_desc;
		if (hw_desc->status & XOR_DESC_SUCCESS) {
283 284
			cookie = mv_desc_run_tx_complete_actions(iter, mv_chan,
								 cookie);
285

286
			/* done processing desc, clean slot */
287
			mv_desc_clean_slot(iter, mv_chan);
288 289 290 291 292 293 294 295 296

			/* break if we did cleaned the current */
			if (iter->async_tx.phys == current_desc) {
				current_cleaned = 1;
				break;
			}
		} else {
			if (iter->async_tx.phys == current_desc) {
				current_cleaned = 0;
297
				break;
298
			}
299 300 301 302
		}
	}

	if ((busy == 0) && !list_empty(&mv_chan->chain)) {
303 304 305 306 307 308 309
		if (current_cleaned) {
			/*
			 * current descriptor cleaned and removed, run
			 * from list head
			 */
			iter = list_entry(mv_chan->chain.next,
					  struct mv_xor_desc_slot,
310
					  node);
311
			mv_chan_start_new_chain(mv_chan, iter);
312
		} else {
313
			if (!list_is_last(&iter->node, &mv_chan->chain)) {
314 315 316 317
				/*
				 * descriptors are still waiting after
				 * current, trigger them
				 */
318
				iter = list_entry(iter->node.next,
319
						  struct mv_xor_desc_slot,
320
						  node);
321
				mv_chan_start_new_chain(mv_chan, iter);
322 323 324 325 326 327 328 329
			} else {
				/*
				 * some descriptors are still waiting
				 * to be cleaned
				 */
				tasklet_schedule(&mv_chan->irq_tasklet);
			}
		}
330 331 332
	}

	if (cookie > 0)
333
		mv_chan->dmachan.completed_cookie = cookie;
334 335 336 337 338
}

static void mv_xor_tasklet(unsigned long data)
{
	struct mv_xor_chan *chan = (struct mv_xor_chan *) data;
339 340

	spin_lock_bh(&chan->lock);
341
	mv_chan_slot_cleanup(chan);
342
	spin_unlock_bh(&chan->lock);
343 344 345
}

static struct mv_xor_desc_slot *
346
mv_chan_alloc_slot(struct mv_xor_chan *mv_chan)
347
{
348
	struct mv_xor_desc_slot *iter;
349

350 351 352 353 354 355 356 357 358 359
	spin_lock_bh(&mv_chan->lock);

	if (!list_empty(&mv_chan->free_slots)) {
		iter = list_first_entry(&mv_chan->free_slots,
					struct mv_xor_desc_slot,
					node);

		list_move_tail(&iter->node, &mv_chan->allocated_slots);

		spin_unlock_bh(&mv_chan->lock);
360

361 362 363 364 365 366
		/* pre-ack descriptor */
		async_tx_ack(&iter->async_tx);
		iter->async_tx.cookie = -EBUSY;

		return iter;

367
	}
368 369

	spin_unlock_bh(&mv_chan->lock);
370 371 372 373 374 375 376 377 378 379 380 381 382

	/* try to free some slots if the allocation fails */
	tasklet_schedule(&mv_chan->irq_tasklet);

	return NULL;
}

/************************ DMA engine API functions ****************************/
static dma_cookie_t
mv_xor_tx_submit(struct dma_async_tx_descriptor *tx)
{
	struct mv_xor_desc_slot *sw_desc = to_mv_xor_slot(tx);
	struct mv_xor_chan *mv_chan = to_mv_xor_chan(tx->chan);
383
	struct mv_xor_desc_slot *old_chain_tail;
384 385 386
	dma_cookie_t cookie;
	int new_hw_chain = 1;

387
	dev_dbg(mv_chan_to_devp(mv_chan),
388 389 390 391
		"%s sw_desc %p: async_tx %p\n",
		__func__, sw_desc, &sw_desc->async_tx);

	spin_lock_bh(&mv_chan->lock);
392
	cookie = dma_cookie_assign(tx);
393 394

	if (list_empty(&mv_chan->chain))
395
		list_move_tail(&sw_desc->node, &mv_chan->chain);
396 397 398 399 400
	else {
		new_hw_chain = 0;

		old_chain_tail = list_entry(mv_chan->chain.prev,
					    struct mv_xor_desc_slot,
401 402
					    node);
		list_move_tail(&sw_desc->node, &mv_chan->chain);
403

404 405
		dev_dbg(mv_chan_to_devp(mv_chan), "Append to last desc %pa\n",
			&old_chain_tail->async_tx.phys);
406 407

		/* fix up the hardware chain */
408
		mv_desc_set_next_desc(old_chain_tail, sw_desc->async_tx.phys);
409 410 411 412 413 414 415 416 417 418 419 420 421 422

		/* if the channel is not busy */
		if (!mv_chan_is_busy(mv_chan)) {
			u32 current_desc = mv_chan_get_current_desc(mv_chan);
			/*
			 * and the curren desc is the end of the chain before
			 * the append, then we need to start the channel
			 */
			if (current_desc == old_chain_tail->async_tx.phys)
				new_hw_chain = 1;
		}
	}

	if (new_hw_chain)
423
		mv_chan_start_new_chain(mv_chan, sw_desc);
424 425 426 427 428 429 430

	spin_unlock_bh(&mv_chan->lock);

	return cookie;
}

/* returns the number of allocated descriptors */
431
static int mv_xor_alloc_chan_resources(struct dma_chan *chan)
432
{
433 434
	void *virt_desc;
	dma_addr_t dma_desc;
435 436 437
	int idx;
	struct mv_xor_chan *mv_chan = to_mv_xor_chan(chan);
	struct mv_xor_desc_slot *slot = NULL;
438
	int num_descs_in_pool = MV_XOR_POOL_SIZE/MV_XOR_SLOT_SIZE;
439 440 441 442 443 444

	/* Allocate descriptor slots */
	idx = mv_chan->slots_allocated;
	while (idx < num_descs_in_pool) {
		slot = kzalloc(sizeof(*slot), GFP_KERNEL);
		if (!slot) {
445 446 447
			dev_info(mv_chan_to_devp(mv_chan),
				 "channel only initialized %d descriptor slots",
				 idx);
448 449
			break;
		}
450 451
		virt_desc = mv_chan->dma_desc_pool_virt;
		slot->hw_desc = virt_desc + idx * MV_XOR_SLOT_SIZE;
452 453 454

		dma_async_tx_descriptor_init(&slot->async_tx, chan);
		slot->async_tx.tx_submit = mv_xor_tx_submit;
455
		INIT_LIST_HEAD(&slot->node);
456 457
		dma_desc = mv_chan->dma_desc_pool;
		slot->async_tx.phys = dma_desc + idx * MV_XOR_SLOT_SIZE;
458 459 460 461
		slot->idx = idx++;

		spin_lock_bh(&mv_chan->lock);
		mv_chan->slots_allocated = idx;
462
		list_add_tail(&slot->node, &mv_chan->free_slots);
463 464 465
		spin_unlock_bh(&mv_chan->lock);
	}

466
	dev_dbg(mv_chan_to_devp(mv_chan),
467 468
		"allocated %d descriptor slots\n",
		mv_chan->slots_allocated);
469 470 471 472 473 474 475 476 477

	return mv_chan->slots_allocated ? : -ENOMEM;
}

static struct dma_async_tx_descriptor *
mv_xor_prep_dma_xor(struct dma_chan *chan, dma_addr_t dest, dma_addr_t *src,
		    unsigned int src_cnt, size_t len, unsigned long flags)
{
	struct mv_xor_chan *mv_chan = to_mv_xor_chan(chan);
478
	struct mv_xor_desc_slot *sw_desc;
479 480 481 482

	if (unlikely(len < MV_XOR_MIN_BYTE_COUNT))
		return NULL;

483
	BUG_ON(len > MV_XOR_MAX_BYTE_COUNT);
484

485
	dev_dbg(mv_chan_to_devp(mv_chan),
486
		"%s src_cnt: %d len: %zu dest %pad flags: %ld\n",
487
		__func__, src_cnt, len, &dest, flags);
488

489
	sw_desc = mv_chan_alloc_slot(mv_chan);
490 491 492
	if (sw_desc) {
		sw_desc->type = DMA_XOR;
		sw_desc->async_tx.flags = flags;
493
		mv_desc_init(sw_desc, dest, len, flags);
494 495
		if (mv_chan->op_in_desc == XOR_MODE_IN_DESC)
			mv_desc_set_mode(sw_desc);
496
		while (src_cnt--)
497
			mv_desc_set_src_addr(sw_desc, src_cnt, src[src_cnt]);
498
	}
499

500
	dev_dbg(mv_chan_to_devp(mv_chan),
501 502 503 504 505
		"%s sw_desc %p async_tx %p \n",
		__func__, sw_desc, &sw_desc->async_tx);
	return sw_desc ? &sw_desc->async_tx : NULL;
}

506 507 508 509 510 511 512 513 514 515 516
static struct dma_async_tx_descriptor *
mv_xor_prep_dma_memcpy(struct dma_chan *chan, dma_addr_t dest, dma_addr_t src,
		size_t len, unsigned long flags)
{
	/*
	 * A MEMCPY operation is identical to an XOR operation with only
	 * a single source address.
	 */
	return mv_xor_prep_dma_xor(chan, dest, &src, 1, len, flags);
}

517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534
static struct dma_async_tx_descriptor *
mv_xor_prep_dma_interrupt(struct dma_chan *chan, unsigned long flags)
{
	struct mv_xor_chan *mv_chan = to_mv_xor_chan(chan);
	dma_addr_t src, dest;
	size_t len;

	src = mv_chan->dummy_src_addr;
	dest = mv_chan->dummy_dst_addr;
	len = MV_XOR_MIN_BYTE_COUNT;

	/*
	 * We implement the DMA_INTERRUPT operation as a minimum sized
	 * XOR operation with a single dummy source address.
	 */
	return mv_xor_prep_dma_xor(chan, dest, &src, 1, len, flags);
}

535 536 537 538 539 540 541
static void mv_xor_free_chan_resources(struct dma_chan *chan)
{
	struct mv_xor_chan *mv_chan = to_mv_xor_chan(chan);
	struct mv_xor_desc_slot *iter, *_iter;
	int in_use_descs = 0;

	spin_lock_bh(&mv_chan->lock);
542

543
	mv_chan_slot_cleanup(mv_chan);
544 545

	list_for_each_entry_safe(iter, _iter, &mv_chan->chain,
546
					node) {
547
		in_use_descs++;
548
		list_move_tail(&iter->node, &mv_chan->free_slots);
549 550
	}
	list_for_each_entry_safe(iter, _iter, &mv_chan->completed_slots,
551 552 553 554 555 556
				 node) {
		in_use_descs++;
		list_move_tail(&iter->node, &mv_chan->free_slots);
	}
	list_for_each_entry_safe(iter, _iter, &mv_chan->allocated_slots,
				 node) {
557
		in_use_descs++;
558
		list_move_tail(&iter->node, &mv_chan->free_slots);
559 560
	}
	list_for_each_entry_safe_reverse(
561 562
		iter, _iter, &mv_chan->free_slots, node) {
		list_del(&iter->node);
563 564 565 566
		kfree(iter);
		mv_chan->slots_allocated--;
	}

567
	dev_dbg(mv_chan_to_devp(mv_chan), "%s slots_allocated %d\n",
568 569 570 571
		__func__, mv_chan->slots_allocated);
	spin_unlock_bh(&mv_chan->lock);

	if (in_use_descs)
572
		dev_err(mv_chan_to_devp(mv_chan),
573 574 575 576
			"freeing %d in use descriptors!\n", in_use_descs);
}

/**
577
 * mv_xor_status - poll the status of an XOR transaction
578 579
 * @chan: XOR channel handle
 * @cookie: XOR transaction identifier
580
 * @txstate: XOR transactions state holder (or NULL)
581
 */
582
static enum dma_status mv_xor_status(struct dma_chan *chan,
583
					  dma_cookie_t cookie,
584
					  struct dma_tx_state *txstate)
585 586 587 588
{
	struct mv_xor_chan *mv_chan = to_mv_xor_chan(chan);
	enum dma_status ret;

589
	ret = dma_cookie_status(chan, cookie, txstate);
590
	if (ret == DMA_COMPLETE)
591
		return ret;
592 593

	spin_lock_bh(&mv_chan->lock);
594
	mv_chan_slot_cleanup(mv_chan);
595
	spin_unlock_bh(&mv_chan->lock);
596

597
	return dma_cookie_status(chan, cookie, txstate);
598 599
}

600
static void mv_chan_dump_regs(struct mv_xor_chan *chan)
601 602 603
{
	u32 val;

604
	val = readl_relaxed(XOR_CONFIG(chan));
605
	dev_err(mv_chan_to_devp(chan), "config       0x%08x\n", val);
606

607
	val = readl_relaxed(XOR_ACTIVATION(chan));
608
	dev_err(mv_chan_to_devp(chan), "activation   0x%08x\n", val);
609

610
	val = readl_relaxed(XOR_INTR_CAUSE(chan));
611
	dev_err(mv_chan_to_devp(chan), "intr cause   0x%08x\n", val);
612

613
	val = readl_relaxed(XOR_INTR_MASK(chan));
614
	dev_err(mv_chan_to_devp(chan), "intr mask    0x%08x\n", val);
615

616
	val = readl_relaxed(XOR_ERROR_CAUSE(chan));
617
	dev_err(mv_chan_to_devp(chan), "error cause  0x%08x\n", val);
618

619
	val = readl_relaxed(XOR_ERROR_ADDR(chan));
620
	dev_err(mv_chan_to_devp(chan), "error addr   0x%08x\n", val);
621 622
}

623 624
static void mv_chan_err_interrupt_handler(struct mv_xor_chan *chan,
					  u32 intr_cause)
625
{
626 627 628
	if (intr_cause & XOR_INT_ERR_DECODE) {
		dev_dbg(mv_chan_to_devp(chan), "ignoring address decode error\n");
		return;
629 630
	}

631
	dev_err(mv_chan_to_devp(chan), "error on chan %d. intr cause 0x%08x\n",
632
		chan->idx, intr_cause);
633

634
	mv_chan_dump_regs(chan);
635
	WARN_ON(1);
636 637 638 639 640 641 642
}

static irqreturn_t mv_xor_interrupt_handler(int irq, void *data)
{
	struct mv_xor_chan *chan = data;
	u32 intr_cause = mv_chan_get_intr_cause(chan);

643
	dev_dbg(mv_chan_to_devp(chan), "intr cause %x\n", intr_cause);
644

645
	if (intr_cause & XOR_INTR_ERRORS)
646
		mv_chan_err_interrupt_handler(chan, intr_cause);
647 648 649

	tasklet_schedule(&chan->irq_tasklet);

650
	mv_chan_clear_eoc_cause(chan);
651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668

	return IRQ_HANDLED;
}

static void mv_xor_issue_pending(struct dma_chan *chan)
{
	struct mv_xor_chan *mv_chan = to_mv_xor_chan(chan);

	if (mv_chan->pending >= MV_XOR_THRESHOLD) {
		mv_chan->pending = 0;
		mv_chan_activate(mv_chan);
	}
}

/*
 * Perform a transaction to verify the HW works.
 */

669
static int mv_chan_memcpy_self_test(struct mv_xor_chan *mv_chan)
670
{
671
	int i, ret;
672 673 674 675 676
	void *src, *dest;
	dma_addr_t src_dma, dest_dma;
	struct dma_chan *dma_chan;
	dma_cookie_t cookie;
	struct dma_async_tx_descriptor *tx;
677
	struct dmaengine_unmap_data *unmap;
678 679
	int err = 0;

680
	src = kmalloc(sizeof(u8) * PAGE_SIZE, GFP_KERNEL);
681 682 683
	if (!src)
		return -ENOMEM;

684
	dest = kzalloc(sizeof(u8) * PAGE_SIZE, GFP_KERNEL);
685 686 687 688 689 690
	if (!dest) {
		kfree(src);
		return -ENOMEM;
	}

	/* Fill in src buffer */
691
	for (i = 0; i < PAGE_SIZE; i++)
692 693
		((u8 *) src)[i] = (u8)i;

694
	dma_chan = &mv_chan->dmachan;
695
	if (mv_xor_alloc_chan_resources(dma_chan) < 1) {
696 697 698 699
		err = -ENODEV;
		goto out;
	}

700 701 702 703 704 705
	unmap = dmaengine_get_unmap_data(dma_chan->device->dev, 2, GFP_KERNEL);
	if (!unmap) {
		err = -ENOMEM;
		goto free_resources;
	}

706 707 708
	src_dma = dma_map_page(dma_chan->device->dev, virt_to_page(src),
			       (size_t)src & ~PAGE_MASK, PAGE_SIZE,
			       DMA_TO_DEVICE);
709
	unmap->addr[0] = src_dma;
710

711 712 713 714 715 716 717
	ret = dma_mapping_error(dma_chan->device->dev, src_dma);
	if (ret) {
		err = -ENOMEM;
		goto free_resources;
	}
	unmap->to_cnt = 1;

718 719 720
	dest_dma = dma_map_page(dma_chan->device->dev, virt_to_page(dest),
				(size_t)dest & ~PAGE_MASK, PAGE_SIZE,
				DMA_FROM_DEVICE);
721 722
	unmap->addr[1] = dest_dma;

723 724 725 726 727 728
	ret = dma_mapping_error(dma_chan->device->dev, dest_dma);
	if (ret) {
		err = -ENOMEM;
		goto free_resources;
	}
	unmap->from_cnt = 1;
729
	unmap->len = PAGE_SIZE;
730 731

	tx = mv_xor_prep_dma_memcpy(dma_chan, dest_dma, src_dma,
732
				    PAGE_SIZE, 0);
733 734 735 736 737 738 739
	if (!tx) {
		dev_err(dma_chan->device->dev,
			"Self-test cannot prepare operation, disabling\n");
		err = -ENODEV;
		goto free_resources;
	}

740
	cookie = mv_xor_tx_submit(tx);
741 742 743 744 745 746 747
	if (dma_submit_error(cookie)) {
		dev_err(dma_chan->device->dev,
			"Self-test submit error, disabling\n");
		err = -ENODEV;
		goto free_resources;
	}

748 749 750 751
	mv_xor_issue_pending(dma_chan);
	async_tx_ack(tx);
	msleep(1);

752
	if (mv_xor_status(dma_chan, cookie, NULL) !=
753
	    DMA_COMPLETE) {
754 755
		dev_err(dma_chan->device->dev,
			"Self-test copy timed out, disabling\n");
756 757 758 759
		err = -ENODEV;
		goto free_resources;
	}

760
	dma_sync_single_for_cpu(dma_chan->device->dev, dest_dma,
761 762
				PAGE_SIZE, DMA_FROM_DEVICE);
	if (memcmp(src, dest, PAGE_SIZE)) {
763 764
		dev_err(dma_chan->device->dev,
			"Self-test copy failed compare, disabling\n");
765 766 767 768 769
		err = -ENODEV;
		goto free_resources;
	}

free_resources:
770
	dmaengine_unmap_put(unmap);
771 772 773 774 775 776 777 778
	mv_xor_free_chan_resources(dma_chan);
out:
	kfree(src);
	kfree(dest);
	return err;
}

#define MV_XOR_NUM_SRC_TEST 4 /* must be <= 15 */
B
Bill Pemberton 已提交
779
static int
780
mv_chan_xor_self_test(struct mv_xor_chan *mv_chan)
781
{
782
	int i, src_idx, ret;
783 784 785 786 787
	struct page *dest;
	struct page *xor_srcs[MV_XOR_NUM_SRC_TEST];
	dma_addr_t dma_srcs[MV_XOR_NUM_SRC_TEST];
	dma_addr_t dest_dma;
	struct dma_async_tx_descriptor *tx;
788
	struct dmaengine_unmap_data *unmap;
789 790 791 792 793
	struct dma_chan *dma_chan;
	dma_cookie_t cookie;
	u8 cmp_byte = 0;
	u32 cmp_word;
	int err = 0;
794
	int src_count = MV_XOR_NUM_SRC_TEST;
795

796
	for (src_idx = 0; src_idx < src_count; src_idx++) {
797
		xor_srcs[src_idx] = alloc_page(GFP_KERNEL);
798 799
		if (!xor_srcs[src_idx]) {
			while (src_idx--)
800
				__free_page(xor_srcs[src_idx]);
801 802
			return -ENOMEM;
		}
803 804 805
	}

	dest = alloc_page(GFP_KERNEL);
806 807
	if (!dest) {
		while (src_idx--)
808
			__free_page(xor_srcs[src_idx]);
809 810
		return -ENOMEM;
	}
811 812

	/* Fill in src buffers */
813
	for (src_idx = 0; src_idx < src_count; src_idx++) {
814 815 816 817 818
		u8 *ptr = page_address(xor_srcs[src_idx]);
		for (i = 0; i < PAGE_SIZE; i++)
			ptr[i] = (1 << src_idx);
	}

819
	for (src_idx = 0; src_idx < src_count; src_idx++)
820 821 822 823 824 825 826
		cmp_byte ^= (u8) (1 << src_idx);

	cmp_word = (cmp_byte << 24) | (cmp_byte << 16) |
		(cmp_byte << 8) | cmp_byte;

	memset(page_address(dest), 0, PAGE_SIZE);

827
	dma_chan = &mv_chan->dmachan;
828
	if (mv_xor_alloc_chan_resources(dma_chan) < 1) {
829 830 831 832
		err = -ENODEV;
		goto out;
	}

833 834 835 836 837 838 839
	unmap = dmaengine_get_unmap_data(dma_chan->device->dev, src_count + 1,
					 GFP_KERNEL);
	if (!unmap) {
		err = -ENOMEM;
		goto free_resources;
	}

840
	/* test xor */
841 842 843 844
	for (i = 0; i < src_count; i++) {
		unmap->addr[i] = dma_map_page(dma_chan->device->dev, xor_srcs[i],
					      0, PAGE_SIZE, DMA_TO_DEVICE);
		dma_srcs[i] = unmap->addr[i];
845 846 847 848 849
		ret = dma_mapping_error(dma_chan->device->dev, unmap->addr[i]);
		if (ret) {
			err = -ENOMEM;
			goto free_resources;
		}
850 851
		unmap->to_cnt++;
	}
852

853 854 855
	unmap->addr[src_count] = dma_map_page(dma_chan->device->dev, dest, 0, PAGE_SIZE,
				      DMA_FROM_DEVICE);
	dest_dma = unmap->addr[src_count];
856 857 858 859 860
	ret = dma_mapping_error(dma_chan->device->dev, unmap->addr[src_count]);
	if (ret) {
		err = -ENOMEM;
		goto free_resources;
	}
861 862
	unmap->from_cnt = 1;
	unmap->len = PAGE_SIZE;
863 864

	tx = mv_xor_prep_dma_xor(dma_chan, dest_dma, dma_srcs,
865
				 src_count, PAGE_SIZE, 0);
866 867 868 869 870 871
	if (!tx) {
		dev_err(dma_chan->device->dev,
			"Self-test cannot prepare operation, disabling\n");
		err = -ENODEV;
		goto free_resources;
	}
872 873

	cookie = mv_xor_tx_submit(tx);
874 875 876 877 878 879 880
	if (dma_submit_error(cookie)) {
		dev_err(dma_chan->device->dev,
			"Self-test submit error, disabling\n");
		err = -ENODEV;
		goto free_resources;
	}

881 882 883 884
	mv_xor_issue_pending(dma_chan);
	async_tx_ack(tx);
	msleep(8);

885
	if (mv_xor_status(dma_chan, cookie, NULL) !=
886
	    DMA_COMPLETE) {
887 888
		dev_err(dma_chan->device->dev,
			"Self-test xor timed out, disabling\n");
889 890 891 892
		err = -ENODEV;
		goto free_resources;
	}

893
	dma_sync_single_for_cpu(dma_chan->device->dev, dest_dma,
894 895 896 897
				PAGE_SIZE, DMA_FROM_DEVICE);
	for (i = 0; i < (PAGE_SIZE / sizeof(u32)); i++) {
		u32 *ptr = page_address(dest);
		if (ptr[i] != cmp_word) {
898
			dev_err(dma_chan->device->dev,
899 900
				"Self-test xor failed compare, disabling. index %d, data %x, expected %x\n",
				i, ptr[i], cmp_word);
901 902 903 904 905 906
			err = -ENODEV;
			goto free_resources;
		}
	}

free_resources:
907
	dmaengine_unmap_put(unmap);
908 909
	mv_xor_free_chan_resources(dma_chan);
out:
910
	src_idx = src_count;
911 912 913 914 915 916
	while (src_idx--)
		__free_page(xor_srcs[src_idx]);
	__free_page(dest);
	return err;
}

917
static int mv_xor_channel_remove(struct mv_xor_chan *mv_chan)
918 919
{
	struct dma_chan *chan, *_chan;
920
	struct device *dev = mv_chan->dmadev.dev;
921

922
	dma_async_device_unregister(&mv_chan->dmadev);
923

924
	dma_free_coherent(dev, MV_XOR_POOL_SIZE,
925
			  mv_chan->dma_desc_pool_virt, mv_chan->dma_desc_pool);
926 927 928 929
	dma_unmap_single(dev, mv_chan->dummy_src_addr,
			 MV_XOR_MIN_BYTE_COUNT, DMA_FROM_DEVICE);
	dma_unmap_single(dev, mv_chan->dummy_dst_addr,
			 MV_XOR_MIN_BYTE_COUNT, DMA_TO_DEVICE);
930

931
	list_for_each_entry_safe(chan, _chan, &mv_chan->dmadev.channels,
932
				 device_node) {
933 934 935
		list_del(&chan->device_node);
	}

936 937
	free_irq(mv_chan->irq, mv_chan);

938 939 940
	return 0;
}

941
static struct mv_xor_chan *
942
mv_xor_channel_add(struct mv_xor_device *xordev,
943
		   struct platform_device *pdev,
944
		   int idx, dma_cap_mask_t cap_mask, int irq)
945 946 947 948 949
{
	int ret = 0;
	struct mv_xor_chan *mv_chan;
	struct dma_device *dma_dev;

950
	mv_chan = devm_kzalloc(&pdev->dev, sizeof(*mv_chan), GFP_KERNEL);
951 952
	if (!mv_chan)
		return ERR_PTR(-ENOMEM);
953

954
	mv_chan->idx = idx;
955
	mv_chan->irq = irq;
956 957 958 959
	if (xordev->xor_type == XOR_ORION)
		mv_chan->op_in_desc = XOR_MODE_IN_REG;
	else
		mv_chan->op_in_desc = XOR_MODE_IN_DESC;
960

961
	dma_dev = &mv_chan->dmadev;
962

963 964 965 966 967 968 969 970 971 972
	/*
	 * These source and destination dummy buffers are used to implement
	 * a DMA_INTERRUPT operation as a minimum-sized XOR operation.
	 * Hence, we only need to map the buffers at initialization-time.
	 */
	mv_chan->dummy_src_addr = dma_map_single(dma_dev->dev,
		mv_chan->dummy_src, MV_XOR_MIN_BYTE_COUNT, DMA_FROM_DEVICE);
	mv_chan->dummy_dst_addr = dma_map_single(dma_dev->dev,
		mv_chan->dummy_dst, MV_XOR_MIN_BYTE_COUNT, DMA_TO_DEVICE);

973 974 975 976
	/* allocate coherent memory for hardware descriptors
	 * note: writecombine gives slightly better performance, but
	 * requires that we explicitly flush the writes
	 */
977
	mv_chan->dma_desc_pool_virt =
978 979
	  dma_alloc_wc(&pdev->dev, MV_XOR_POOL_SIZE, &mv_chan->dma_desc_pool,
		       GFP_KERNEL);
980
	if (!mv_chan->dma_desc_pool_virt)
981
		return ERR_PTR(-ENOMEM);
982 983

	/* discover transaction capabilites from the platform data */
984
	dma_dev->cap_mask = cap_mask;
985 986 987 988 989 990

	INIT_LIST_HEAD(&dma_dev->channels);

	/* set base routines */
	dma_dev->device_alloc_chan_resources = mv_xor_alloc_chan_resources;
	dma_dev->device_free_chan_resources = mv_xor_free_chan_resources;
991
	dma_dev->device_tx_status = mv_xor_status;
992 993 994 995
	dma_dev->device_issue_pending = mv_xor_issue_pending;
	dma_dev->dev = &pdev->dev;

	/* set prep routines based on capability */
996 997
	if (dma_has_cap(DMA_INTERRUPT, dma_dev->cap_mask))
		dma_dev->device_prep_dma_interrupt = mv_xor_prep_dma_interrupt;
998 999 1000
	if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask))
		dma_dev->device_prep_dma_memcpy = mv_xor_prep_dma_memcpy;
	if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
1001
		dma_dev->max_xor = 8;
1002 1003 1004
		dma_dev->device_prep_dma_xor = mv_xor_prep_dma_xor;
	}

1005
	mv_chan->mmr_base = xordev->xor_base;
1006
	mv_chan->mmr_high_base = xordev->xor_high_base;
1007 1008 1009 1010
	tasklet_init(&mv_chan->irq_tasklet, mv_xor_tasklet, (unsigned long)
		     mv_chan);

	/* clear errors before enabling interrupts */
1011
	mv_chan_clear_err_status(mv_chan);
1012

1013 1014
	ret = request_irq(mv_chan->irq, mv_xor_interrupt_handler,
			  0, dev_name(&pdev->dev), mv_chan);
1015 1016 1017 1018 1019
	if (ret)
		goto err_free_dma;

	mv_chan_unmask_interrupts(mv_chan);

1020
	if (mv_chan->op_in_desc == XOR_MODE_IN_DESC)
1021
		mv_chan_set_mode(mv_chan, XOR_OPERATION_MODE_IN_DESC);
1022
	else
1023
		mv_chan_set_mode(mv_chan, XOR_OPERATION_MODE_XOR);
1024 1025 1026 1027

	spin_lock_init(&mv_chan->lock);
	INIT_LIST_HEAD(&mv_chan->chain);
	INIT_LIST_HEAD(&mv_chan->completed_slots);
1028 1029
	INIT_LIST_HEAD(&mv_chan->free_slots);
	INIT_LIST_HEAD(&mv_chan->allocated_slots);
1030 1031
	mv_chan->dmachan.device = dma_dev;
	dma_cookie_init(&mv_chan->dmachan);
1032

1033
	list_add_tail(&mv_chan->dmachan.device_node, &dma_dev->channels);
1034 1035

	if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask)) {
1036
		ret = mv_chan_memcpy_self_test(mv_chan);
1037 1038
		dev_dbg(&pdev->dev, "memcpy self test returned %d\n", ret);
		if (ret)
1039
			goto err_free_irq;
1040 1041 1042
	}

	if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
1043
		ret = mv_chan_xor_self_test(mv_chan);
1044 1045
		dev_dbg(&pdev->dev, "xor self test returned %d\n", ret);
		if (ret)
1046
			goto err_free_irq;
1047 1048
	}

1049 1050
	dev_info(&pdev->dev, "Marvell XOR (%s): ( %s%s%s)\n",
		 mv_chan->op_in_desc ? "Descriptor Mode" : "Registers Mode",
1051 1052 1053
		 dma_has_cap(DMA_XOR, dma_dev->cap_mask) ? "xor " : "",
		 dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask) ? "cpy " : "",
		 dma_has_cap(DMA_INTERRUPT, dma_dev->cap_mask) ? "intr " : "");
1054 1055

	dma_async_device_register(dma_dev);
1056
	return mv_chan;
1057

1058 1059
err_free_irq:
	free_irq(mv_chan->irq, mv_chan);
1060
 err_free_dma:
1061
	dma_free_coherent(&pdev->dev, MV_XOR_POOL_SIZE,
1062
			  mv_chan->dma_desc_pool_virt, mv_chan->dma_desc_pool);
1063
	return ERR_PTR(ret);
1064 1065 1066
}

static void
1067
mv_xor_conf_mbus_windows(struct mv_xor_device *xordev,
1068
			 const struct mbus_dram_target_info *dram)
1069
{
1070
	void __iomem *base = xordev->xor_high_base;
1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081
	u32 win_enable = 0;
	int i;

	for (i = 0; i < 8; i++) {
		writel(0, base + WINDOW_BASE(i));
		writel(0, base + WINDOW_SIZE(i));
		if (i < 4)
			writel(0, base + WINDOW_REMAP_HIGH(i));
	}

	for (i = 0; i < dram->num_cs; i++) {
1082
		const struct mbus_dram_window *cs = dram->cs + i;
1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094

		writel((cs->base & 0xffff0000) |
		       (cs->mbus_attr << 8) |
		       dram->mbus_dram_target_id, base + WINDOW_BASE(i));
		writel((cs->size - 1) & 0xffff0000, base + WINDOW_SIZE(i));

		win_enable |= (1 << i);
		win_enable |= 3 << (16 + (2 * i));
	}

	writel(win_enable, base + WINDOW_BAR_ENABLE(0));
	writel(win_enable, base + WINDOW_BAR_ENABLE(1));
1095 1096
	writel(0, base + WINDOW_OVERRIDE_CTRL(0));
	writel(0, base + WINDOW_OVERRIDE_CTRL(1));
1097 1098
}

1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125
static void
mv_xor_conf_mbus_windows_a3700(struct mv_xor_device *xordev)
{
	void __iomem *base = xordev->xor_high_base;
	u32 win_enable = 0;
	int i;

	for (i = 0; i < 8; i++) {
		writel(0, base + WINDOW_BASE(i));
		writel(0, base + WINDOW_SIZE(i));
		if (i < 4)
			writel(0, base + WINDOW_REMAP_HIGH(i));
	}
	/*
	 * For Armada3700 open default 4GB Mbus window. The dram
	 * related configuration are done at AXIS level.
	 */
	writel(0xffff0000, base + WINDOW_SIZE(0));
	win_enable |= 1;
	win_enable |= 3 << 16;

	writel(win_enable, base + WINDOW_BAR_ENABLE(0));
	writel(win_enable, base + WINDOW_BAR_ENABLE(1));
	writel(0, base + WINDOW_OVERRIDE_CTRL(0));
	writel(0, base + WINDOW_OVERRIDE_CTRL(1));
}

1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169
/*
 * Since this XOR driver is basically used only for RAID5, we don't
 * need to care about synchronizing ->suspend with DMA activity,
 * because the DMA engine will naturally be quiet due to the block
 * devices being suspended.
 */
static int mv_xor_suspend(struct platform_device *pdev, pm_message_t state)
{
	struct mv_xor_device *xordev = platform_get_drvdata(pdev);
	int i;

	for (i = 0; i < MV_XOR_MAX_CHANNELS; i++) {
		struct mv_xor_chan *mv_chan = xordev->channels[i];

		if (!mv_chan)
			continue;

		mv_chan->saved_config_reg =
			readl_relaxed(XOR_CONFIG(mv_chan));
		mv_chan->saved_int_mask_reg =
			readl_relaxed(XOR_INTR_MASK(mv_chan));
	}

	return 0;
}

static int mv_xor_resume(struct platform_device *dev)
{
	struct mv_xor_device *xordev = platform_get_drvdata(dev);
	const struct mbus_dram_target_info *dram;
	int i;

	for (i = 0; i < MV_XOR_MAX_CHANNELS; i++) {
		struct mv_xor_chan *mv_chan = xordev->channels[i];

		if (!mv_chan)
			continue;

		writel_relaxed(mv_chan->saved_config_reg,
			       XOR_CONFIG(mv_chan));
		writel_relaxed(mv_chan->saved_int_mask_reg,
			       XOR_INTR_MASK(mv_chan));
	}

1170 1171 1172 1173 1174
	if (xordev->xor_type == XOR_ARMADA_37XX) {
		mv_xor_conf_mbus_windows_a3700(xordev);
		return 0;
	}

1175 1176 1177 1178 1179 1180 1181
	dram = mv_mbus_dram_info();
	if (dram)
		mv_xor_conf_mbus_windows(xordev, dram);

	return 0;
}

1182
static const struct of_device_id mv_xor_dt_ids[] = {
1183 1184
	{ .compatible = "marvell,orion-xor", .data = (void *)XOR_ORION },
	{ .compatible = "marvell,armada-380-xor", .data = (void *)XOR_ARMADA_38X },
1185
	{ .compatible = "marvell,armada-3700-xor", .data = (void *)XOR_ARMADA_37XX },
1186 1187 1188
	{},
};

1189
static unsigned int mv_xor_engine_count;
1190

1191
static int mv_xor_probe(struct platform_device *pdev)
1192
{
1193
	const struct mbus_dram_target_info *dram;
1194
	struct mv_xor_device *xordev;
J
Jingoo Han 已提交
1195
	struct mv_xor_platform_data *pdata = dev_get_platdata(&pdev->dev);
1196
	struct resource *res;
1197
	unsigned int max_engines, max_channels;
1198
	int i, ret;
1199

1200
	dev_notice(&pdev->dev, "Marvell shared XOR driver\n");
1201

1202 1203
	xordev = devm_kzalloc(&pdev->dev, sizeof(*xordev), GFP_KERNEL);
	if (!xordev)
1204 1205 1206 1207 1208 1209
		return -ENOMEM;

	res = platform_get_resource(pdev, IORESOURCE_MEM, 0);
	if (!res)
		return -ENODEV;

1210 1211 1212
	xordev->xor_base = devm_ioremap(&pdev->dev, res->start,
					resource_size(res));
	if (!xordev->xor_base)
1213 1214 1215 1216 1217 1218
		return -EBUSY;

	res = platform_get_resource(pdev, IORESOURCE_MEM, 1);
	if (!res)
		return -ENODEV;

1219 1220 1221
	xordev->xor_high_base = devm_ioremap(&pdev->dev, res->start,
					     resource_size(res));
	if (!xordev->xor_high_base)
1222 1223
		return -EBUSY;

1224
	platform_set_drvdata(pdev, xordev);
1225

1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239

	/*
	 * We need to know which type of XOR device we use before
	 * setting up. In non-dt case it can only be the legacy one.
	 */
	xordev->xor_type = XOR_ORION;
	if (pdev->dev.of_node) {
		const struct of_device_id *of_id =
			of_match_device(mv_xor_dt_ids,
					&pdev->dev);

		xordev->xor_type = (uintptr_t)of_id->data;
	}

1240 1241 1242
	/*
	 * (Re-)program MBUS remapping windows if we are asked to.
	 */
1243 1244 1245 1246 1247 1248 1249
	if (xordev->xor_type == XOR_ARMADA_37XX) {
		mv_xor_conf_mbus_windows_a3700(xordev);
	} else {
		dram = mv_mbus_dram_info();
		if (dram)
			mv_xor_conf_mbus_windows(xordev, dram);
	}
1250

1251 1252 1253
	/* Not all platforms can gate the clock, so it is not
	 * an error if the clock does not exists.
	 */
1254 1255 1256
	xordev->clk = clk_get(&pdev->dev, NULL);
	if (!IS_ERR(xordev->clk))
		clk_prepare_enable(xordev->clk);
1257

1258 1259 1260 1261 1262
	/*
	 * We don't want to have more than one channel per CPU in
	 * order for async_tx to perform well. So we limit the number
	 * of engines and channels so that we take into account this
	 * constraint. Note that we also want to use channels from
1263 1264
	 * separate engines when possible.  For dual-CPU Armada 3700
	 * SoC with single XOR engine allow using its both channels.
1265 1266
	 */
	max_engines = num_present_cpus();
1267 1268 1269 1270 1271 1272
	if (xordev->xor_type == XOR_ARMADA_37XX)
		max_channels =	num_present_cpus();
	else
		max_channels = min_t(unsigned int,
				     MV_XOR_MAX_CHANNELS,
				     DIV_ROUND_UP(num_present_cpus(), 2));
1273 1274 1275 1276

	if (mv_xor_engine_count >= max_engines)
		return 0;

1277 1278 1279 1280 1281
	if (pdev->dev.of_node) {
		struct device_node *np;
		int i = 0;

		for_each_child_of_node(pdev->dev.of_node, np) {
1282
			struct mv_xor_chan *chan;
1283 1284 1285
			dma_cap_mask_t cap_mask;
			int irq;

1286 1287 1288
			if (i >= max_channels)
				continue;

1289
			dma_cap_zero(cap_mask);
1290 1291 1292
			dma_cap_set(DMA_MEMCPY, cap_mask);
			dma_cap_set(DMA_XOR, cap_mask);
			dma_cap_set(DMA_INTERRUPT, cap_mask);
1293 1294

			irq = irq_of_parse_and_map(np, 0);
1295 1296
			if (!irq) {
				ret = -ENODEV;
1297 1298 1299
				goto err_channel_add;
			}

1300
			chan = mv_xor_channel_add(xordev, pdev, i,
1301
						  cap_mask, irq);
1302 1303
			if (IS_ERR(chan)) {
				ret = PTR_ERR(chan);
1304 1305 1306 1307
				irq_dispose_mapping(irq);
				goto err_channel_add;
			}

1308
			xordev->channels[i] = chan;
1309 1310 1311
			i++;
		}
	} else if (pdata && pdata->channels) {
1312
		for (i = 0; i < max_channels; i++) {
1313
			struct mv_xor_channel_data *cd;
1314
			struct mv_xor_chan *chan;
1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328
			int irq;

			cd = &pdata->channels[i];
			if (!cd) {
				ret = -ENODEV;
				goto err_channel_add;
			}

			irq = platform_get_irq(pdev, i);
			if (irq < 0) {
				ret = irq;
				goto err_channel_add;
			}

1329
			chan = mv_xor_channel_add(xordev, pdev, i,
1330
						  cd->cap_mask, irq);
1331 1332
			if (IS_ERR(chan)) {
				ret = PTR_ERR(chan);
1333 1334
				goto err_channel_add;
			}
1335 1336

			xordev->channels[i] = chan;
1337 1338
		}
	}
1339

1340
	return 0;
1341 1342 1343

err_channel_add:
	for (i = 0; i < MV_XOR_MAX_CHANNELS; i++)
1344
		if (xordev->channels[i]) {
1345
			mv_xor_channel_remove(xordev->channels[i]);
1346 1347 1348
			if (pdev->dev.of_node)
				irq_dispose_mapping(xordev->channels[i]->irq);
		}
1349

1350 1351 1352 1353 1354
	if (!IS_ERR(xordev->clk)) {
		clk_disable_unprepare(xordev->clk);
		clk_put(xordev->clk);
	}

1355
	return ret;
1356 1357
}

1358 1359
static struct platform_driver mv_xor_driver = {
	.probe		= mv_xor_probe,
1360 1361
	.suspend        = mv_xor_suspend,
	.resume         = mv_xor_resume,
1362
	.driver		= {
1363 1364
		.name	        = MV_XOR_NAME,
		.of_match_table = of_match_ptr(mv_xor_dt_ids),
1365 1366 1367 1368 1369 1370
	},
};


static int __init mv_xor_init(void)
{
1371
	return platform_driver_register(&mv_xor_driver);
1372
}
1373
device_initcall(mv_xor_init);
1374

1375
/*
1376 1377 1378
MODULE_AUTHOR("Saeed Bishara <saeed@marvell.com>");
MODULE_DESCRIPTION("DMA engine driver for Marvell's XOR engine");
MODULE_LICENSE("GPL");
1379
*/