dmapool.c 12.9 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19
/*
 * DMA Pool allocator
 *
 * Copyright 2001 David Brownell
 * Copyright 2007 Intel Corporation
 *   Author: Matthew Wilcox <willy@linux.intel.com>
 *
 * This software may be redistributed and/or modified under the terms of
 * the GNU General Public License ("GPL") version 2 as published by the
 * Free Software Foundation.
 *
 * This allocator returns small blocks of a given size which are DMA-able by
 * the given device.  It uses the dma_alloc_coherent page allocator to get
 * new pages, then splits them up into blocks of the required size.
 * Many older drivers still have their own code to do this.
 *
 * The current design of this allocator is fairly simple.  The pool is
 * represented by the 'struct dma_pool' which keeps a doubly-linked list of
 * allocated pages.  Each page in the page_list is split into blocks of at
 * least 'size' bytes.  Free blocks are tracked in an unsorted singly-linked
 * list of free blocks within the page.  Used blocks aren't tracked, but we
 * keep a count of how many are currently allocated from each page.
 */
L
Linus Torvalds 已提交
24 25 26 27

#include <linux/device.h>
#include <linux/dma-mapping.h>
#include <linux/dmapool.h>
28 29
#include <linux/kernel.h>
#include <linux/list.h>
L
Linus Torvalds 已提交
30
#include <linux/module.h>
31
#include <linux/mutex.h>
32
#include <linux/poison.h>
A
Alexey Dobriyan 已提交
33
#include <linux/sched.h>
34 35 36 37 38
#include <linux/slab.h>
#include <linux/spinlock.h>
#include <linux/string.h>
#include <linux/types.h>
#include <linux/wait.h>
L
Linus Torvalds 已提交
39

40 41 42 43
/*
 * Piggy-back on the slab debugging options: when either is configured,
 * DMAPOOL_DEBUG turns on block poisoning and the extra sanity checks in
 * dma_pool_free().
 */
#if defined(CONFIG_DEBUG_SLAB) || defined(CONFIG_SLUB_DEBUG_ON)
#define DMAPOOL_DEBUG 1
#endif

M
Matthew Wilcox 已提交
44 45 46 47 48 49
struct dma_pool {		/* the pool */
	struct list_head page_list;
	spinlock_t lock;
	size_t size;
	struct device *dev;
	size_t allocation;
50
	size_t boundary;
M
Matthew Wilcox 已提交
51 52 53
	char name[32];
	wait_queue_head_t waitq;
	struct list_head pools;
L
Linus Torvalds 已提交
54 55
};

M
Matthew Wilcox 已提交
56 57 58 59
struct dma_page {		/* cacheable header for 'allocation' bytes */
	struct list_head page_list;	/* link in dma_pool.page_list */
	void *vaddr;			/* kernel virtual address of the chunk */
	dma_addr_t dma;			/* dma address of the chunk */
	unsigned int in_use;		/* blocks currently handed out */
	unsigned int offset;		/* first free block; >= allocation when full */
};

/*
 * How long dma_pool_alloc() sleeps before retrying when no block could be
 * obtained: 100 milliseconds, expressed in jiffies.
 */
#define	POOL_TIMEOUT_JIFFIES	((100 /* msec */ * HZ) / 1000)

M
Matthew Wilcox 已提交
66
/*
 * Held while a pool is linked into or removed from a device's dma_pools
 * list, while the "pools" attribute file is created or removed, and while
 * show_pools() walks the list.
 */
static DEFINE_MUTEX(pools_lock);
L
Linus Torvalds 已提交
67 68

static ssize_t
M
Matthew Wilcox 已提交
69
show_pools(struct device *dev, struct device_attribute *attr, char *buf)
L
Linus Torvalds 已提交
70 71 72 73 74 75 76 77 78 79 80 81 82 83
{
	unsigned temp;
	unsigned size;
	char *next;
	struct dma_page *page;
	struct dma_pool *pool;

	next = buf;
	size = PAGE_SIZE;

	temp = scnprintf(next, size, "poolinfo - 0.1\n");
	size -= temp;
	next += temp;

84
	mutex_lock(&pools_lock);
L
Linus Torvalds 已提交
85 86 87 88 89 90 91 92 93 94 95
	list_for_each_entry(pool, &dev->dma_pools, pools) {
		unsigned pages = 0;
		unsigned blocks = 0;

		list_for_each_entry(page, &pool->page_list, page_list) {
			pages++;
			blocks += page->in_use;
		}

		/* per-pool info, no real statistics yet */
		temp = scnprintf(next, size, "%-16s %4u %4Zu %4Zu %2u\n",
96 97
				 pool->name, blocks,
				 pages * (pool->allocation / pool->size),
M
Matthew Wilcox 已提交
98
				 pool->size, pages);
L
Linus Torvalds 已提交
99 100 101
		size -= temp;
		next += temp;
	}
102
	mutex_unlock(&pools_lock);
L
Linus Torvalds 已提交
103 104 105

	return PAGE_SIZE - size;
}
M
Matthew Wilcox 已提交
106 107

static DEVICE_ATTR(pools, S_IRUGO, show_pools, NULL);
L
Linus Torvalds 已提交
108 109 110 111 112 113 114

/**
 * dma_pool_create - Creates a pool of consistent memory blocks, for dma.
 * @name: name of pool, for diagnostics
 * @dev: device that will be doing the DMA
 * @size: size of the blocks in this pool.
 * @align: alignment requirement for blocks; must be a power of two
115
 * @boundary: returned blocks won't cross this power of two boundary
L
Linus Torvalds 已提交
116 117 118 119 120 121 122 123 124
 * Context: !in_interrupt()
 *
 * Returns a dma allocation pool with the requested characteristics, or
 * null if one can't be created.  Given one of these pools, dma_pool_alloc()
 * may be used to allocate memory.  Such memory will all have "consistent"
 * DMA mappings, accessible by the device and its driver without using
 * cache flushing primitives.  The actual size of blocks allocated may be
 * larger than requested because of alignment.
 *
125
 * If @boundary is nonzero, objects returned from dma_pool_alloc() won't
L
Linus Torvalds 已提交
126 127 128 129
 * cross that size boundary.  This is useful for devices which have
 * addressing restrictions on individual DMA transfers, such as not crossing
 * boundaries of 4KBytes.
 */
M
Matthew Wilcox 已提交
130
struct dma_pool *dma_pool_create(const char *name, struct device *dev,
131
				 size_t size, size_t align, size_t boundary)
L
Linus Torvalds 已提交
132
{
M
Matthew Wilcox 已提交
133
	struct dma_pool *retval;
134
	size_t allocation;
L
Linus Torvalds 已提交
135

136
	if (align == 0) {
L
Linus Torvalds 已提交
137
		align = 1;
138
	} else if (align & (align - 1)) {
L
Linus Torvalds 已提交
139 140 141
		return NULL;
	}

142
	if (size == 0) {
143
		return NULL;
144 145 146
	} else if (size < 4) {
		size = 4;
	}
147 148 149 150

	if ((size % align) != 0)
		size = ALIGN(size, align);

151 152 153 154 155
	allocation = max_t(size_t, size, PAGE_SIZE);

	if (!boundary) {
		boundary = allocation;
	} else if ((boundary < size) || (boundary & (boundary - 1))) {
L
Linus Torvalds 已提交
156
		return NULL;
157
	}
L
Linus Torvalds 已提交
158

159 160
	retval = kmalloc_node(sizeof(*retval), GFP_KERNEL, dev_to_node(dev));
	if (!retval)
L
Linus Torvalds 已提交
161 162
		return retval;

163
	strlcpy(retval->name, name, sizeof(retval->name));
L
Linus Torvalds 已提交
164 165 166

	retval->dev = dev;

M
Matthew Wilcox 已提交
167 168
	INIT_LIST_HEAD(&retval->page_list);
	spin_lock_init(&retval->lock);
L
Linus Torvalds 已提交
169
	retval->size = size;
170
	retval->boundary = boundary;
L
Linus Torvalds 已提交
171
	retval->allocation = allocation;
M
Matthew Wilcox 已提交
172
	init_waitqueue_head(&retval->waitq);
L
Linus Torvalds 已提交
173 174

	if (dev) {
175 176
		int ret;

177
		mutex_lock(&pools_lock);
M
Matthew Wilcox 已提交
178 179
		if (list_empty(&dev->dma_pools))
			ret = device_create_file(dev, &dev_attr_pools);
180 181
		else
			ret = 0;
L
Linus Torvalds 已提交
182
		/* note:  not currently insisting "name" be unique */
183
		if (!ret)
M
Matthew Wilcox 已提交
184
			list_add(&retval->pools, &dev->dma_pools);
185 186 187 188
		else {
			kfree(retval);
			retval = NULL;
		}
189
		mutex_unlock(&pools_lock);
L
Linus Torvalds 已提交
190
	} else
M
Matthew Wilcox 已提交
191
		INIT_LIST_HEAD(&retval->pools);
L
Linus Torvalds 已提交
192 193 194

	return retval;
}
M
Matthew Wilcox 已提交
195
EXPORT_SYMBOL(dma_pool_create);
L
Linus Torvalds 已提交
196

197 198 199
static void pool_initialise_page(struct dma_pool *pool, struct dma_page *page)
{
	unsigned int offset = 0;
200
	unsigned int next_boundary = pool->boundary;
201 202 203

	do {
		unsigned int next = offset + pool->size;
204 205 206 207
		if (unlikely((next + pool->size) >= next_boundary)) {
			next = next_boundary;
			next_boundary += pool->boundary;
		}
208 209 210 211 212
		*(int *)(page->vaddr + offset) = next;
		offset = next;
	} while (offset < pool->allocation);
}

M
Matthew Wilcox 已提交
213
/*
 * Allocate one backing chunk for @pool and link it into pool->page_list.
 *
 * @mem_flags is used both for the dma_page header and for the coherent
 * allocation.  Returns the new page with all of its blocks free, or NULL if
 * either allocation fails.
 */
static struct dma_page *pool_alloc_page(struct dma_pool *pool, gfp_t mem_flags)
{
	struct dma_page *page;

	page = kmalloc(sizeof(*page), mem_flags);
	if (!page)
		return NULL;

	page->vaddr = dma_alloc_coherent(pool->dev, pool->allocation,
					 &page->dma, mem_flags);
	if (!page->vaddr) {
		kfree(page);
		return NULL;
	}

#ifdef	DMAPOOL_DEBUG
	/* Poison first: pool_initialise_page() then writes the free links. */
	memset(page->vaddr, POOL_POISON_FREED, pool->allocation);
#endif
	pool_initialise_page(pool, page);
	page->in_use = 0;
	page->offset = 0;
	list_add(&page->page_list, &pool->page_list);

	return page;
}

237
static inline int is_page_busy(struct dma_page *page)
L
Linus Torvalds 已提交
238
{
239
	return page->in_use != 0;
L
Linus Torvalds 已提交
240 241
}

M
Matthew Wilcox 已提交
242
static void pool_free_page(struct dma_pool *pool, struct dma_page *page)
L
Linus Torvalds 已提交
243
{
M
Matthew Wilcox 已提交
244
	dma_addr_t dma = page->dma;
L
Linus Torvalds 已提交
245

246
#ifdef	DMAPOOL_DEBUG
M
Matthew Wilcox 已提交
247
	memset(page->vaddr, POOL_POISON_FREED, pool->allocation);
L
Linus Torvalds 已提交
248
#endif
M
Matthew Wilcox 已提交
249 250 251
	dma_free_coherent(pool->dev, pool->allocation, page->vaddr, dma);
	list_del(&page->page_list);
	kfree(page);
L
Linus Torvalds 已提交
252 253 254 255 256 257 258 259 260 261
}

/**
 * dma_pool_destroy - destroys a pool of dma memory blocks.
 * @pool: dma pool that will be destroyed
 * Context: !in_interrupt()
 *
 * Caller guarantees that no more memory from the pool is in use,
 * and that nothing will try to use the pool after this call.
 */
M
Matthew Wilcox 已提交
262
void dma_pool_destroy(struct dma_pool *pool)
L
Linus Torvalds 已提交
263
{
264
	mutex_lock(&pools_lock);
M
Matthew Wilcox 已提交
265 266 267
	list_del(&pool->pools);
	if (pool->dev && list_empty(&pool->dev->dma_pools))
		device_remove_file(pool->dev, &dev_attr_pools);
268
	mutex_unlock(&pools_lock);
L
Linus Torvalds 已提交
269

M
Matthew Wilcox 已提交
270 271 272 273
	while (!list_empty(&pool->page_list)) {
		struct dma_page *page;
		page = list_entry(pool->page_list.next,
				  struct dma_page, page_list);
274
		if (is_page_busy(page)) {
L
Linus Torvalds 已提交
275
			if (pool->dev)
M
Matthew Wilcox 已提交
276 277
				dev_err(pool->dev,
					"dma_pool_destroy %s, %p busy\n",
L
Linus Torvalds 已提交
278 279
					pool->name, page->vaddr);
			else
M
Matthew Wilcox 已提交
280 281 282
				printk(KERN_ERR
				       "dma_pool_destroy %s, %p busy\n",
				       pool->name, page->vaddr);
L
Linus Torvalds 已提交
283
			/* leak the still-in-use consistent memory */
M
Matthew Wilcox 已提交
284 285
			list_del(&page->page_list);
			kfree(page);
L
Linus Torvalds 已提交
286
		} else
M
Matthew Wilcox 已提交
287
			pool_free_page(pool, page);
L
Linus Torvalds 已提交
288 289
	}

M
Matthew Wilcox 已提交
290
	kfree(pool);
L
Linus Torvalds 已提交
291
}
M
Matthew Wilcox 已提交
292
EXPORT_SYMBOL(dma_pool_destroy);
L
Linus Torvalds 已提交
293 294 295 296 297 298 299 300 301

/**
 * dma_pool_alloc - get a block of consistent memory
 * @pool: dma pool that will produce the block
 * @mem_flags: GFP_* bitmask
 * @handle: pointer to dma address of block
 *
 * This returns the kernel virtual address of a currently unused block,
 * and reports its dma address through the handle.
302
 * If such a memory block can't be allocated, %NULL is returned.
L
Linus Torvalds 已提交
303
 */
M
Matthew Wilcox 已提交
304 305
void *dma_pool_alloc(struct dma_pool *pool, gfp_t mem_flags,
		     dma_addr_t *handle)
L
Linus Torvalds 已提交
306
{
M
Matthew Wilcox 已提交
307 308 309 310 311 312
	unsigned long flags;
	struct dma_page *page;
	size_t offset;
	void *retval;

	spin_lock_irqsave(&pool->lock, flags);
313
 restart:
L
Linus Torvalds 已提交
314
	list_for_each_entry(page, &pool->page_list, page_list) {
315 316
		if (page->offset < pool->allocation)
			goto ready;
L
Linus Torvalds 已提交
317
	}
M
Matthew Wilcox 已提交
318 319
	page = pool_alloc_page(pool, GFP_ATOMIC);
	if (!page) {
L
Linus Torvalds 已提交
320
		if (mem_flags & __GFP_WAIT) {
M
Matthew Wilcox 已提交
321
			DECLARE_WAITQUEUE(wait, current);
L
Linus Torvalds 已提交
322

323
			__set_current_state(TASK_INTERRUPTIBLE);
324
			__add_wait_queue(&pool->waitq, &wait);
M
Matthew Wilcox 已提交
325
			spin_unlock_irqrestore(&pool->lock, flags);
L
Linus Torvalds 已提交
326

M
Matthew Wilcox 已提交
327
			schedule_timeout(POOL_TIMEOUT_JIFFIES);
L
Linus Torvalds 已提交
328

329 330
			spin_lock_irqsave(&pool->lock, flags);
			__remove_wait_queue(&pool->waitq, &wait);
L
Linus Torvalds 已提交
331 332 333 334 335 336
			goto restart;
		}
		retval = NULL;
		goto done;
	}

M
Matthew Wilcox 已提交
337
 ready:
L
Linus Torvalds 已提交
338
	page->in_use++;
339 340
	offset = page->offset;
	page->offset = *(int *)(page->vaddr + offset);
L
Linus Torvalds 已提交
341 342
	retval = offset + page->vaddr;
	*handle = offset + page->dma;
343
#ifdef	DMAPOOL_DEBUG
M
Matthew Wilcox 已提交
344
	memset(retval, POOL_POISON_ALLOCATED, pool->size);
L
Linus Torvalds 已提交
345
#endif
M
Matthew Wilcox 已提交
346 347
 done:
	spin_unlock_irqrestore(&pool->lock, flags);
L
Linus Torvalds 已提交
348 349
	return retval;
}
M
Matthew Wilcox 已提交
350
EXPORT_SYMBOL(dma_pool_alloc);
L
Linus Torvalds 已提交
351

M
Matthew Wilcox 已提交
352
/*
 * Find the page of @pool whose dma range [page->dma, page->dma + allocation)
 * contains @dma.  Takes and releases pool->lock around the search; returns
 * the page, or NULL when the address belongs to none of them.
 */
static struct dma_page *pool_find_page(struct dma_pool *pool, dma_addr_t dma)
{
	unsigned long flags;
	struct dma_page *page;
	struct dma_page *found = NULL;

	spin_lock_irqsave(&pool->lock, flags);
	list_for_each_entry(page, &pool->page_list, page_list) {
		if (dma >= page->dma &&
		    dma < (page->dma + pool->allocation)) {
			found = page;
			break;
		}
	}
	spin_unlock_irqrestore(&pool->lock, flags);

	return found;
}

/**
 * dma_pool_free - put block back into dma pool
 * @pool: the dma pool holding the block
 * @vaddr: virtual address of block
 * @dma: dma address of block
 *
 * Caller promises neither device nor driver will again touch this block
 * unless it is first re-allocated.
 */
M
Matthew Wilcox 已提交
379
void dma_pool_free(struct dma_pool *pool, void *vaddr, dma_addr_t dma)
L
Linus Torvalds 已提交
380
{
M
Matthew Wilcox 已提交
381 382
	struct dma_page *page;
	unsigned long flags;
383
	unsigned int offset;
L
Linus Torvalds 已提交
384

M
Matthew Wilcox 已提交
385 386
	page = pool_find_page(pool, dma);
	if (!page) {
L
Linus Torvalds 已提交
387
		if (pool->dev)
M
Matthew Wilcox 已提交
388 389 390
			dev_err(pool->dev,
				"dma_pool_free %s, %p/%lx (bad dma)\n",
				pool->name, vaddr, (unsigned long)dma);
L
Linus Torvalds 已提交
391
		else
M
Matthew Wilcox 已提交
392 393
			printk(KERN_ERR "dma_pool_free %s, %p/%lx (bad dma)\n",
			       pool->name, vaddr, (unsigned long)dma);
L
Linus Torvalds 已提交
394 395 396
		return;
	}

397
	offset = vaddr - page->vaddr;
398
#ifdef	DMAPOOL_DEBUG
399
	if ((dma - page->dma) != offset) {
L
Linus Torvalds 已提交
400
		if (pool->dev)
M
Matthew Wilcox 已提交
401 402 403
			dev_err(pool->dev,
				"dma_pool_free %s, %p (bad vaddr)/%Lx\n",
				pool->name, vaddr, (unsigned long long)dma);
L
Linus Torvalds 已提交
404
		else
M
Matthew Wilcox 已提交
405 406 407
			printk(KERN_ERR
			       "dma_pool_free %s, %p (bad vaddr)/%Lx\n",
			       pool->name, vaddr, (unsigned long long)dma);
L
Linus Torvalds 已提交
408 409
		return;
	}
410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426
	{
		unsigned int chain = page->offset;
		while (chain < pool->allocation) {
			if (chain != offset) {
				chain = *(int *)(page->vaddr + chain);
				continue;
			}
			if (pool->dev)
				dev_err(pool->dev, "dma_pool_free %s, dma %Lx "
					"already free\n", pool->name,
					(unsigned long long)dma);
			else
				printk(KERN_ERR "dma_pool_free %s, dma %Lx "
					"already free\n", pool->name,
					(unsigned long long)dma);
			return;
		}
L
Linus Torvalds 已提交
427
	}
M
Matthew Wilcox 已提交
428
	memset(vaddr, POOL_POISON_FREED, pool->size);
L
Linus Torvalds 已提交
429 430
#endif

M
Matthew Wilcox 已提交
431
	spin_lock_irqsave(&pool->lock, flags);
L
Linus Torvalds 已提交
432
	page->in_use--;
433 434
	*(int *)vaddr = page->offset;
	page->offset = offset;
M
Matthew Wilcox 已提交
435
	if (waitqueue_active(&pool->waitq))
436
		wake_up_locked(&pool->waitq);
L
Linus Torvalds 已提交
437 438
	/*
	 * Resist a temptation to do
439
	 *    if (!is_page_busy(page)) pool_free_page(pool, page);
L
Linus Torvalds 已提交
440 441
	 * Better have a few empty pages hang around.
	 */
M
Matthew Wilcox 已提交
442
	spin_unlock_irqrestore(&pool->lock, flags);
L
Linus Torvalds 已提交
443
}
M
Matthew Wilcox 已提交
444
EXPORT_SYMBOL(dma_pool_free);
L
Linus Torvalds 已提交
445

T
Tejun Heo 已提交
446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488
/*
 * Managed DMA pool
 */
/*
 * devres release callback: @res is the slot filled in by dmam_pool_create()
 * and holds the pool pointer, which is destroyed here.
 */
static void dmam_pool_release(struct device *dev, void *res)
{
	struct dma_pool **slot = res;

	dma_pool_destroy(*slot);
}

/*
 * devres match callback: nonzero when the pool pointer stored in @res is
 * the pool passed as @match_data.
 */
static int dmam_pool_match(struct device *dev, void *res, void *match_data)
{
	struct dma_pool **slot = res;

	return *slot == match_data;
}

/**
 * dmam_pool_create - Managed dma_pool_create()
 * @name: name of pool, for diagnostics
 * @dev: device that will be doing the DMA
 * @size: size of the blocks in this pool.
 * @align: alignment requirement for blocks; must be a power of two
 * @allocation: returned blocks won't cross this boundary (or zero); passed
 *	to dma_pool_create() as its boundary argument
 *
 * Managed dma_pool_create().  DMA pool created with this function is
 * automatically destroyed on driver detach.
 *
 * Returns the new pool, or NULL if either the devres record or the pool
 * itself could not be allocated.
 */
struct dma_pool *dmam_pool_create(const char *name, struct device *dev,
				  size_t size, size_t align, size_t allocation)
{
	struct dma_pool **ptr, *pool;

	ptr = devres_alloc(dmam_pool_release, sizeof(*ptr), GFP_KERNEL);
	if (!ptr)
		return NULL;

	pool = dma_pool_create(name, dev, size, align, allocation);
	*ptr = pool;
	if (!pool) {
		/* Nothing to manage; drop the unused devres record. */
		devres_free(ptr);
		return NULL;
	}

	devres_add(dev, ptr);
	return pool;
}
EXPORT_SYMBOL(dmam_pool_create);
T
Tejun Heo 已提交
490 491 492 493 494 495 496 497 498 499 500 501 502 503

/**
 * dmam_pool_destroy - Managed dma_pool_destroy()
 * @pool: dma pool that will be destroyed
 *
 * Managed dma_pool_destroy().  Destroys the pool and then drops the devres
 * record that dmam_pool_create() registered for it, warning if no such
 * record is found.
 */
void dmam_pool_destroy(struct dma_pool *pool)
{
	/* Fetch the device first: @pool is freed by dma_pool_destroy(). */
	struct device *dev = pool->dev;

	dma_pool_destroy(pool);
	/*
	 * NOTE(review): this ordering relies on devres_destroy() not calling
	 * dmam_pool_release() itself (which would destroy the pool a second
	 * time) - confirm against this tree's devres implementation.
	 */
	WARN_ON(devres_destroy(dev, dmam_pool_release, dmam_pool_match, pool));
}
EXPORT_SYMBOL(dmam_pool_destroy);