radeon_ttm.c 28.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
/*
 * Copyright 2009 Jerome Glisse.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 */
/*
 * Authors:
 *    Jerome Glisse <glisse@freedesktop.org>
 *    Thomas Hellstrom <thomas-at-tungstengraphics-dot-com>
 *    Dave Airlie
 */
32 33 34 35 36 37 38 39 40 41 42 43 44 45 46

#include <linux/dma-mapping.h>
#include <linux/pagemap.h>
#include <linux/seq_file.h>
#include <linux/slab.h>
#include <linux/swap.h>
#include <linux/swiotlb.h>

#include <drm/drm_agpsupport.h>
#include <drm/drm_debugfs.h>
#include <drm/drm_device.h>
#include <drm/drm_file.h>
#include <drm/drm_pci.h>
#include <drm/drm_prime.h>
#include <drm/radeon_drm.h>
47 48 49 50
#include <drm/ttm/ttm_bo_api.h>
#include <drm/ttm/ttm_bo_driver.h>
#include <drm/ttm/ttm_module.h>
#include <drm/ttm/ttm_page_alloc.h>
51 52
#include <drm/ttm/ttm_placement.h>

53 54 55
#include "radeon_reg.h"
#include "radeon.h"

56
static int radeon_ttm_debugfs_init(struct radeon_device *rdev);
57
static void radeon_ttm_debugfs_fini(struct radeon_device *rdev);
58

59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88
static struct radeon_device *radeon_get_rdev(struct ttm_bo_device *bdev)
{
	struct radeon_mman *mman;
	struct radeon_device *rdev;

	mman = container_of(bdev, struct radeon_mman, bdev);
	rdev = container_of(mman, struct radeon_device, mman);
	return rdev;
}

static int radeon_invalidate_caches(struct ttm_bo_device *bdev, uint32_t flags)
{
	return 0;
}

static int radeon_init_mem_type(struct ttm_bo_device *bdev, uint32_t type,
				struct ttm_mem_type_manager *man)
{
	struct radeon_device *rdev;

	rdev = radeon_get_rdev(bdev);

	switch (type) {
	case TTM_PL_SYSTEM:
		/* System memory */
		man->flags = TTM_MEMTYPE_FLAG_MAPPABLE;
		man->available_caching = TTM_PL_MASK_CACHING;
		man->default_caching = TTM_PL_FLAG_CACHED;
		break;
	case TTM_PL_TT:
89
		man->func = &ttm_bo_manager_func;
90
		man->gpu_offset = rdev->mc.gtt_start;
91 92
		man->available_caching = TTM_PL_MASK_CACHING;
		man->default_caching = TTM_PL_FLAG_CACHED;
93
		man->flags = TTM_MEMTYPE_FLAG_MAPPABLE | TTM_MEMTYPE_FLAG_CMA;
D
Daniel Vetter 已提交
94
#if IS_ENABLED(CONFIG_AGP)
95
		if (rdev->flags & RADEON_IS_AGP) {
D
Daniel Vetter 已提交
96
			if (!rdev->ddev->agp) {
97 98 99 100
				DRM_ERROR("AGP is not enabled for memory type %u\n",
					  (unsigned)type);
				return -EINVAL;
			}
101
			if (!rdev->ddev->agp->cant_use_aperture)
102
				man->flags = TTM_MEMTYPE_FLAG_MAPPABLE;
103 104 105 106
			man->available_caching = TTM_PL_FLAG_UNCACHED |
						 TTM_PL_FLAG_WC;
			man->default_caching = TTM_PL_FLAG_WC;
		}
107
#endif
108 109 110
		break;
	case TTM_PL_VRAM:
		/* "On-card" video ram */
111
		man->func = &ttm_bo_manager_func;
112
		man->gpu_offset = rdev->mc.vram_start;
113 114 115 116 117 118 119 120 121 122 123 124
		man->flags = TTM_MEMTYPE_FLAG_FIXED |
			     TTM_MEMTYPE_FLAG_MAPPABLE;
		man->available_caching = TTM_PL_FLAG_UNCACHED | TTM_PL_FLAG_WC;
		man->default_caching = TTM_PL_FLAG_WC;
		break;
	default:
		DRM_ERROR("Unsupported memory type %u\n", (unsigned)type);
		return -EINVAL;
	}
	return 0;
}

125 126
static void radeon_evict_flags(struct ttm_buffer_object *bo,
				struct ttm_placement *placement)
127
{
128
	static const struct ttm_place placements = {
129 130 131 132 133
		.fpfn = 0,
		.lpfn = 0,
		.flags = TTM_PL_MASK_CACHING | TTM_PL_FLAG_SYSTEM
	};

134 135 136 137 138 139 140 141 142 143
	struct radeon_bo *rbo;

	if (!radeon_ttm_bo_is_radeon_bo(bo)) {
		placement->placement = &placements;
		placement->busy_placement = &placements;
		placement->num_placement = 1;
		placement->num_busy_placement = 1;
		return;
	}
	rbo = container_of(bo, struct radeon_bo, tbo);
144
	switch (bo->mem.mem_type) {
145
	case TTM_PL_VRAM:
146
		if (rbo->rdev->ring[radeon_copy_ring_index(rbo->rdev)].ready == false)
147
			radeon_ttm_placement_from_domain(rbo, RADEON_GEM_DOMAIN_CPU);
148 149 150 151 152 153 154 155 156 157 158 159 160 161 162
		else if (rbo->rdev->mc.visible_vram_size < rbo->rdev->mc.real_vram_size &&
			 bo->mem.start < (rbo->rdev->mc.visible_vram_size >> PAGE_SHIFT)) {
			unsigned fpfn = rbo->rdev->mc.visible_vram_size >> PAGE_SHIFT;
			int i;

			/* Try evicting to the CPU inaccessible part of VRAM
			 * first, but only set GTT as busy placement, so this
			 * BO will be evicted to GTT rather than causing other
			 * BOs to be evicted from VRAM
			 */
			radeon_ttm_placement_from_domain(rbo, RADEON_GEM_DOMAIN_VRAM |
							 RADEON_GEM_DOMAIN_GTT);
			rbo->placement.num_busy_placement = 0;
			for (i = 0; i < rbo->placement.num_placement; i++) {
				if (rbo->placements[i].flags & TTM_PL_FLAG_VRAM) {
163 164
					if (rbo->placements[i].fpfn < fpfn)
						rbo->placements[i].fpfn = fpfn;
165 166 167 168 169 170 171
				} else {
					rbo->placement.busy_placement =
						&rbo->placements[i];
					rbo->placement.num_busy_placement = 1;
				}
			}
		} else
172
			radeon_ttm_placement_from_domain(rbo, RADEON_GEM_DOMAIN_GTT);
173 174
		break;
	case TTM_PL_TT:
175
	default:
176
		radeon_ttm_placement_from_domain(rbo, RADEON_GEM_DOMAIN_CPU);
177
	}
178
	*placement = rbo->placement;
179 180 181 182
}

static int radeon_verify_access(struct ttm_buffer_object *bo, struct file *filp)
{
183 184
	struct radeon_bo *rbo = container_of(bo, struct radeon_bo, tbo);

185 186
	if (radeon_ttm_tt_has_userptr(bo->ttm))
		return -EPERM;
187
	return drm_vma_node_verify_access(&rbo->tbo.base.vma_node,
D
David Herrmann 已提交
188
					  filp->private_data);
189 190 191 192 193 194 195 196 197 198 199 200 201
}

static void radeon_move_null(struct ttm_buffer_object *bo,
			     struct ttm_mem_reg *new_mem)
{
	struct ttm_mem_reg *old_mem = &bo->mem;

	BUG_ON(old_mem->mm_node != NULL);
	*old_mem = *new_mem;
	new_mem->mm_node = NULL;
}

static int radeon_move_blit(struct ttm_buffer_object *bo,
202
			bool evict, bool no_wait_gpu,
203 204
			struct ttm_mem_reg *new_mem,
			struct ttm_mem_reg *old_mem)
205 206 207
{
	struct radeon_device *rdev;
	uint64_t old_start, new_start;
208
	struct radeon_fence *fence;
209
	unsigned num_pages;
210
	int r, ridx;
211 212

	rdev = radeon_get_rdev(bo->bdev);
213
	ridx = radeon_copy_ring_index(rdev);
214 215
	old_start = (u64)old_mem->start << PAGE_SHIFT;
	new_start = (u64)new_mem->start << PAGE_SHIFT;
216 217 218

	switch (old_mem->mem_type) {
	case TTM_PL_VRAM:
219
		old_start += rdev->mc.vram_start;
220 221
		break;
	case TTM_PL_TT:
222
		old_start += rdev->mc.gtt_start;
223 224 225 226 227 228 229
		break;
	default:
		DRM_ERROR("Unknown placement %d\n", old_mem->mem_type);
		return -EINVAL;
	}
	switch (new_mem->mem_type) {
	case TTM_PL_VRAM:
230
		new_start += rdev->mc.vram_start;
231 232
		break;
	case TTM_PL_TT:
233
		new_start += rdev->mc.gtt_start;
234 235 236 237 238
		break;
	default:
		DRM_ERROR("Unknown placement %d\n", old_mem->mem_type);
		return -EINVAL;
	}
239
	if (!rdev->ring[ridx].ready) {
240
		DRM_ERROR("Trying to move memory with ring turned off.\n");
241 242
		return -EINVAL;
	}
243 244 245

	BUILD_BUG_ON((PAGE_SIZE % RADEON_GPU_PAGE_SIZE) != 0);

246
	num_pages = new_mem->num_pages * (PAGE_SIZE / RADEON_GPU_PAGE_SIZE);
247
	fence = radeon_copy(rdev, old_start, new_start, num_pages, bo->base.resv);
248 249 250
	if (IS_ERR(fence))
		return PTR_ERR(fence);

251
	r = ttm_bo_move_accel_cleanup(bo, &fence->base, evict, new_mem);
252 253 254 255 256
	radeon_fence_unref(&fence);
	return r;
}

static int radeon_move_vram_ram(struct ttm_buffer_object *bo,
257
				bool evict, bool interruptible,
258
				bool no_wait_gpu,
259 260
				struct ttm_mem_reg *new_mem)
{
261
	struct ttm_operation_ctx ctx = { interruptible, no_wait_gpu };
262 263
	struct ttm_mem_reg *old_mem = &bo->mem;
	struct ttm_mem_reg tmp_mem;
264
	struct ttm_place placements;
265
	struct ttm_placement placement;
266 267 268 269
	int r;

	tmp_mem = *new_mem;
	tmp_mem.mm_node = NULL;
270 271 272 273
	placement.num_placement = 1;
	placement.placement = &placements;
	placement.num_busy_placement = 1;
	placement.busy_placement = &placements;
274 275 276
	placements.fpfn = 0;
	placements.lpfn = 0;
	placements.flags = TTM_PL_MASK_CACHING | TTM_PL_FLAG_TT;
277
	r = ttm_bo_mem_space(bo, &placement, &tmp_mem, &ctx);
278 279 280
	if (unlikely(r)) {
		return r;
	}
281 282 283 284 285 286

	r = ttm_tt_set_placement_caching(bo->ttm, tmp_mem.placement);
	if (unlikely(r)) {
		goto out_cleanup;
	}

287
	r = ttm_tt_bind(bo->ttm, &tmp_mem, &ctx);
288 289 290
	if (unlikely(r)) {
		goto out_cleanup;
	}
291
	r = radeon_move_blit(bo, true, no_wait_gpu, &tmp_mem, old_mem);
292 293 294
	if (unlikely(r)) {
		goto out_cleanup;
	}
295
	r = ttm_bo_move_ttm(bo, &ctx, new_mem);
296
out_cleanup:
297
	ttm_bo_mem_put(bo, &tmp_mem);
298 299 300 301
	return r;
}

static int radeon_move_ram_vram(struct ttm_buffer_object *bo,
302
				bool evict, bool interruptible,
303
				bool no_wait_gpu,
304 305
				struct ttm_mem_reg *new_mem)
{
306
	struct ttm_operation_ctx ctx = { interruptible, no_wait_gpu };
307 308
	struct ttm_mem_reg *old_mem = &bo->mem;
	struct ttm_mem_reg tmp_mem;
309
	struct ttm_placement placement;
310
	struct ttm_place placements;
311 312 313 314
	int r;

	tmp_mem = *new_mem;
	tmp_mem.mm_node = NULL;
315 316 317 318
	placement.num_placement = 1;
	placement.placement = &placements;
	placement.num_busy_placement = 1;
	placement.busy_placement = &placements;
319 320 321
	placements.fpfn = 0;
	placements.lpfn = 0;
	placements.flags = TTM_PL_MASK_CACHING | TTM_PL_FLAG_TT;
322
	r = ttm_bo_mem_space(bo, &placement, &tmp_mem, &ctx);
323 324 325
	if (unlikely(r)) {
		return r;
	}
326
	r = ttm_bo_move_ttm(bo, &ctx, &tmp_mem);
327 328 329
	if (unlikely(r)) {
		goto out_cleanup;
	}
330
	r = radeon_move_blit(bo, true, no_wait_gpu, new_mem, old_mem);
331 332 333 334
	if (unlikely(r)) {
		goto out_cleanup;
	}
out_cleanup:
335
	ttm_bo_mem_put(bo, &tmp_mem);
336 337 338
	return r;
}

339 340 341
static int radeon_bo_move(struct ttm_buffer_object *bo, bool evict,
			  struct ttm_operation_ctx *ctx,
			  struct ttm_mem_reg *new_mem)
342 343
{
	struct radeon_device *rdev;
344
	struct radeon_bo *rbo;
345 346 347
	struct ttm_mem_reg *old_mem = &bo->mem;
	int r;

348
	r = ttm_bo_wait(bo, ctx->interruptible, ctx->no_wait_gpu);
349 350 351
	if (r)
		return r;

352 353 354 355 356
	/* Can't move a pinned BO */
	rbo = container_of(bo, struct radeon_bo, tbo);
	if (WARN_ON_ONCE(rbo->pin_count > 0))
		return -EINVAL;

357 358 359 360 361 362 363 364 365
	rdev = radeon_get_rdev(bo->bdev);
	if (old_mem->mem_type == TTM_PL_SYSTEM && bo->ttm == NULL) {
		radeon_move_null(bo, new_mem);
		return 0;
	}
	if ((old_mem->mem_type == TTM_PL_TT &&
	     new_mem->mem_type == TTM_PL_SYSTEM) ||
	    (old_mem->mem_type == TTM_PL_SYSTEM &&
	     new_mem->mem_type == TTM_PL_TT)) {
366
		/* bind is enough */
367 368 369
		radeon_move_null(bo, new_mem);
		return 0;
	}
370 371
	if (!rdev->ring[radeon_copy_ring_index(rdev)].ready ||
	    rdev->asic->copy.copy == NULL) {
372
		/* use memcpy */
373
		goto memcpy;
374 375 376 377
	}

	if (old_mem->mem_type == TTM_PL_VRAM &&
	    new_mem->mem_type == TTM_PL_SYSTEM) {
378 379
		r = radeon_move_vram_ram(bo, evict, ctx->interruptible,
					ctx->no_wait_gpu, new_mem);
380 381
	} else if (old_mem->mem_type == TTM_PL_SYSTEM &&
		   new_mem->mem_type == TTM_PL_VRAM) {
382 383
		r = radeon_move_ram_vram(bo, evict, ctx->interruptible,
					    ctx->no_wait_gpu, new_mem);
384
	} else {
385 386
		r = radeon_move_blit(bo, evict, ctx->no_wait_gpu,
				     new_mem, old_mem);
387
	}
388 389 390

	if (r) {
memcpy:
391
		r = ttm_bo_move_memcpy(bo, ctx, new_mem);
392 393 394
		if (r) {
			return r;
		}
395
	}
396 397 398 399

	/* update statistics */
	atomic64_add((u64)bo->num_pages << PAGE_SHIFT, &rdev->num_bytes_moved);
	return 0;
400 401
}

402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418
static int radeon_ttm_io_mem_reserve(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
{
	struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
	struct radeon_device *rdev = radeon_get_rdev(bdev);

	mem->bus.addr = NULL;
	mem->bus.offset = 0;
	mem->bus.size = mem->num_pages << PAGE_SHIFT;
	mem->bus.base = 0;
	mem->bus.is_iomem = false;
	if (!(man->flags & TTM_MEMTYPE_FLAG_MAPPABLE))
		return -EINVAL;
	switch (mem->mem_type) {
	case TTM_PL_SYSTEM:
		/* system memory */
		return 0;
	case TTM_PL_TT:
D
Daniel Vetter 已提交
419
#if IS_ENABLED(CONFIG_AGP)
420 421
		if (rdev->flags & RADEON_IS_AGP) {
			/* RADEON_IS_AGP is set only if AGP is active */
422
			mem->bus.offset = mem->start << PAGE_SHIFT;
423
			mem->bus.base = rdev->mc.agp_base;
424
			mem->bus.is_iomem = !rdev->ddev->agp->cant_use_aperture;
425 426 427 428
		}
#endif
		break;
	case TTM_PL_VRAM:
429
		mem->bus.offset = mem->start << PAGE_SHIFT;
430 431 432 433 434
		/* check if it's visible */
		if ((mem->bus.offset + mem->bus.size) > rdev->mc.visible_vram_size)
			return -EINVAL;
		mem->bus.base = rdev->mc.aper_base;
		mem->bus.is_iomem = true;
435 436 437 438 439 440 441 442 443 444 445 446 447
#ifdef __alpha__
		/*
		 * Alpha: use bus.addr to hold the ioremap() return,
		 * so we can modify bus.base below.
		 */
		if (mem->placement & TTM_PL_FLAG_WC)
			mem->bus.addr =
				ioremap_wc(mem->bus.base + mem->bus.offset,
					   mem->bus.size);
		else
			mem->bus.addr =
				ioremap_nocache(mem->bus.base + mem->bus.offset,
						mem->bus.size);
448 449
		if (!mem->bus.addr)
			return -ENOMEM;
450 451 452 453 454 455 456 457 458 459

		/*
		 * Alpha: Use just the bus offset plus
		 * the hose/domain memory base for bus.base.
		 * It then can be used to build PTEs for VRAM
		 * access, as done in ttm_bo_vm_fault().
		 */
		mem->bus.base = (mem->bus.base & 0x0ffffffffUL) +
			rdev->ddev->hose->dense_mem_base;
#endif
460 461 462 463 464 465 466 467 468 469 470
		break;
	default:
		return -EINVAL;
	}
	return 0;
}

static void radeon_ttm_io_mem_free(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
{
}

471 472 473 474
/*
 * TTM backend functions.
 */
struct radeon_ttm_tt {
475
	struct ttm_dma_tt		ttm;
476 477
	struct radeon_device		*rdev;
	u64				offset;
478 479 480 481

	uint64_t			userptr;
	struct mm_struct		*usermm;
	uint32_t			userflags;
482 483
};

484 485 486 487 488 489 490 491 492 493 494 495 496 497 498
/* prepare the sg table with the user pages */
static int radeon_ttm_tt_pin_userptr(struct ttm_tt *ttm)
{
	struct radeon_device *rdev = radeon_get_rdev(ttm->bdev);
	struct radeon_ttm_tt *gtt = (void *)ttm;
	unsigned pinned = 0, nents;
	int r;

	int write = !(gtt->userflags & RADEON_GEM_USERPTR_READONLY);
	enum dma_data_direction direction = write ?
		DMA_BIDIRECTIONAL : DMA_TO_DEVICE;

	if (current->mm != gtt->usermm)
		return -EPERM;

499 500 501 502 503 504 505 506 507 508
	if (gtt->userflags & RADEON_GEM_USERPTR_ANONONLY) {
		/* check that we only pin down anonymous memory
		   to prevent problems with writeback */
		unsigned long end = gtt->userptr + ttm->num_pages * PAGE_SIZE;
		struct vm_area_struct *vma;
		vma = find_vma(gtt->usermm, gtt->userptr);
		if (!vma || vma->vm_file || vma->vm_end < end)
			return -EPERM;
	}

509 510 511 512 513
	do {
		unsigned num_pages = ttm->num_pages - pinned;
		uint64_t userptr = gtt->userptr + pinned * PAGE_SIZE;
		struct page **pages = ttm->pages + pinned;

514 515
		r = get_user_pages(userptr, num_pages, write ? FOLL_WRITE : 0,
				   pages, NULL);
516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542
		if (r < 0)
			goto release_pages;

		pinned += r;

	} while (pinned < ttm->num_pages);

	r = sg_alloc_table_from_pages(ttm->sg, ttm->pages, ttm->num_pages, 0,
				      ttm->num_pages << PAGE_SHIFT,
				      GFP_KERNEL);
	if (r)
		goto release_sg;

	r = -ENOMEM;
	nents = dma_map_sg(rdev->dev, ttm->sg->sgl, ttm->sg->nents, direction);
	if (nents != ttm->sg->nents)
		goto release_sg;

	drm_prime_sg_to_page_addr_arrays(ttm->sg, ttm->pages,
					 gtt->ttm.dma_address, ttm->num_pages);

	return 0;

release_sg:
	kfree(ttm->sg);

release_pages:
543
	release_pages(ttm->pages, pinned);
544 545 546 547 548 549 550
	return r;
}

static void radeon_ttm_tt_unpin_userptr(struct ttm_tt *ttm)
{
	struct radeon_device *rdev = radeon_get_rdev(ttm->bdev);
	struct radeon_ttm_tt *gtt = (void *)ttm;
551
	struct sg_page_iter sg_iter;
552 553 554 555 556

	int write = !(gtt->userflags & RADEON_GEM_USERPTR_READONLY);
	enum dma_data_direction direction = write ?
		DMA_BIDIRECTIONAL : DMA_TO_DEVICE;

557 558 559 560
	/* double check that we don't free the table twice */
	if (!ttm->sg->sgl)
		return;

561 562 563
	/* free the sg table and pages again */
	dma_unmap_sg(rdev->dev, ttm->sg->sgl, ttm->sg->nents, direction);

564 565
	for_each_sg_page(ttm->sg->sgl, &sg_iter, ttm->sg->nents, 0) {
		struct page *page = sg_page_iter_page(&sg_iter);
566 567 568 569
		if (!(gtt->userflags & RADEON_GEM_USERPTR_READONLY))
			set_page_dirty(page);

		mark_page_accessed(page);
570
		put_page(page);
571 572 573 574 575
	}

	sg_free_table(ttm->sg);
}

576 577 578
static int radeon_ttm_backend_bind(struct ttm_tt *ttm,
				   struct ttm_mem_reg *bo_mem)
{
579
	struct radeon_ttm_tt *gtt = (void*)ttm;
580 581
	uint32_t flags = RADEON_GART_PAGE_VALID | RADEON_GART_PAGE_READ |
		RADEON_GART_PAGE_WRITE;
582 583
	int r;

584 585 586 587 588
	if (gtt->userptr) {
		radeon_ttm_tt_pin_userptr(ttm);
		flags &= ~RADEON_GART_PAGE_WRITE;
	}

589 590 591 592 593
	gtt->offset = (unsigned long)(bo_mem->start << PAGE_SHIFT);
	if (!ttm->num_pages) {
		WARN(1, "nothing to bind %lu pages for mreg %p back %p!\n",
		     ttm->num_pages, bo_mem, ttm);
	}
594 595 596 597
	if (ttm->caching_state == tt_cached)
		flags |= RADEON_GART_PAGE_SNOOP;
	r = radeon_gart_bind(gtt->rdev, gtt->offset, ttm->num_pages,
			     ttm->pages, gtt->ttm.dma_address, flags);
598 599 600 601 602 603 604 605 606 607
	if (r) {
		DRM_ERROR("failed to bind %lu pages at 0x%08X\n",
			  ttm->num_pages, (unsigned)gtt->offset);
		return r;
	}
	return 0;
}

static int radeon_ttm_backend_unbind(struct ttm_tt *ttm)
{
608
	struct radeon_ttm_tt *gtt = (void *)ttm;
609 610

	radeon_gart_unbind(gtt->rdev, gtt->offset, ttm->num_pages);
611 612 613 614

	if (gtt->userptr)
		radeon_ttm_tt_unpin_userptr(ttm);

615 616 617 618 619
	return 0;
}

static void radeon_ttm_backend_destroy(struct ttm_tt *ttm)
{
620
	struct radeon_ttm_tt *gtt = (void *)ttm;
621

622
	ttm_dma_tt_fini(&gtt->ttm);
623 624 625 626 627 628 629 630 631
	kfree(gtt);
}

static struct ttm_backend_func radeon_backend_func = {
	.bind = &radeon_ttm_backend_bind,
	.unbind = &radeon_ttm_backend_unbind,
	.destroy = &radeon_ttm_backend_destroy,
};

632 633
static struct ttm_tt *radeon_ttm_tt_create(struct ttm_buffer_object *bo,
					   uint32_t page_flags)
634 635 636 637
{
	struct radeon_device *rdev;
	struct radeon_ttm_tt *gtt;

638
	rdev = radeon_get_rdev(bo->bdev);
D
Daniel Vetter 已提交
639
#if IS_ENABLED(CONFIG_AGP)
640
	if (rdev->flags & RADEON_IS_AGP) {
641 642
		return ttm_agp_tt_create(bo, rdev->ddev->agp->bridge,
					 page_flags);
643 644 645 646 647 648 649
	}
#endif

	gtt = kzalloc(sizeof(struct radeon_ttm_tt), GFP_KERNEL);
	if (gtt == NULL) {
		return NULL;
	}
650
	gtt->ttm.ttm.func = &radeon_backend_func;
651
	gtt->rdev = rdev;
652
	if (ttm_dma_tt_init(&gtt->ttm, bo, page_flags)) {
653
		kfree(gtt);
654 655
		return NULL;
	}
656
	return &gtt->ttm.ttm;
657 658
}

659 660 661 662 663 664 665
static struct radeon_ttm_tt *radeon_ttm_tt_to_gtt(struct ttm_tt *ttm)
{
	if (!ttm || ttm->func != &radeon_backend_func)
		return NULL;
	return (struct radeon_ttm_tt *)ttm;
}

666 667
static int radeon_ttm_tt_populate(struct ttm_tt *ttm,
			struct ttm_operation_ctx *ctx)
668
{
669
	struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(ttm);
670
	struct radeon_device *rdev;
671
	bool slave = !!(ttm->page_flags & TTM_PAGE_FLAG_SG);
672

673
	if (gtt && gtt->userptr) {
674
		ttm->sg = kzalloc(sizeof(struct sg_table), GFP_KERNEL);
675 676 677 678 679 680 681 682
		if (!ttm->sg)
			return -ENOMEM;

		ttm->page_flags |= TTM_PAGE_FLAG_SG;
		ttm->state = tt_unbound;
		return 0;
	}

683 684 685 686 687 688 689
	if (slave && ttm->sg) {
		drm_prime_sg_to_page_addr_arrays(ttm->sg, ttm->pages,
						 gtt->ttm.dma_address, ttm->num_pages);
		ttm->state = tt_unbound;
		return 0;
	}

690
	rdev = radeon_get_rdev(ttm->bdev);
D
Daniel Vetter 已提交
691
#if IS_ENABLED(CONFIG_AGP)
J
Jerome Glisse 已提交
692
	if (rdev->flags & RADEON_IS_AGP) {
693
		return ttm_agp_tt_populate(ttm, ctx);
J
Jerome Glisse 已提交
694 695
	}
#endif
696 697

#ifdef CONFIG_SWIOTLB
698
	if (rdev->need_swiotlb && swiotlb_nr_tbl()) {
699
		return ttm_dma_populate(&gtt->ttm, rdev->dev, ctx);
700 701 702
	}
#endif

703
	return ttm_populate_and_map_pages(rdev->dev, &gtt->ttm, ctx);
704 705 706 707 708
}

static void radeon_ttm_tt_unpopulate(struct ttm_tt *ttm)
{
	struct radeon_device *rdev;
709
	struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(ttm);
710 711
	bool slave = !!(ttm->page_flags & TTM_PAGE_FLAG_SG);

712
	if (gtt && gtt->userptr) {
713 714 715 716 717
		kfree(ttm->sg);
		ttm->page_flags &= ~TTM_PAGE_FLAG_SG;
		return;
	}

718 719
	if (slave)
		return;
720 721

	rdev = radeon_get_rdev(ttm->bdev);
D
Daniel Vetter 已提交
722
#if IS_ENABLED(CONFIG_AGP)
J
Jerome Glisse 已提交
723 724 725 726 727
	if (rdev->flags & RADEON_IS_AGP) {
		ttm_agp_tt_unpopulate(ttm);
		return;
	}
#endif
728 729

#ifdef CONFIG_SWIOTLB
730
	if (rdev->need_swiotlb && swiotlb_nr_tbl()) {
731
		ttm_dma_unpopulate(&gtt->ttm, rdev->dev);
732 733 734 735
		return;
	}
#endif

736
	ttm_unmap_and_unpopulate_pages(rdev->dev, &gtt->ttm);
737
}
738

739 740 741
int radeon_ttm_tt_set_userptr(struct ttm_tt *ttm, uint64_t addr,
			      uint32_t flags)
{
742
	struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(ttm);
743 744 745 746 747 748 749 750 751 752 753 754

	if (gtt == NULL)
		return -EINVAL;

	gtt->userptr = addr;
	gtt->usermm = current->mm;
	gtt->userflags = flags;
	return 0;
}

bool radeon_ttm_tt_has_userptr(struct ttm_tt *ttm)
{
755
	struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(ttm);
756 757 758 759 760 761 762 763 764

	if (gtt == NULL)
		return false;

	return !!gtt->userptr;
}

bool radeon_ttm_tt_is_readonly(struct ttm_tt *ttm)
{
765
	struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(ttm);
766 767 768 769 770 771 772

	if (gtt == NULL)
		return false;

	return !!(gtt->userflags & RADEON_GEM_USERPTR_READONLY);
}

773
static struct ttm_bo_driver radeon_bo_driver = {
774
	.ttm_tt_create = &radeon_ttm_tt_create,
775 776
	.ttm_tt_populate = &radeon_ttm_tt_populate,
	.ttm_tt_unpopulate = &radeon_ttm_tt_unpopulate,
777 778
	.invalidate_caches = &radeon_invalidate_caches,
	.init_mem_type = &radeon_init_mem_type,
779
	.eviction_valuable = ttm_bo_eviction_valuable,
780 781 782
	.evict_flags = &radeon_evict_flags,
	.move = &radeon_bo_move,
	.verify_access = &radeon_verify_access,
783 784
	.move_notify = &radeon_bo_move_notify,
	.fault_reserve_notify = &radeon_bo_fault_reserve_notify,
785 786
	.io_mem_reserve = &radeon_ttm_io_mem_reserve,
	.io_mem_free = &radeon_ttm_io_mem_free,
787 788 789 790 791 792 793 794
};

int radeon_ttm_init(struct radeon_device *rdev)
{
	int r;

	/* No others user of address space so set it to 0 */
	r = ttm_bo_device_init(&rdev->mman.bdev,
795 796
			       &radeon_bo_driver,
			       rdev->ddev->anon_inode->i_mapping,
797
			       rdev->ddev->vma_offset_manager,
798
			       dma_addressing_limited(&rdev->pdev->dev));
799 800 801 802
	if (r) {
		DRM_ERROR("failed initializing buffer object driver(%d).\n", r);
		return r;
	}
803
	rdev->mman.initialized = true;
804
	r = ttm_bo_init_mm(&rdev->mman.bdev, TTM_PL_VRAM,
805
				rdev->mc.real_vram_size >> PAGE_SHIFT);
806 807 808 809
	if (r) {
		DRM_ERROR("Failed initializing VRAM heap.\n");
		return r;
	}
810 811 812
	/* Change the size here instead of the init above so only lpfn is affected */
	radeon_ttm_set_active_vram_size(rdev, rdev->mc.visible_vram_size);

813
	r = radeon_bo_create(rdev, 256 * 1024, PAGE_SIZE, true,
814
			     RADEON_GEM_DOMAIN_VRAM, 0, NULL,
K
Kent Russell 已提交
815
			     NULL, &rdev->stolen_vga_memory);
816 817 818
	if (r) {
		return r;
	}
K
Kent Russell 已提交
819
	r = radeon_bo_reserve(rdev->stolen_vga_memory, false);
820 821
	if (r)
		return r;
K
Kent Russell 已提交
822 823
	r = radeon_bo_pin(rdev->stolen_vga_memory, RADEON_GEM_DOMAIN_VRAM, NULL);
	radeon_bo_unreserve(rdev->stolen_vga_memory);
824
	if (r) {
K
Kent Russell 已提交
825
		radeon_bo_unref(&rdev->stolen_vga_memory);
826 827 828
		return r;
	}
	DRM_INFO("radeon: %uM of VRAM memory ready\n",
829
		 (unsigned) (rdev->mc.real_vram_size / (1024 * 1024)));
830
	r = ttm_bo_init_mm(&rdev->mman.bdev, TTM_PL_TT,
831
				rdev->mc.gtt_size >> PAGE_SHIFT);
832 833 834 835 836
	if (r) {
		DRM_ERROR("Failed initializing GTT heap.\n");
		return r;
	}
	DRM_INFO("radeon: %uM of GTT memory ready.\n",
837
		 (unsigned)(rdev->mc.gtt_size / (1024 * 1024)));
838 839 840 841 842 843

	r = radeon_ttm_debugfs_init(rdev);
	if (r) {
		DRM_ERROR("Failed to init debugfs\n");
		return r;
	}
844 845 846 847 848
	return 0;
}

void radeon_ttm_fini(struct radeon_device *rdev)
{
849 850
	int r;

851 852
	if (!rdev->mman.initialized)
		return;
853
	radeon_ttm_debugfs_fini(rdev);
K
Kent Russell 已提交
854 855
	if (rdev->stolen_vga_memory) {
		r = radeon_bo_reserve(rdev->stolen_vga_memory, false);
856
		if (r == 0) {
K
Kent Russell 已提交
857 858
			radeon_bo_unpin(rdev->stolen_vga_memory);
			radeon_bo_unreserve(rdev->stolen_vga_memory);
859
		}
K
Kent Russell 已提交
860
		radeon_bo_unref(&rdev->stolen_vga_memory);
861 862 863 864 865
	}
	ttm_bo_clean_mm(&rdev->mman.bdev, TTM_PL_VRAM);
	ttm_bo_clean_mm(&rdev->mman.bdev, TTM_PL_TT);
	ttm_bo_device_release(&rdev->mman.bdev);
	radeon_gart_fini(rdev);
866
	rdev->mman.initialized = false;
867 868 869
	DRM_INFO("radeon: ttm finalized\n");
}

870 871 872 873 874 875 876 877 878 879 880 881 882 883
/* this should only be called at bootup or when userspace
 * isn't running */
void radeon_ttm_set_active_vram_size(struct radeon_device *rdev, u64 size)
{
	struct ttm_mem_type_manager *man;

	if (!rdev->mman.initialized)
		return;

	man = &rdev->mman.bdev.man[TTM_PL_VRAM];
	/* this just adjusts TTM size idea, which sets lpfn to the correct value */
	man->size = size >> PAGE_SHIFT;
}

884
static struct vm_operations_struct radeon_ttm_vm_ops;
885
static const struct vm_operations_struct *ttm_vm_ops = NULL;
886

887
static vm_fault_t radeon_ttm_fault(struct vm_fault *vmf)
888 889
{
	struct ttm_buffer_object *bo;
890
	struct radeon_device *rdev;
891
	vm_fault_t ret;
892

893
	bo = (struct ttm_buffer_object *)vmf->vma->vm_private_data;
894 895 896
	if (bo == NULL) {
		return VM_FAULT_NOPAGE;
	}
897
	rdev = radeon_get_rdev(bo->bdev);
898
	down_read(&rdev->pm.mclk_lock);
899
	ret = ttm_vm_ops->fault(vmf);
900
	up_read(&rdev->pm.mclk_lock);
901
	return ret;
902 903 904 905 906
}

int radeon_mmap(struct file *filp, struct vm_area_struct *vma)
{
	int r;
907 908
	struct drm_file *file_priv = filp->private_data;
	struct radeon_device *rdev = file_priv->minor->dev->dev_private;
909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925

	if (rdev == NULL) {
		return -EINVAL;
	}
	r = ttm_bo_mmap(filp, vma, &rdev->mman.bdev);
	if (unlikely(r != 0)) {
		return r;
	}
	if (unlikely(ttm_vm_ops == NULL)) {
		ttm_vm_ops = vma->vm_ops;
		radeon_ttm_vm_ops = *ttm_vm_ops;
		radeon_ttm_vm_ops.fault = &radeon_ttm_fault;
	}
	vma->vm_ops = &radeon_ttm_vm_ops;
	return 0;
}

926
#if defined(CONFIG_DEBUG_FS)
927

928 929 930
static int radeon_mm_dump_table(struct seq_file *m, void *data)
{
	struct drm_info_node *node = (struct drm_info_node *)m->private;
931
	unsigned ttm_pl = *(int*)node->info_ent->data;
932 933
	struct drm_device *dev = node->minor->dev;
	struct radeon_device *rdev = dev->dev_private;
934
	struct ttm_mem_type_manager *man = &rdev->mman.bdev.man[ttm_pl];
D
Daniel Vetter 已提交
935
	struct drm_printer p = drm_seq_file_printer(m);
936

937
	man->func->debug(man, &p);
D
Daniel Vetter 已提交
938
	return 0;
939
}
940

941

942 943 944 945 946 947 948 949 950 951 952 953
static int ttm_pl_vram = TTM_PL_VRAM;
static int ttm_pl_tt = TTM_PL_TT;

static struct drm_info_list radeon_ttm_debugfs_list[] = {
	{"radeon_vram_mm", radeon_mm_dump_table, 0, &ttm_pl_vram},
	{"radeon_gtt_mm", radeon_mm_dump_table, 0, &ttm_pl_tt},
	{"ttm_page_pool", ttm_page_alloc_debugfs, 0, NULL},
#ifdef CONFIG_SWIOTLB
	{"ttm_dma_page_pool", ttm_dma_page_alloc_debugfs, 0, NULL}
#endif
};

954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005
static int radeon_ttm_vram_open(struct inode *inode, struct file *filep)
{
	struct radeon_device *rdev = inode->i_private;
	i_size_write(inode, rdev->mc.mc_vram_size);
	filep->private_data = inode->i_private;
	return 0;
}

static ssize_t radeon_ttm_vram_read(struct file *f, char __user *buf,
				    size_t size, loff_t *pos)
{
	struct radeon_device *rdev = f->private_data;
	ssize_t result = 0;
	int r;

	if (size & 0x3 || *pos & 0x3)
		return -EINVAL;

	while (size) {
		unsigned long flags;
		uint32_t value;

		if (*pos >= rdev->mc.mc_vram_size)
			return result;

		spin_lock_irqsave(&rdev->mmio_idx_lock, flags);
		WREG32(RADEON_MM_INDEX, ((uint32_t)*pos) | 0x80000000);
		if (rdev->family >= CHIP_CEDAR)
			WREG32(EVERGREEN_MM_INDEX_HI, *pos >> 31);
		value = RREG32(RADEON_MM_DATA);
		spin_unlock_irqrestore(&rdev->mmio_idx_lock, flags);

		r = put_user(value, (uint32_t *)buf);
		if (r)
			return r;

		result += 4;
		buf += 4;
		*pos += 4;
		size -= 4;
	}

	return result;
}

static const struct file_operations radeon_ttm_vram_fops = {
	.owner = THIS_MODULE,
	.open = radeon_ttm_vram_open,
	.read = radeon_ttm_vram_read,
	.llseek = default_llseek
};

1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023
static int radeon_ttm_gtt_open(struct inode *inode, struct file *filep)
{
	struct radeon_device *rdev = inode->i_private;
	i_size_write(inode, rdev->mc.gtt_size);
	filep->private_data = inode->i_private;
	return 0;
}

static ssize_t radeon_ttm_gtt_read(struct file *f, char __user *buf,
				   size_t size, loff_t *pos)
{
	struct radeon_device *rdev = f->private_data;
	ssize_t result = 0;
	int r;

	while (size) {
		loff_t p = *pos / PAGE_SIZE;
		unsigned off = *pos & ~PAGE_MASK;
1024
		size_t cur_size = min_t(size_t, size, PAGE_SIZE - off);
1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059
		struct page *page;
		void *ptr;

		if (p >= rdev->gart.num_cpu_pages)
			return result;

		page = rdev->gart.pages[p];
		if (page) {
			ptr = kmap(page);
			ptr += off;

			r = copy_to_user(buf, ptr, cur_size);
			kunmap(rdev->gart.pages[p]);
		} else
			r = clear_user(buf, cur_size);

		if (r)
			return -EFAULT;

		result += cur_size;
		buf += cur_size;
		*pos += cur_size;
		size -= cur_size;
	}

	return result;
}

static const struct file_operations radeon_ttm_gtt_fops = {
	.owner = THIS_MODULE,
	.open = radeon_ttm_gtt_open,
	.read = radeon_ttm_gtt_read,
	.llseek = default_llseek
};

1060 1061 1062 1063
#endif

static int radeon_ttm_debugfs_init(struct radeon_device *rdev)
{
1064
#if defined(CONFIG_DEBUG_FS)
1065 1066 1067
	unsigned count;

	struct drm_minor *minor = rdev->ddev->primary;
1068 1069 1070 1071 1072 1073 1074 1075
	struct dentry *root = minor->debugfs_root;

	rdev->mman.vram = debugfs_create_file("radeon_vram", S_IFREG | S_IRUGO,
					      root, rdev,
					      &radeon_ttm_vram_fops);

	rdev->mman.gtt = debugfs_create_file("radeon_gtt", S_IFREG | S_IRUGO,
					     root, rdev, &radeon_ttm_gtt_fops);
1076

1077
	count = ARRAY_SIZE(radeon_ttm_debugfs_list);
1078

1079
#ifdef CONFIG_SWIOTLB
1080
	if (!(rdev->need_swiotlb && swiotlb_nr_tbl()))
1081
		--count;
1082
#endif
1083

1084 1085 1086
	return radeon_debugfs_add_files(rdev, radeon_ttm_debugfs_list, count);
#else

1087
	return 0;
1088
#endif
1089
}
1090 1091 1092 1093 1094 1095 1096

static void radeon_ttm_debugfs_fini(struct radeon_device *rdev)
{
#if defined(CONFIG_DEBUG_FS)

	debugfs_remove(rdev->mman.vram);
	rdev->mman.vram = NULL;
1097 1098 1099

	debugfs_remove(rdev->mman.gtt);
	rdev->mman.gtt = NULL;
1100 1101
#endif
}