i915_gem_stolen.c 15.4 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * Copyright © 2008-2012 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 * Authors:
 *    Eric Anholt <eric@anholt.net>
 *    Chris Wilson <chris@chris-wilson.co.uk>
 *
 */

29 30
#include <drm/drmP.h>
#include <drm/i915_drm.h>
31 32 33 34 35 36 37 38 39 40 41 42 43 44
#include "i915_drv.h"

/*
 * The BIOS typically reserves some of the system's memory for the exclusive
 * use of the integrated graphics. This memory is no longer available for
 * use by the OS and so the user finds that his system has less memory
 * available than he put in. We refer to this memory as stolen.
 *
 * The BIOS will allocate its framebuffer from the stolen memory. Our
 * goal is to try to reuse that object for our own fbcon, which must always
 * be available for panics. Anything else we can reuse the stolen memory
 * for is a boon.
 */

45
static unsigned long i915_stolen_to_physical(struct drm_device *dev)
46 47
{
	struct drm_i915_private *dev_priv = dev->dev_private;
48
	struct resource *r;
49 50
	u32 base;

51 52 53 54 55 56 57 58
	/* Almost universally we can find the Graphics Base of Stolen Memory
	 * at offset 0x5c in the igfx configuration space. On a few (desktop)
	 * machines this is also mirrored in the bridge device at different
	 * locations, or in the MCHBAR. On gen2, the layout is again slightly
	 * different with the Graphics Segment immediately following Top of
	 * Memory (or Top of Usable DRAM). Note it appears that TOUD is only
	 * reported by 865g, so we just use the top of memory as determined
	 * by the e820 probe.
59
	 *
60
	 * XXX However gen2 requires an unavailable symbol.
61
	 */
62
	base = 0;
63 64
	if (INTEL_INFO(dev)->gen >= 3) {
		/* Read Graphics Base of Stolen Memory directly */
65 66
		pci_read_config_dword(dev->pdev, 0x5c, &base);
		base &= ~((1<<20) - 1);
67
	} else { /* GEN2 */
68 69 70
#if 0
		/* Stolen is immediately above Top of Memory */
		base = max_low_pfn_mapped << PAGE_SHIFT;
71
#endif
72
	}
73

74 75 76
	if (base == 0)
		return 0;

77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120
	/* make sure we don't clobber the GTT if it's within stolen memory */
	if (INTEL_INFO(dev)->gen <= 4 && !IS_G33(dev) && !IS_G4X(dev)) {
		struct {
			u32 start, end;
		} stolen[2] = {
			{ .start = base, .end = base + dev_priv->gtt.stolen_size, },
			{ .start = base, .end = base + dev_priv->gtt.stolen_size, },
		};
		u64 gtt_start, gtt_end;

		gtt_start = I915_READ(PGTBL_CTL);
		if (IS_GEN4(dev))
			gtt_start = (gtt_start & PGTBL_ADDRESS_LO_MASK) |
				(gtt_start & PGTBL_ADDRESS_HI_MASK) << 28;
		else
			gtt_start &= PGTBL_ADDRESS_LO_MASK;
		gtt_end = gtt_start + gtt_total_entries(dev_priv->gtt) * 4;

		if (gtt_start >= stolen[0].start && gtt_start < stolen[0].end)
			stolen[0].end = gtt_start;
		if (gtt_end > stolen[1].start && gtt_end <= stolen[1].end)
			stolen[1].start = gtt_end;

		/* pick the larger of the two chunks */
		if (stolen[0].end - stolen[0].start >
		    stolen[1].end - stolen[1].start) {
			base = stolen[0].start;
			dev_priv->gtt.stolen_size = stolen[0].end - stolen[0].start;
		} else {
			base = stolen[1].start;
			dev_priv->gtt.stolen_size = stolen[1].end - stolen[1].start;
		}

		if (stolen[0].start != stolen[1].start ||
		    stolen[0].end != stolen[1].end) {
			DRM_DEBUG_KMS("GTT within stolen memory at 0x%llx-0x%llx\n",
				      (unsigned long long) gtt_start,
				      (unsigned long long) gtt_end - 1);
			DRM_DEBUG_KMS("Stolen memory adjusted to 0x%x-0x%x\n",
				      base, base + (u32) dev_priv->gtt.stolen_size - 1);
		}
	}


121 122 123 124 125 126 127 128
	/* Verify that nothing else uses this physical address. Stolen
	 * memory should be reserved by the BIOS and hidden from the
	 * kernel. So if the region is already marked as busy, something
	 * is seriously wrong.
	 */
	r = devm_request_mem_region(dev->dev, base, dev_priv->gtt.stolen_size,
				    "Graphics Stolen Memory");
	if (r == NULL) {
129 130 131 132 133 134 135 136 137 138 139
		/*
		 * One more attempt but this time requesting region from
		 * base + 1, as we have seen that this resolves the region
		 * conflict with the PCI Bus.
		 * This is a BIOS w/a: Some BIOS wrap stolen in the root
		 * PCI bus, but have an off-by-one error. Hence retry the
		 * reservation starting from 1 instead of 0.
		 */
		r = devm_request_mem_region(dev->dev, base + 1,
					    dev_priv->gtt.stolen_size - 1,
					    "Graphics Stolen Memory");
140 141 142 143 144
		/*
		 * GEN3 firmware likes to smash pci bridges into the stolen
		 * range. Apparently this works.
		 */
		if (r == NULL && !IS_GEN3(dev)) {
145 146 147 148
			DRM_ERROR("conflict detected with stolen region: [0x%08x - 0x%08x]\n",
				  base, base + (uint32_t)dev_priv->gtt.stolen_size);
			base = 0;
		}
149 150
	}

151
	return base;
152 153
}

154 155
static int find_compression_threshold(struct drm_device *dev,
				      struct drm_mm_node *node,
B
Ben Widawsky 已提交
156 157
				      int size,
				      int fb_cpp)
158 159
{
	struct drm_i915_private *dev_priv = dev->dev_private;
B
Ben Widawsky 已提交
160
	int compression_threshold = 1;
161
	int ret;
162

B
Ben Widawsky 已提交
163 164 165 166 167 168 169 170
	/* HACK: This code depends on what we will do in *_enable_fbc. If that
	 * code changes, this code needs to change as well.
	 *
	 * The enable_fbc code will attempt to use one of our 2 compression
	 * thresholds, therefore, in that case, we only have 1 resort.
	 */

	/* Try to over-allocate to reduce reallocations and fragmentation. */
171
	ret = drm_mm_insert_node(&dev_priv->mm.stolen, node,
172
				 size <<= 1, 4096, DRM_MM_SEARCH_DEFAULT);
B
Ben Widawsky 已提交
173 174 175 176 177 178 179
	if (ret == 0)
		return compression_threshold;

again:
	/* HW's ability to limit the CFB is 1:4 */
	if (compression_threshold > 4 ||
	    (fb_cpp == 2 && compression_threshold == 2))
180
		return 0;
B
Ben Widawsky 已提交
181 182 183 184 185 186 187 188 189 190

	ret = drm_mm_insert_node(&dev_priv->mm.stolen, node,
				 size >>= 1, 4096,
				 DRM_MM_SEARCH_DEFAULT);
	if (ret && INTEL_INFO(dev)->gen <= 4) {
		return 0;
	} else if (ret) {
		compression_threshold <<= 1;
		goto again;
	} else {
191
		return compression_threshold;
B
Ben Widawsky 已提交
192
	}
193 194
}

B
Ben Widawsky 已提交
195
static int i915_setup_compression(struct drm_device *dev, int size, int fb_cpp)
196 197 198 199 200 201
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_mm_node *uninitialized_var(compressed_llb);
	int ret;

	ret = find_compression_threshold(dev, &dev_priv->fbc.compressed_fb,
B
Ben Widawsky 已提交
202
					 size, fb_cpp);
203
	if (!ret)
204
		goto err_llb;
B
Ben Widawsky 已提交
205 206 207 208 209 210
	else if (ret > 1) {
		DRM_INFO("Reducing the compressed framebuffer size. This may lead to less power savings than a non-reduced-size. Try to increase stolen memory size if available in BIOS.\n");

	}

	dev_priv->fbc.threshold = ret;
211

212
	if (HAS_PCH_SPLIT(dev))
213
		I915_WRITE(ILK_DPFC_CB_BASE, dev_priv->fbc.compressed_fb.start);
214
	else if (IS_GM45(dev)) {
215
		I915_WRITE(DPFC_CB_BASE, dev_priv->fbc.compressed_fb.start);
216
	} else {
217
		compressed_llb = kzalloc(sizeof(*compressed_llb), GFP_KERNEL);
218 219 220
		if (!compressed_llb)
			goto err_fb;

221 222 223 224 225
		ret = drm_mm_insert_node(&dev_priv->mm.stolen, compressed_llb,
					 4096, 4096, DRM_MM_SEARCH_DEFAULT);
		if (ret)
			goto err_fb;

226
		dev_priv->fbc.compressed_llb = compressed_llb;
227 228

		I915_WRITE(FBC_CFB_BASE,
229
			   dev_priv->mm.stolen_base + dev_priv->fbc.compressed_fb.start);
230 231
		I915_WRITE(FBC_LL_BASE,
			   dev_priv->mm.stolen_base + compressed_llb->start);
232 233
	}

234
	dev_priv->fbc.uncompressed_size = size;
235

236 237
	DRM_DEBUG_KMS("reserved %d bytes of contiguous stolen space for FBC\n",
		      size);
238

239
	return 0;
240 241

err_fb:
242
	kfree(compressed_llb);
243
	drm_mm_remove_node(&dev_priv->fbc.compressed_fb);
244
err_llb:
245
	pr_info_once("drm: not enough stolen space for compressed buffer (need %d more bytes), disabling. Hint: you may be able to increase stolen memory size in the BIOS to avoid this.\n", size);
246 247 248
	return -ENOSPC;
}

B
Ben Widawsky 已提交
249
int i915_gem_stolen_setup_compression(struct drm_device *dev, int size, int fb_cpp)
250 251 252
{
	struct drm_i915_private *dev_priv = dev->dev_private;

253
	if (!drm_mm_initialized(&dev_priv->mm.stolen))
254 255
		return -ENODEV;

256
	if (size < dev_priv->fbc.uncompressed_size)
257 258 259 260 261
		return 0;

	/* Release any current block */
	i915_gem_stolen_cleanup_compression(dev);

B
Ben Widawsky 已提交
262
	return i915_setup_compression(dev, size, fb_cpp);
263 264
}

265
void i915_gem_stolen_cleanup_compression(struct drm_device *dev)
266 267 268
{
	struct drm_i915_private *dev_priv = dev->dev_private;

269
	if (dev_priv->fbc.uncompressed_size == 0)
270 271
		return;

272
	drm_mm_remove_node(&dev_priv->fbc.compressed_fb);
273

274 275 276 277
	if (dev_priv->fbc.compressed_llb) {
		drm_mm_remove_node(dev_priv->fbc.compressed_llb);
		kfree(dev_priv->fbc.compressed_llb);
	}
278

279
	dev_priv->fbc.uncompressed_size = 0;
280 281 282 283
}

void i915_gem_cleanup_stolen(struct drm_device *dev)
{
284 285
	struct drm_i915_private *dev_priv = dev->dev_private;

286 287 288
	if (!drm_mm_initialized(&dev_priv->mm.stolen))
		return;

289
	i915_gem_stolen_cleanup_compression(dev);
290
	drm_mm_takedown(&dev_priv->mm.stolen);
291 292 293 294 295
}

int i915_gem_init_stolen(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
296
	u32 tmp;
297
	int bios_reserved = 0;
298

299
#ifdef CONFIG_INTEL_IOMMU
300
	if (intel_iommu_gfx_mapped && INTEL_INFO(dev)->gen < 8) {
301 302 303 304 305
		DRM_INFO("DMAR active, disabling use of stolen memory\n");
		return 0;
	}
#endif

306 307 308
	if (dev_priv->gtt.stolen_size == 0)
		return 0;

309 310 311 312
	dev_priv->mm.stolen_base = i915_stolen_to_physical(dev);
	if (dev_priv->mm.stolen_base == 0)
		return 0;

313 314
	DRM_DEBUG_KMS("found %zd bytes of stolen memory at %08lx\n",
		      dev_priv->gtt.stolen_size, dev_priv->mm.stolen_base);
315

316 317 318 319 320 321 322 323 324 325
	if (INTEL_INFO(dev)->gen >= 8) {
		tmp = I915_READ(GEN7_BIOS_RESERVED);
		tmp >>= GEN8_BIOS_RESERVED_SHIFT;
		tmp &= GEN8_BIOS_RESERVED_MASK;
		bios_reserved = (1024*1024) << tmp;
	} else if (IS_GEN7(dev)) {
		tmp = I915_READ(GEN7_BIOS_RESERVED);
		bios_reserved = tmp & GEN7_BIOS_RESERVED_256K ?
			256*1024 : 1024*1024;
	}
326

327 328 329
	if (WARN_ON(bios_reserved > dev_priv->gtt.stolen_size))
		return 0;

330
	/* Basic memrange allocator for stolen space */
331 332
	drm_mm_init(&dev_priv->mm.stolen, 0, dev_priv->gtt.stolen_size -
		    bios_reserved);
333 334 335

	return 0;
}
336 337 338 339 340 341 342 343 344 345

/*
 * Build a one-entry scatterlist describing a range of stolen memory.
 *
 * @dev:    DRM device
 * @offset: byte offset of the range from the start of stolen memory
 * @size:   length of the range in bytes
 *
 * Returns a newly allocated sg_table whose single entry has its DMA address
 * set to stolen_base + @offset and its length set to @size, or NULL if an
 * allocation failed.  The caller owns the table and must release it with
 * sg_free_table() followed by kfree().
 */
static struct sg_table *
i915_pages_create_for_stolen(struct drm_device *dev,
			     u32 offset, u32 size)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct sg_table *st;
	struct scatterlist *sg;

	DRM_DEBUG_DRIVER("offset=0x%x, size=%u\n", offset, size);
	/*
	 * The range must lie inside stolen memory.  Check size on its own
	 * first: if it exceeded stolen_size the subtraction below could wrap
	 * and let an out-of-range request through.
	 */
	BUG_ON(size > dev_priv->gtt.stolen_size ||
	       offset > dev_priv->gtt.stolen_size - size);

	/* We hide that we have no struct page backing our stolen object
	 * by wrapping the contiguous physical allocation with a fake
	 * dma mapping in a single scatterlist.
	 */

	st = kmalloc(sizeof(*st), GFP_KERNEL);
	if (st == NULL)
		return NULL;

	if (sg_alloc_table(st, 1, GFP_KERNEL)) {
		kfree(st);
		return NULL;
	}

	sg = st->sgl;
	sg->offset = 0;
	sg->length = size;

	sg_dma_address(sg) = (dma_addr_t)dev_priv->mm.stolen_base + offset;
	sg_dma_len(sg) = size;

	return st;
}

/*
 * get_pages hook for stolen objects.  Reaching this function is treated as
 * a driver bug: it calls BUG() unconditionally.  The return statement only
 * satisfies the function signature.
 */
static int i915_gem_object_get_pages_stolen(struct drm_i915_gem_object *obj)
{
	BUG();
	return -EINVAL;
}

/*
 * put_pages hook for stolen objects: releases the scatterlist entries held
 * by obj->pages and then the table structure itself.  obj->pages is not
 * cleared here.
 */
static void i915_gem_object_put_pages_stolen(struct drm_i915_gem_object *obj)
{
	struct sg_table *table = obj->pages;

	/* Should only be called during free */
	sg_free_table(table);
	kfree(table);
}

385 386 387 388 389 390 391 392 393 394

/*
 * release hook for stolen objects: returns the object's stolen node to the
 * allocator, frees the node and clears obj->stolen.  Does nothing when the
 * object has no stolen node.
 */
static void
i915_gem_object_release_stolen(struct drm_i915_gem_object *obj)
{
	struct drm_mm_node *node = obj->stolen;

	if (!node)
		return;

	drm_mm_remove_node(node);
	kfree(node);
	obj->stolen = NULL;
}
395 396 397
static const struct drm_i915_gem_object_ops i915_gem_object_stolen_ops = {
	.get_pages = i915_gem_object_get_pages_stolen,
	.put_pages = i915_gem_object_put_pages_stolen,
398
	.release = i915_gem_object_release_stolen,
399 400 401 402 403 404 405 406
};

static struct drm_i915_gem_object *
_i915_gem_object_create_stolen(struct drm_device *dev,
			       struct drm_mm_node *stolen)
{
	struct drm_i915_gem_object *obj;

407
	obj = i915_gem_object_alloc(dev);
408 409 410
	if (obj == NULL)
		return NULL;

411
	drm_gem_private_object_init(dev, &obj->base, stolen->size);
412 413 414 415 416 417 418 419
	i915_gem_object_init(obj, &i915_gem_object_stolen_ops);

	obj->pages = i915_pages_create_for_stolen(dev,
						  stolen->start, stolen->size);
	if (obj->pages == NULL)
		goto cleanup;

	obj->has_dma_mapping = true;
420
	i915_gem_object_pin_pages(obj);
421 422
	obj->stolen = stolen;

423 424
	obj->base.read_domains = I915_GEM_DOMAIN_CPU | I915_GEM_DOMAIN_GTT;
	obj->cache_level = HAS_LLC(dev) ? I915_CACHE_LLC : I915_CACHE_NONE;
425 426 427 428

	return obj;

cleanup:
429
	i915_gem_object_free(obj);
430 431 432 433 434 435 436 437 438
	return NULL;
}

/*
 * Allocate a GEM object backed by @size bytes of stolen memory.
 *
 * @dev:  DRM device
 * @size: number of bytes to allocate (placed with 4096-byte alignment)
 *
 * Returns the new object, or NULL if the stolen allocator is not
 * initialised, @size is 0, or any allocation fails.
 */
struct drm_i915_gem_object *
i915_gem_object_create_stolen(struct drm_device *dev, u32 size)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_gem_object *obj;
	struct drm_mm_node *stolen;
	int ret;

	if (!drm_mm_initialized(&dev_priv->mm.stolen))
		return NULL;

	DRM_DEBUG_KMS("creating stolen object: size=%x\n", size);
	if (size == 0)
		return NULL;

	stolen = kzalloc(sizeof(*stolen), GFP_KERNEL);
	if (!stolen)
		return NULL;

	ret = drm_mm_insert_node(&dev_priv->mm.stolen, stolen, size,
				 4096, DRM_MM_SEARCH_DEFAULT);
	if (ret) {
		kfree(stolen);
		return NULL;
	}

	obj = _i915_gem_object_create_stolen(dev, stolen);
	if (obj)
		return obj;

	/* Object creation failed before it took the node: release it here */
	drm_mm_remove_node(stolen);
	kfree(stolen);
	return NULL;
}

468 469 470 471 472 473 474
/*
 * Create a GEM object for a range of stolen memory that is already in use.
 *
 * @dev:           DRM device
 * @stolen_offset: page-aligned offset of the range within stolen memory
 * @gtt_offset:    global GTT offset the range is mapped at, or
 *                 I915_GTT_OFFSET_NONE if no GTT binding is wanted
 * @size:          page-aligned, non-zero length of the range in bytes
 *
 * Reserves exactly [@stolen_offset, @stolen_offset + @size) in the stolen
 * allocator, wraps it in a GEM object and, unless @gtt_offset is
 * I915_GTT_OFFSET_NONE, reserves the matching global GTT range and marks the
 * object as bound there.
 *
 * Returns the new object, or NULL on any failure.
 */
struct drm_i915_gem_object *
i915_gem_object_create_stolen_for_preallocated(struct drm_device *dev,
					       u32 stolen_offset,
					       u32 gtt_offset,
					       u32 size)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct i915_address_space *ggtt = &dev_priv->gtt.base;
	struct drm_i915_gem_object *obj;
	struct drm_mm_node *stolen;
	struct i915_vma *vma;
	int ret;

	if (!drm_mm_initialized(&dev_priv->mm.stolen))
		return NULL;

	DRM_DEBUG_KMS("creating preallocated stolen object: stolen_offset=%x, gtt_offset=%x, size=%x\n",
			stolen_offset, gtt_offset, size);

	/* KISS and expect everything to be page-aligned */
	BUG_ON(stolen_offset & 4095);
	BUG_ON(size & 4095);

	if (WARN_ON(size == 0))
		return NULL;

	stolen = kzalloc(sizeof(*stolen), GFP_KERNEL);
	if (!stolen)
		return NULL;

	stolen->start = stolen_offset;
	stolen->size = size;
	ret = drm_mm_reserve_node(&dev_priv->mm.stolen, stolen);
	if (ret) {
		DRM_DEBUG_KMS("failed to allocate stolen space\n");
		kfree(stolen);
		return NULL;
	}

	obj = _i915_gem_object_create_stolen(dev, stolen);
	if (obj == NULL) {
		DRM_DEBUG_KMS("failed to allocate stolen object\n");
		/* The object never took the node, so release it here */
		drm_mm_remove_node(stolen);
		kfree(stolen);
		return NULL;
	}

	/* Some objects just need physical mem from stolen space */
	if (gtt_offset == I915_GTT_OFFSET_NONE)
		return obj;

	vma = i915_gem_obj_lookup_or_create_vma(obj, ggtt);
	if (IS_ERR(vma)) {
		ret = PTR_ERR(vma);
		goto err_out;
	}

	/* To simplify the initialisation sequence between KMS and GTT,
	 * we allow construction of the stolen object prior to
	 * setting up the GTT space. The actual reservation will occur
	 * later.
	 */
	vma->node.start = gtt_offset;
	vma->node.size = size;
	if (drm_mm_initialized(&ggtt->mm)) {
		ret = drm_mm_reserve_node(&ggtt->mm, &vma->node);
		if (ret) {
			DRM_DEBUG_KMS("failed to allocate stolen GTT space\n");
			goto err_vma;
		}
	}

	vma->bound |= GLOBAL_BIND;

	list_add_tail(&obj->global_list, &dev_priv->mm.bound_list);
	list_add_tail(&vma->mm_list, &ggtt->inactive_list);
	i915_gem_object_pin_pages(obj);

	return obj;

err_vma:
	i915_gem_vma_destroy(vma);
err_out:
	/*
	 * From here on the node belongs to the object (obj->stolen), and the
	 * object's release hook, i915_gem_object_release_stolen(), removes it
	 * from the allocator and frees it.  Releasing it here as well would
	 * remove and free the same node twice, so only drop the reference.
	 * NOTE(review): relies on the final unreference invoking ops->release
	 * -- confirm against the object free path.
	 */
	drm_gem_object_unreference(&obj->base);
	return NULL;
}