intel_fbc.c 30.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * Copyright © 2014 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */

R
Rodrigo Vivi 已提交
24 25 26 27 28 29
/**
 * DOC: Frame Buffer Compression (FBC)
 *
 * FBC tries to save memory bandwidth (and so power consumption) by
 * compressing the amount of memory used by the display. It is totally
 * transparent to user space and completely handled in the kernel.
30 31
 *
 * The benefits of FBC are mostly visible with solid backgrounds and
R
Rodrigo Vivi 已提交
32 33
 * variation-less patterns. It comes from keeping the memory footprint small
 * and having fewer memory pages opened and accessed for refreshing the display.
34
 *
R
Rodrigo Vivi 已提交
35 36 37 38
 * i915 is responsible for reserving stolen memory for FBC and configuring its
 * offset in the proper registers. The hardware takes care of all
 * compress/decompress. However there are many known cases where we have to
 * forcibly disable it to allow proper screen updates.
39 40
 */

R
Rodrigo Vivi 已提交
41 42 43
#include "intel_drv.h"
#include "i915_drv.h"

P
Paulo Zanoni 已提交
44 45 46 47 48
/* Report whether an enable hook has been installed in dev_priv->fbc. */
static inline bool fbc_supported(struct drm_i915_private *dev_priv)
{
	return !!dev_priv->fbc.enable_fbc;
}

49 50 51 52 53
static inline bool fbc_on_pipe_a_only(struct drm_i915_private *dev_priv)
{
	return IS_HASWELL(dev_priv) || INTEL_INFO(dev_priv)->gen >= 8;
}

54 55 56 57 58 59 60 61 62 63 64 65 66
/*
 * In some platforms where the CRTC's x:0/y:0 coordinates don't match the
 * frontbuffer's x:0/y:0 coordinates we lie to the hardware about the plane's
 * origin so the x and y offsets can actually fit the registers. As a
 * consequence, the fence doesn't really start exactly at the display plane
 * address we program because it starts at the real start of the buffer, so we
 * have to take this into consideration here.
 */
static unsigned int get_crtc_fence_y_offset(struct intel_crtc *crtc)
{
	/* Difference between the CRTC's y and its adjusted_y value. */
	unsigned int y_delta = crtc->base.y - crtc->adjusted_y;

	return y_delta;
}

67
static void i8xx_fbc_disable(struct drm_i915_private *dev_priv)
68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89
{
	u32 fbc_ctl;

	dev_priv->fbc.enabled = false;

	/* Disable compression */
	fbc_ctl = I915_READ(FBC_CONTROL);
	if ((fbc_ctl & FBC_CTL_EN) == 0)
		return;

	fbc_ctl &= ~FBC_CTL_EN;
	I915_WRITE(FBC_CONTROL, fbc_ctl);

	/* Wait for compressing bit to clear */
	if (wait_for((I915_READ(FBC_STATUS) & FBC_STAT_COMPRESSING) == 0, 10)) {
		DRM_DEBUG_KMS("FBC idle timed out\n");
		return;
	}

	DRM_DEBUG_KMS("disabled FBC\n");
}

90
static void i8xx_fbc_enable(struct intel_crtc *crtc)
91
{
92 93
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
	struct drm_framebuffer *fb = crtc->base.primary->fb;
94 95 96 97 98 99 100
	struct drm_i915_gem_object *obj = intel_fb_obj(fb);
	int cfb_pitch;
	int i;
	u32 fbc_ctl;

	dev_priv->fbc.enabled = true;

101 102
	/* Note: fbc.threshold == 1 for i8xx */
	cfb_pitch = dev_priv->fbc.uncompressed_size / FBC_LL_SIZE;
103 104 105 106
	if (fb->pitches[0] < cfb_pitch)
		cfb_pitch = fb->pitches[0];

	/* FBC_CTL wants 32B or 64B units */
107
	if (IS_GEN2(dev_priv))
108 109 110 111 112 113
		cfb_pitch = (cfb_pitch / 32) - 1;
	else
		cfb_pitch = (cfb_pitch / 64) - 1;

	/* Clear old tags */
	for (i = 0; i < (FBC_LL_SIZE / 32) + 1; i++)
114
		I915_WRITE(FBC_TAG(i), 0);
115

116
	if (IS_GEN4(dev_priv)) {
117 118 119 120
		u32 fbc_ctl2;

		/* Set it up... */
		fbc_ctl2 = FBC_CTL_FENCE_DBL | FBC_CTL_IDLE_IMM | FBC_CTL_CPU_FENCE;
121
		fbc_ctl2 |= FBC_CTL_PLANE(crtc->plane);
122
		I915_WRITE(FBC_CONTROL2, fbc_ctl2);
123
		I915_WRITE(FBC_FENCE_OFF, get_crtc_fence_y_offset(crtc));
124 125 126 127 128 129
	}

	/* enable it... */
	fbc_ctl = I915_READ(FBC_CONTROL);
	fbc_ctl &= 0x3fff << FBC_CTL_INTERVAL_SHIFT;
	fbc_ctl |= FBC_CTL_EN | FBC_CTL_PERIODIC;
130
	if (IS_I945GM(dev_priv))
131 132 133 134 135 136
		fbc_ctl |= FBC_CTL_C3_IDLE; /* 945 needs special SR handling */
	fbc_ctl |= (cfb_pitch & 0xff) << FBC_CTL_STRIDE_SHIFT;
	fbc_ctl |= obj->fence_reg;
	I915_WRITE(FBC_CONTROL, fbc_ctl);

	DRM_DEBUG_KMS("enabled FBC, pitch %d, yoff %d, plane %c\n",
137
		      cfb_pitch, crtc->base.y, plane_name(crtc->plane));
138 139
}

140
static bool i8xx_fbc_enabled(struct drm_i915_private *dev_priv)
141 142 143 144
{
	return I915_READ(FBC_CONTROL) & FBC_CTL_EN;
}

145
static void g4x_fbc_enable(struct intel_crtc *crtc)
146
{
147 148
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
	struct drm_framebuffer *fb = crtc->base.primary->fb;
149 150 151 152 153
	struct drm_i915_gem_object *obj = intel_fb_obj(fb);
	u32 dpfc_ctl;

	dev_priv->fbc.enabled = true;

154
	dpfc_ctl = DPFC_CTL_PLANE(crtc->plane) | DPFC_SR_EN;
155 156 157 158 159 160
	if (drm_format_plane_cpp(fb->pixel_format, 0) == 2)
		dpfc_ctl |= DPFC_CTL_LIMIT_2X;
	else
		dpfc_ctl |= DPFC_CTL_LIMIT_1X;
	dpfc_ctl |= DPFC_CTL_FENCE_EN | obj->fence_reg;

161
	I915_WRITE(DPFC_FENCE_YOFF, get_crtc_fence_y_offset(crtc));
162 163 164 165

	/* enable it... */
	I915_WRITE(DPFC_CONTROL, dpfc_ctl | DPFC_CTL_EN);

166
	DRM_DEBUG_KMS("enabled fbc on plane %c\n", plane_name(crtc->plane));
167 168
}

169
static void g4x_fbc_disable(struct drm_i915_private *dev_priv)
170 171 172 173 174 175 176 177 178 179 180 181 182 183 184
{
	u32 dpfc_ctl;

	dev_priv->fbc.enabled = false;

	/* Disable compression */
	dpfc_ctl = I915_READ(DPFC_CONTROL);
	if (dpfc_ctl & DPFC_CTL_EN) {
		dpfc_ctl &= ~DPFC_CTL_EN;
		I915_WRITE(DPFC_CONTROL, dpfc_ctl);

		DRM_DEBUG_KMS("disabled FBC\n");
	}
}

185
static bool g4x_fbc_enabled(struct drm_i915_private *dev_priv)
186 187 188 189
{
	return I915_READ(DPFC_CONTROL) & DPFC_CTL_EN;
}

190 191
/* This function forces a CFB recompression through the nuke operation. */
static void intel_fbc_recompress(struct drm_i915_private *dev_priv)
192
{
193 194
	I915_WRITE(MSG_FBC_REND_STATE, FBC_REND_NUKE);
	POSTING_READ(MSG_FBC_REND_STATE);
195 196
}

197
static void ilk_fbc_enable(struct intel_crtc *crtc)
198
{
199 200
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
	struct drm_framebuffer *fb = crtc->base.primary->fb;
201 202
	struct drm_i915_gem_object *obj = intel_fb_obj(fb);
	u32 dpfc_ctl;
203
	int threshold = dev_priv->fbc.threshold;
204
	unsigned int y_offset;
205 206 207

	dev_priv->fbc.enabled = true;

208
	dpfc_ctl = DPFC_CTL_PLANE(crtc->plane);
209
	if (drm_format_plane_cpp(fb->pixel_format, 0) == 2)
210
		threshold++;
211

212
	switch (threshold) {
213 214 215 216 217 218 219 220 221 222 223 224
	case 4:
	case 3:
		dpfc_ctl |= DPFC_CTL_LIMIT_4X;
		break;
	case 2:
		dpfc_ctl |= DPFC_CTL_LIMIT_2X;
		break;
	case 1:
		dpfc_ctl |= DPFC_CTL_LIMIT_1X;
		break;
	}
	dpfc_ctl |= DPFC_CTL_FENCE_EN;
225
	if (IS_GEN5(dev_priv))
226 227
		dpfc_ctl |= obj->fence_reg;

228 229
	y_offset = get_crtc_fence_y_offset(crtc);
	I915_WRITE(ILK_DPFC_FENCE_YOFF, y_offset);
230 231 232 233
	I915_WRITE(ILK_FBC_RT_BASE, i915_gem_obj_ggtt_offset(obj) | ILK_FBC_RT_VALID);
	/* enable it... */
	I915_WRITE(ILK_DPFC_CONTROL, dpfc_ctl | DPFC_CTL_EN);

234
	if (IS_GEN6(dev_priv)) {
235 236
		I915_WRITE(SNB_DPFC_CTL_SA,
			   SNB_CPU_FENCE_ENABLE | obj->fence_reg);
237
		I915_WRITE(DPFC_CPU_FENCE_OFFSET, y_offset);
238 239
	}

240
	intel_fbc_recompress(dev_priv);
241

242
	DRM_DEBUG_KMS("enabled fbc on plane %c\n", plane_name(crtc->plane));
243 244
}

245
static void ilk_fbc_disable(struct drm_i915_private *dev_priv)
246 247 248 249 250 251 252 253 254 255 256 257 258 259 260
{
	u32 dpfc_ctl;

	dev_priv->fbc.enabled = false;

	/* Disable compression */
	dpfc_ctl = I915_READ(ILK_DPFC_CONTROL);
	if (dpfc_ctl & DPFC_CTL_EN) {
		dpfc_ctl &= ~DPFC_CTL_EN;
		I915_WRITE(ILK_DPFC_CONTROL, dpfc_ctl);

		DRM_DEBUG_KMS("disabled FBC\n");
	}
}

261
static bool ilk_fbc_enabled(struct drm_i915_private *dev_priv)
262 263 264 265
{
	return I915_READ(ILK_DPFC_CONTROL) & DPFC_CTL_EN;
}

266
static void gen7_fbc_enable(struct intel_crtc *crtc)
267
{
268 269
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
	struct drm_framebuffer *fb = crtc->base.primary->fb;
270 271
	struct drm_i915_gem_object *obj = intel_fb_obj(fb);
	u32 dpfc_ctl;
272
	int threshold = dev_priv->fbc.threshold;
273 274 275

	dev_priv->fbc.enabled = true;

276
	dpfc_ctl = 0;
277
	if (IS_IVYBRIDGE(dev_priv))
278
		dpfc_ctl |= IVB_DPFC_CTL_PLANE(crtc->plane);
279

280
	if (drm_format_plane_cpp(fb->pixel_format, 0) == 2)
281
		threshold++;
282

283
	switch (threshold) {
284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300
	case 4:
	case 3:
		dpfc_ctl |= DPFC_CTL_LIMIT_4X;
		break;
	case 2:
		dpfc_ctl |= DPFC_CTL_LIMIT_2X;
		break;
	case 1:
		dpfc_ctl |= DPFC_CTL_LIMIT_1X;
		break;
	}

	dpfc_ctl |= IVB_DPFC_CTL_FENCE_EN;

	if (dev_priv->fbc.false_color)
		dpfc_ctl |= FBC_CTL_FALSE_COLOR;

301
	if (IS_IVYBRIDGE(dev_priv)) {
302 303 304 305
		/* WaFbcAsynchFlipDisableFbcQueue:ivb */
		I915_WRITE(ILK_DISPLAY_CHICKEN1,
			   I915_READ(ILK_DISPLAY_CHICKEN1) |
			   ILK_FBCQ_DIS);
306
	} else if (IS_HASWELL(dev_priv) || IS_BROADWELL(dev_priv)) {
307
		/* WaFbcAsynchFlipDisableFbcQueue:hsw,bdw */
308 309
		I915_WRITE(CHICKEN_PIPESL_1(crtc->pipe),
			   I915_READ(CHICKEN_PIPESL_1(crtc->pipe)) |
310 311 312
			   HSW_FBCQ_DIS);
	}

313 314
	I915_WRITE(ILK_DPFC_CONTROL, dpfc_ctl | DPFC_CTL_EN);

315 316
	I915_WRITE(SNB_DPFC_CTL_SA,
		   SNB_CPU_FENCE_ENABLE | obj->fence_reg);
317
	I915_WRITE(DPFC_CPU_FENCE_OFFSET, get_crtc_fence_y_offset(crtc));
318

319
	intel_fbc_recompress(dev_priv);
320

321
	DRM_DEBUG_KMS("enabled fbc on plane %c\n", plane_name(crtc->plane));
322 323
}

R
Rodrigo Vivi 已提交
324 325
/**
 * intel_fbc_enabled - Is FBC enabled?
326
 * @dev_priv: i915 device instance
R
Rodrigo Vivi 已提交
327 328 329 330 331
 *
 * This function is used to verify the current state of FBC.
 * FIXME: This should be tracked in the plane config eventually
 *        instead of queried at runtime for most callers.
 */
332
bool intel_fbc_enabled(struct drm_i915_private *dev_priv)
333 334 335 336
{
	return dev_priv->fbc.enabled;
}

337 338 339 340 341 342 343 344 345 346 347 348
/*
 * Invoke the platform enable hook for @crtc, then record the CRTC, the
 * framebuffer id and the CRTC's y in dev_priv->fbc.
 */
static void intel_fbc_enable(struct intel_crtc *crtc,
			     const struct drm_framebuffer *fb)
{
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;

	dev_priv->fbc.enable_fbc(crtc);

	/* Remember what FBC was enabled for. */
	dev_priv->fbc.y = crtc->base.y;
	dev_priv->fbc.fb_id = fb->base.id;
	dev_priv->fbc.crtc = crtc;
}

349 350 351 352 353
static void intel_fbc_work_fn(struct work_struct *__work)
{
	struct intel_fbc_work *work =
		container_of(to_delayed_work(__work),
			     struct intel_fbc_work, work);
354 355
	struct drm_i915_private *dev_priv = work->crtc->base.dev->dev_private;
	struct drm_framebuffer *crtc_fb = work->crtc->base.primary->fb;
356

P
Paulo Zanoni 已提交
357
	mutex_lock(&dev_priv->fbc.lock);
358 359 360 361
	if (work == dev_priv->fbc.fbc_work) {
		/* Double check that we haven't switched fb without cancelling
		 * the prior work.
		 */
362 363
		if (crtc_fb == work->fb)
			intel_fbc_enable(work->crtc, work->fb);
364 365 366

		dev_priv->fbc.fbc_work = NULL;
	}
P
Paulo Zanoni 已提交
367
	mutex_unlock(&dev_priv->fbc.lock);
368 369 370 371 372 373

	kfree(work);
}

static void intel_fbc_cancel_work(struct drm_i915_private *dev_priv)
{
P
Paulo Zanoni 已提交
374 375
	WARN_ON(!mutex_is_locked(&dev_priv->fbc.lock));

376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396
	if (dev_priv->fbc.fbc_work == NULL)
		return;

	DRM_DEBUG_KMS("cancelling pending FBC enable\n");

	/* Synchronisation is provided by struct_mutex and checking of
	 * dev_priv->fbc.fbc_work, so we can perform the cancellation
	 * entirely asynchronously.
	 */
	if (cancel_delayed_work(&dev_priv->fbc.fbc_work->work))
		/* tasklet was killed before being run, clean up */
		kfree(dev_priv->fbc.fbc_work);

	/* Mark the work as no longer wanted so that if it does
	 * wake-up (because the work was already running and waiting
	 * for our mutex), it will discover that is no longer
	 * necessary to run.
	 */
	dev_priv->fbc.fbc_work = NULL;
}

397
static void intel_fbc_schedule_enable(struct intel_crtc *crtc)
398 399
{
	struct intel_fbc_work *work;
400
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
401

P
Paulo Zanoni 已提交
402 403
	WARN_ON(!mutex_is_locked(&dev_priv->fbc.lock));

404 405 406 407 408
	intel_fbc_cancel_work(dev_priv);

	work = kzalloc(sizeof(*work), GFP_KERNEL);
	if (work == NULL) {
		DRM_ERROR("Failed to allocate FBC work structure\n");
409
		intel_fbc_enable(crtc, crtc->base.primary->fb);
410 411 412 413
		return;
	}

	work->crtc = crtc;
414
	work->fb = crtc->base.primary->fb;
415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434
	INIT_DELAYED_WORK(&work->work, intel_fbc_work_fn);

	dev_priv->fbc.fbc_work = work;

	/* Delay the actual enabling to let pageflipping cease and the
	 * display to settle before starting the compression. Note that
	 * this delay also serves a second purpose: it allows for a
	 * vblank to pass after disabling the FBC before we attempt
	 * to modify the control registers.
	 *
	 * A more complicated solution would involve tracking vblanks
	 * following the termination of the page-flipping sequence
	 * and indeed performing the enable as a co-routine and not
	 * waiting synchronously upon the vblank.
	 *
	 * WaFbcWaitForVBlankBeforeEnable:ilk,snb
	 */
	schedule_delayed_work(&work->work, msecs_to_jiffies(50));
}

435
static void __intel_fbc_disable(struct drm_i915_private *dev_priv)
P
Paulo Zanoni 已提交
436 437 438 439 440
{
	WARN_ON(!mutex_is_locked(&dev_priv->fbc.lock));

	intel_fbc_cancel_work(dev_priv);

441
	dev_priv->fbc.disable_fbc(dev_priv);
P
Paulo Zanoni 已提交
442 443 444
	dev_priv->fbc.crtc = NULL;
}

R
Rodrigo Vivi 已提交
445 446
/**
 * intel_fbc_disable - disable FBC
447
 * @dev_priv: i915 device instance
R
Rodrigo Vivi 已提交
448 449 450
 *
 * This function disables FBC.
 */
451
void intel_fbc_disable(struct drm_i915_private *dev_priv)
452
{
P
Paulo Zanoni 已提交
453
	if (!fbc_supported(dev_priv))
454 455
		return;

P
Paulo Zanoni 已提交
456
	mutex_lock(&dev_priv->fbc.lock);
457
	__intel_fbc_disable(dev_priv);
P
Paulo Zanoni 已提交
458 459
	mutex_unlock(&dev_priv->fbc.lock);
}
460

P
Paulo Zanoni 已提交
461 462 463 464 465 466 467 468
/**
 * intel_fbc_disable_crtc - disable FBC if it's associated with crtc
 * @crtc: the CRTC
 *
 * This function disables FBC if it's associated with the provided CRTC.
 */
void intel_fbc_disable_crtc(struct intel_crtc *crtc)
{
469
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
470

P
Paulo Zanoni 已提交
471
	if (!fbc_supported(dev_priv))
472 473
		return;

P
Paulo Zanoni 已提交
474 475
	mutex_lock(&dev_priv->fbc.lock);
	if (dev_priv->fbc.crtc == crtc)
476
		__intel_fbc_disable(dev_priv);
P
Paulo Zanoni 已提交
477
	mutex_unlock(&dev_priv->fbc.lock);
478 479
}

480
static void set_no_fbc_reason(struct drm_i915_private *dev_priv,
481
			      const char *reason)
482 483
{
	if (dev_priv->fbc.no_fbc_reason == reason)
484
		return;
485 486

	dev_priv->fbc.no_fbc_reason = reason;
487
	DRM_DEBUG_KMS("Disabling FBC: %s\n", reason);
488 489
}

490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505
/*
 * A CRTC qualifies when it passes the pipe-A-only restriction (where that
 * applies), is active, and has a visible primary plane.
 */
static bool crtc_is_valid(struct intel_crtc *crtc)
{
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
	bool wrong_pipe;

	wrong_pipe = fbc_on_pipe_a_only(dev_priv) && crtc->pipe != PIPE_A;

	return !wrong_pipe &&
	       intel_crtc_active(&crtc->base) &&
	       to_intel_plane_state(crtc->base.primary->state)->visible;
}

506 507 508
static struct drm_crtc *intel_fbc_find_crtc(struct drm_i915_private *dev_priv)
{
	struct drm_crtc *crtc = NULL, *tmp_crtc;
509 510 511 512
	enum pipe pipe;

	for_each_pipe(dev_priv, pipe) {
		tmp_crtc = dev_priv->pipe_to_crtc_mapping[pipe];
513

514
		if (crtc_is_valid(to_intel_crtc(tmp_crtc)))
515 516 517
			crtc = tmp_crtc;
	}

518
	if (!crtc)
519 520 521 522 523
		return NULL;

	return crtc;
}

524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543
/*
 * Always true for gen > 4. On older parts, true only when fewer than two
 * pipes are active with a visible primary plane.
 */
static bool multiple_pipes_ok(struct drm_i915_private *dev_priv)
{
	int active_visible = 0;
	enum pipe pipe;

	if (INTEL_INFO(dev_priv)->gen > 4)
		return true;

	for_each_pipe(dev_priv, pipe) {
		struct drm_crtc *crtc = dev_priv->pipe_to_crtc_mapping[pipe];

		if (!intel_crtc_active(crtc))
			continue;

		if (to_intel_plane_state(crtc->primary->state)->visible)
			active_visible++;
	}

	return active_visible <= 1;
}

544
static int find_compression_threshold(struct drm_i915_private *dev_priv,
545 546 547 548 549 550
				      struct drm_mm_node *node,
				      int size,
				      int fb_cpp)
{
	int compression_threshold = 1;
	int ret;
551 552 553 554 555 556
	u64 end;

	/* The FBC hardware for BDW/SKL doesn't have access to the stolen
	 * reserved range size, so it always assumes the maximum (8mb) is used.
	 * If we enable FBC using a CFB on that memory range we'll get FIFO
	 * underruns, even if that range is not reserved by the BIOS. */
557 558
	if (IS_BROADWELL(dev_priv) ||
	    IS_SKYLAKE(dev_priv) || IS_KABYLAKE(dev_priv))
559 560 561
		end = dev_priv->gtt.stolen_size - 8 * 1024 * 1024;
	else
		end = dev_priv->gtt.stolen_usable_size;
562 563 564 565 566 567 568 569 570

	/* HACK: This code depends on what we will do in *_enable_fbc. If that
	 * code changes, this code needs to change as well.
	 *
	 * The enable_fbc code will attempt to use one of our 2 compression
	 * thresholds, therefore, in that case, we only have 1 resort.
	 */

	/* Try to over-allocate to reduce reallocations and fragmentation. */
571 572
	ret = i915_gem_stolen_insert_node_in_range(dev_priv, node, size <<= 1,
						   4096, 0, end);
573 574 575 576 577 578 579 580 581
	if (ret == 0)
		return compression_threshold;

again:
	/* HW's ability to limit the CFB is 1:4 */
	if (compression_threshold > 4 ||
	    (fb_cpp == 2 && compression_threshold == 2))
		return 0;

582 583
	ret = i915_gem_stolen_insert_node_in_range(dev_priv, node, size >>= 1,
						   4096, 0, end);
584
	if (ret && INTEL_INFO(dev_priv)->gen <= 4) {
585 586 587 588 589 590 591 592 593
		return 0;
	} else if (ret) {
		compression_threshold <<= 1;
		goto again;
	} else {
		return compression_threshold;
	}
}

594 595
static int intel_fbc_alloc_cfb(struct drm_i915_private *dev_priv, int size,
			       int fb_cpp)
596 597 598 599
{
	struct drm_mm_node *uninitialized_var(compressed_llb);
	int ret;

600
	ret = find_compression_threshold(dev_priv, &dev_priv->fbc.compressed_fb,
601 602 603 604 605 606 607 608 609 610 611 612
					 size, fb_cpp);
	if (!ret)
		goto err_llb;
	else if (ret > 1) {
		DRM_INFO("Reducing the compressed framebuffer size. This may lead to less power savings than a non-reduced-size. Try to increase stolen memory size if available in BIOS.\n");

	}

	dev_priv->fbc.threshold = ret;

	if (INTEL_INFO(dev_priv)->gen >= 5)
		I915_WRITE(ILK_DPFC_CB_BASE, dev_priv->fbc.compressed_fb.start);
613
	else if (IS_GM45(dev_priv)) {
614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634
		I915_WRITE(DPFC_CB_BASE, dev_priv->fbc.compressed_fb.start);
	} else {
		compressed_llb = kzalloc(sizeof(*compressed_llb), GFP_KERNEL);
		if (!compressed_llb)
			goto err_fb;

		ret = i915_gem_stolen_insert_node(dev_priv, compressed_llb,
						  4096, 4096);
		if (ret)
			goto err_fb;

		dev_priv->fbc.compressed_llb = compressed_llb;

		I915_WRITE(FBC_CFB_BASE,
			   dev_priv->mm.stolen_base + dev_priv->fbc.compressed_fb.start);
		I915_WRITE(FBC_LL_BASE,
			   dev_priv->mm.stolen_base + compressed_llb->start);
	}

	dev_priv->fbc.uncompressed_size = size;

635 636 637
	DRM_DEBUG_KMS("reserved %llu bytes of contiguous stolen space for FBC, threshold: %d\n",
		      dev_priv->fbc.compressed_fb.size,
		      dev_priv->fbc.threshold);
638 639 640 641 642 643 644 645 646 647 648

	return 0;

err_fb:
	kfree(compressed_llb);
	i915_gem_stolen_remove_node(dev_priv, &dev_priv->fbc.compressed_fb);
err_llb:
	pr_info_once("drm: not enough stolen space for compressed buffer (need %d more bytes), disabling. Hint: you may be able to increase stolen memory size in the BIOS to avoid this.\n", size);
	return -ENOSPC;
}

649
static void __intel_fbc_cleanup_cfb(struct drm_i915_private *dev_priv)
650 651 652 653 654 655 656 657 658 659 660 661 662 663 664
{
	if (dev_priv->fbc.uncompressed_size == 0)
		return;

	i915_gem_stolen_remove_node(dev_priv, &dev_priv->fbc.compressed_fb);

	if (dev_priv->fbc.compressed_llb) {
		i915_gem_stolen_remove_node(dev_priv,
					    dev_priv->fbc.compressed_llb);
		kfree(dev_priv->fbc.compressed_llb);
	}

	dev_priv->fbc.uncompressed_size = 0;
}

665
void intel_fbc_cleanup_cfb(struct drm_i915_private *dev_priv)
P
Paulo Zanoni 已提交
666
{
P
Paulo Zanoni 已提交
667
	if (!fbc_supported(dev_priv))
668 669
		return;

P
Paulo Zanoni 已提交
670
	mutex_lock(&dev_priv->fbc.lock);
671
	__intel_fbc_cleanup_cfb(dev_priv);
P
Paulo Zanoni 已提交
672 673 674
	mutex_unlock(&dev_priv->fbc.lock);
}

P
Paulo Zanoni 已提交
675 676 677 678 679 680 681
/*
 * For SKL+, the plane source size used by the hardware is based on the value we
 * write to the PLANE_SIZE register. For BDW-, the hardware looks at the value
 * we wrote to PIPESRC.
 */
static void intel_fbc_get_plane_source_size(struct intel_crtc *crtc,
					    int *width, int *height)
682
{
P
Paulo Zanoni 已提交
683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722
	struct intel_plane_state *plane_state =
			to_intel_plane_state(crtc->base.primary->state);
	int w, h;

	if (intel_rotation_90_or_270(plane_state->base.rotation)) {
		w = drm_rect_height(&plane_state->src) >> 16;
		h = drm_rect_width(&plane_state->src) >> 16;
	} else {
		w = drm_rect_width(&plane_state->src) >> 16;
		h = drm_rect_height(&plane_state->src) >> 16;
	}

	if (width)
		*width = w;
	if (height)
		*height = h;
}

/*
 * Size in bytes needed for the CRTC's primary plane: source height (capped
 * at 2048 lines on gen >= 7) times the framebuffer pitch.
 */
static int intel_fbc_calculate_cfb_size(struct intel_crtc *crtc)
{
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
	struct drm_framebuffer *fb = crtc->base.primary->fb;
	int nlines;

	intel_fbc_get_plane_source_size(crtc, NULL, &nlines);

	if (INTEL_INFO(dev_priv)->gen >= 7 && nlines > 2048)
		nlines = 2048;

	return nlines * fb->pitches[0];
}

static int intel_fbc_setup_cfb(struct intel_crtc *crtc)
{
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
	struct drm_framebuffer *fb = crtc->base.primary->fb;
	int size, cpp;

	size = intel_fbc_calculate_cfb_size(crtc);
	cpp = drm_format_plane_cpp(fb->pixel_format, 0);

723 724 725 726
	if (size <= dev_priv->fbc.uncompressed_size)
		return 0;

	/* Release any current block */
727
	__intel_fbc_cleanup_cfb(dev_priv);
728

P
Paulo Zanoni 已提交
729
	return intel_fbc_alloc_cfb(dev_priv, size, cpp);
730 731
}

732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752
/* Check @stride against the FBC stride restrictions of the platform. */
static bool stride_is_valid(struct drm_i915_private *dev_priv,
			    unsigned int stride)
{
	/* These should have been caught earlier. */
	WARN_ON(stride < 512);
	WARN_ON(stride % 64 != 0);

	/* Below are the additional FBC restrictions. */

	/* gen2/gen3: only two exact strides are accepted */
	if (IS_GEN2(dev_priv) || IS_GEN3(dev_priv))
		return stride == 4096 || stride == 8192;

	/* gen4 other than G4X: at least 2048 */
	if (IS_GEN4(dev_priv) && !IS_G4X(dev_priv) && stride < 2048)
		return false;

	/* everything that gets here: at most 16384 */
	return stride <= 16384;
}

753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775
/*
 * Check whether the framebuffer's pixel format can be used with FBC:
 * XRGB8888/XBGR8888 always, XRGB1555/RGB565 except on gen2 and G4X, and
 * nothing else.
 */
static bool pixel_format_is_valid(struct drm_framebuffer *fb)
{
	/* Use dev_priv for every platform check, like the rest of the file. */
	struct drm_i915_private *dev_priv = fb->dev->dev_private;

	switch (fb->pixel_format) {
	case DRM_FORMAT_XRGB8888:
	case DRM_FORMAT_XBGR8888:
		return true;
	case DRM_FORMAT_XRGB1555:
	case DRM_FORMAT_RGB565:
		/* 16bpp not supported on gen2 */
		if (IS_GEN2(dev_priv))
			return false;
		/* WaFbcOnly1to1Ratio:ctg */
		if (IS_G4X(dev_priv))
			return false;
		return true;
	default:
		return false;
	}
}

776 777 778 779 780 781 782
/*
 * For some reason, the hardware tracking starts looking at whatever we
 * programmed as the display plane base address register. It does not look at
 * the X and Y offset registers. That's why we look at the crtc->adjusted{x,y}
 * variables instead of just looking at the pipe/plane size.
 */
static bool intel_fbc_hw_tracking_covers_screen(struct intel_crtc *crtc)
783 784
{
	struct drm_i915_private *dev_priv = crtc->base.dev->dev_private;
785
	unsigned int effective_w, effective_h, max_w, max_h;
786 787 788 789 790 791 792 793 794 795 796 797

	if (INTEL_INFO(dev_priv)->gen >= 8 || IS_HASWELL(dev_priv)) {
		max_w = 4096;
		max_h = 4096;
	} else if (IS_G4X(dev_priv) || INTEL_INFO(dev_priv)->gen >= 5) {
		max_w = 4096;
		max_h = 2048;
	} else {
		max_w = 2048;
		max_h = 1536;
	}

798 799 800 801 802
	intel_fbc_get_plane_source_size(crtc, &effective_w, &effective_h);
	effective_w += crtc->adjusted_x;
	effective_h += crtc->adjusted_y;

	return effective_w <= max_w && effective_h <= max_h;
803 804
}

805
/**
P
Paulo Zanoni 已提交
806
 * __intel_fbc_update - enable/disable FBC as needed, unlocked
807
 * @dev_priv: i915 device instance
808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823
 *
 * Set up the framebuffer compression hardware at mode set time.  We
 * enable it if possible:
 *   - plane A only (on pre-965)
 *   - no pixel multiply/line duplication
 *   - no alpha buffer discard
 *   - no dual wide
 *   - framebuffer <= max_hdisplay in width, max_vdisplay in height
 *
 * We can't assume that any compression will take place (worst case),
 * so the compressed buffer has to be the same size as the uncompressed
 * one.  It also must reside (along with the line length buffer) in
 * stolen memory.
 *
 * We need to enable/disable FBC on a global basis.
 */
824
static void __intel_fbc_update(struct drm_i915_private *dev_priv)
825
{
826 827
	struct drm_crtc *drm_crtc = NULL;
	struct intel_crtc *crtc;
828 829 830 831
	struct drm_framebuffer *fb;
	struct drm_i915_gem_object *obj;
	const struct drm_display_mode *adjusted_mode;

P
Paulo Zanoni 已提交
832 833
	WARN_ON(!mutex_is_locked(&dev_priv->fbc.lock));

834
	/* disable framebuffer compression in vGPU */
835
	if (intel_vgpu_active(dev_priv->dev))
836 837
		i915.enable_fbc = 0;

838
	if (i915.enable_fbc < 0) {
839
		set_no_fbc_reason(dev_priv, "disabled per chip default");
840 841 842
		goto out_disable;
	}

R
Rodrigo Vivi 已提交
843
	if (!i915.enable_fbc) {
844
		set_no_fbc_reason(dev_priv, "disabled per module param");
845
		goto out_disable;
846 847 848 849 850 851 852 853 854 855 856
	}

	/*
	 * If FBC is already on, we just have to verify that we can
	 * keep it that way...
	 * Need to disable if:
	 *   - more than one pipe is active
	 *   - changing FBC params (stride, fence, mode)
	 *   - new fb is too large to fit in compressed buffer
	 *   - going to an unsupported config (interlace, pixel multiply, etc.)
	 */
857 858
	drm_crtc = intel_fbc_find_crtc(dev_priv);
	if (!drm_crtc) {
859
		set_no_fbc_reason(dev_priv, "no output");
860
		goto out_disable;
861
	}
862

863
	if (!multiple_pipes_ok(dev_priv)) {
864
		set_no_fbc_reason(dev_priv, "more than one pipe active");
865 866 867
		goto out_disable;
	}

868 869
	crtc = to_intel_crtc(drm_crtc);
	fb = crtc->base.primary->fb;
870
	obj = intel_fb_obj(fb);
871
	adjusted_mode = &crtc->config->base.adjusted_mode;
872 873 874

	if ((adjusted_mode->flags & DRM_MODE_FLAG_INTERLACE) ||
	    (adjusted_mode->flags & DRM_MODE_FLAG_DBLSCAN)) {
875
		set_no_fbc_reason(dev_priv, "incompatible mode");
876 877 878
		goto out_disable;
	}

879
	if (!intel_fbc_hw_tracking_covers_screen(crtc)) {
880
		set_no_fbc_reason(dev_priv, "mode too large for compression");
881 882
		goto out_disable;
	}
883

884
	if ((INTEL_INFO(dev_priv)->gen < 4 || HAS_DDI(dev_priv)) &&
885
	    crtc->plane != PLANE_A) {
886
		set_no_fbc_reason(dev_priv, "FBC unsupported on plane");
887 888 889 890 891 892 893 894
		goto out_disable;
	}

	/* The use of a CPU fence is mandatory in order to detect writes
	 * by the CPU to the scanout and trigger updates to the FBC.
	 */
	if (obj->tiling_mode != I915_TILING_X ||
	    obj->fence_reg == I915_FENCE_REG_NONE) {
895
		set_no_fbc_reason(dev_priv, "framebuffer not tiled or fenced");
896 897
		goto out_disable;
	}
898
	if (INTEL_INFO(dev_priv)->gen <= 4 && !IS_G4X(dev_priv) &&
899
	    crtc->base.primary->state->rotation != BIT(DRM_ROTATE_0)) {
900
		set_no_fbc_reason(dev_priv, "rotation unsupported");
901 902 903
		goto out_disable;
	}

904
	if (!stride_is_valid(dev_priv, fb->pitches[0])) {
905
		set_no_fbc_reason(dev_priv, "framebuffer stride not supported");
906 907 908
		goto out_disable;
	}

909
	if (!pixel_format_is_valid(fb)) {
910
		set_no_fbc_reason(dev_priv, "pixel format is invalid");
911 912 913
		goto out_disable;
	}

914
	/* If the kernel debugger is active, always disable compression */
915
	if (in_dbg_master()) {
916
		set_no_fbc_reason(dev_priv, "Kernel debugger is active");
917
		goto out_disable;
918
	}
919

920 921
	/* WaFbcExceedCdClockThreshold:hsw,bdw */
	if ((IS_HASWELL(dev_priv) || IS_BROADWELL(dev_priv)) &&
922
	    ilk_pipe_pixel_rate(crtc->config) >=
923
	    dev_priv->cdclk_freq * 95 / 100) {
924
		set_no_fbc_reason(dev_priv, "pixel rate is too big");
925 926 927
		goto out_disable;
	}

928
	if (intel_fbc_setup_cfb(crtc)) {
929
		set_no_fbc_reason(dev_priv, "not enough stolen memory");
930 931 932 933 934 935 936 937
		goto out_disable;
	}

	/* If the scanout has not changed, don't modify the FBC settings.
	 * Note that we make the fundamental assumption that the fb->obj
	 * cannot be unpinned (and have its GTT offset and fence revoked)
	 * without first being decoupled from the scanout and FBC disabled.
	 */
938
	if (dev_priv->fbc.crtc == crtc &&
939
	    dev_priv->fbc.fb_id == fb->base.id &&
940
	    dev_priv->fbc.y == crtc->base.y)
941 942
		return;

943
	if (intel_fbc_enabled(dev_priv)) {
944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967
		/* We update FBC along two paths, after changing fb/crtc
		 * configuration (modeswitching) and after page-flipping
		 * finishes. For the latter, we know that not only did
		 * we disable the FBC at the start of the page-flip
		 * sequence, but also more than one vblank has passed.
		 *
		 * For the former case of modeswitching, it is possible
		 * to switch between two FBC valid configurations
		 * instantaneously so we do need to disable the FBC
		 * before we can modify its control registers. We also
		 * have to wait for the next vblank for that to take
		 * effect. However, since we delay enabling FBC we can
		 * assume that a vblank has passed since disabling and
		 * that we can safely alter the registers in the deferred
		 * callback.
		 *
		 * In the scenario that we go from a valid to invalid
		 * and then back to valid FBC configuration we have
		 * no strict enforcement that a vblank occurred since
		 * disabling the FBC. However, along all current pipe
		 * disabling paths we do need to wait for a vblank at
		 * some point. And we wait before enabling FBC anyway.
		 */
		DRM_DEBUG_KMS("disabling active FBC for update\n");
968
		__intel_fbc_disable(dev_priv);
969 970
	}

971
	intel_fbc_schedule_enable(crtc);
972
	dev_priv->fbc.no_fbc_reason = "FBC enabled (not necessarily active)";
973 974 975 976
	return;

out_disable:
	/* Multiple disables should be harmless */
977
	if (intel_fbc_enabled(dev_priv)) {
978
		DRM_DEBUG_KMS("unsupported config, disabling FBC\n");
979
		__intel_fbc_disable(dev_priv);
980
	}
981
	__intel_fbc_cleanup_cfb(dev_priv);
P
Paulo Zanoni 已提交
982 983 984 985
}

/**
 * intel_fbc_update - enable/disable FBC as needed
986
 * @dev_priv: i915 device instance
P
Paulo Zanoni 已提交
987 988 989
 *
 * This function reevaluates the overall state and enables or disables FBC.
 */
990
void intel_fbc_update(struct drm_i915_private *dev_priv)
P
Paulo Zanoni 已提交
991
{
P
Paulo Zanoni 已提交
992
	if (!fbc_supported(dev_priv))
993 994
		return;

P
Paulo Zanoni 已提交
995
	mutex_lock(&dev_priv->fbc.lock);
996
	__intel_fbc_update(dev_priv);
P
Paulo Zanoni 已提交
997
	mutex_unlock(&dev_priv->fbc.lock);
998 999
}

1000 1001 1002 1003 1004 1005
void intel_fbc_invalidate(struct drm_i915_private *dev_priv,
			  unsigned int frontbuffer_bits,
			  enum fb_op_origin origin)
{
	unsigned int fbc_bits;

P
Paulo Zanoni 已提交
1006
	if (!fbc_supported(dev_priv))
1007 1008
		return;

1009 1010 1011
	if (origin == ORIGIN_GTT)
		return;

P
Paulo Zanoni 已提交
1012 1013
	mutex_lock(&dev_priv->fbc.lock);

1014 1015 1016 1017
	if (dev_priv->fbc.enabled)
		fbc_bits = INTEL_FRONTBUFFER_PRIMARY(dev_priv->fbc.crtc->pipe);
	else if (dev_priv->fbc.fbc_work)
		fbc_bits = INTEL_FRONTBUFFER_PRIMARY(
1018
					dev_priv->fbc.fbc_work->crtc->pipe);
1019 1020 1021 1022 1023 1024
	else
		fbc_bits = dev_priv->fbc.possible_framebuffer_bits;

	dev_priv->fbc.busy_bits |= (fbc_bits & frontbuffer_bits);

	if (dev_priv->fbc.busy_bits)
1025
		__intel_fbc_disable(dev_priv);
P
Paulo Zanoni 已提交
1026 1027

	mutex_unlock(&dev_priv->fbc.lock);
1028 1029 1030
}

void intel_fbc_flush(struct drm_i915_private *dev_priv,
1031
		     unsigned int frontbuffer_bits, enum fb_op_origin origin)
1032
{
P
Paulo Zanoni 已提交
1033
	if (!fbc_supported(dev_priv))
1034 1035
		return;

1036 1037
	if (origin == ORIGIN_GTT)
		return;
P
Paulo Zanoni 已提交
1038

1039
	mutex_lock(&dev_priv->fbc.lock);
1040 1041 1042

	dev_priv->fbc.busy_bits &= ~frontbuffer_bits;

1043 1044
	if (!dev_priv->fbc.busy_bits) {
		__intel_fbc_disable(dev_priv);
1045
		__intel_fbc_update(dev_priv);
1046
	}
P
Paulo Zanoni 已提交
1047 1048

	mutex_unlock(&dev_priv->fbc.lock);
1049 1050
}

R
Rodrigo Vivi 已提交
1051 1052 1053 1054 1055 1056
/**
 * intel_fbc_init - Initialize FBC
 * @dev_priv: the i915 device
 *
 * This function might be called during PM init process.
 */
1057 1058
void intel_fbc_init(struct drm_i915_private *dev_priv)
{
1059 1060
	enum pipe pipe;

P
Paulo Zanoni 已提交
1061 1062
	mutex_init(&dev_priv->fbc.lock);

1063 1064
	if (!HAS_FBC(dev_priv)) {
		dev_priv->fbc.enabled = false;
1065
		dev_priv->fbc.no_fbc_reason = "unsupported by this chipset";
1066 1067 1068
		return;
	}

1069 1070 1071 1072
	for_each_pipe(dev_priv, pipe) {
		dev_priv->fbc.possible_framebuffer_bits |=
				INTEL_FRONTBUFFER_PRIMARY(pipe);

1073
		if (fbc_on_pipe_a_only(dev_priv))
1074 1075 1076
			break;
	}

1077
	if (INTEL_INFO(dev_priv)->gen >= 7) {
1078 1079 1080
		dev_priv->fbc.fbc_enabled = ilk_fbc_enabled;
		dev_priv->fbc.enable_fbc = gen7_fbc_enable;
		dev_priv->fbc.disable_fbc = ilk_fbc_disable;
1081
	} else if (INTEL_INFO(dev_priv)->gen >= 5) {
1082 1083 1084
		dev_priv->fbc.fbc_enabled = ilk_fbc_enabled;
		dev_priv->fbc.enable_fbc = ilk_fbc_enable;
		dev_priv->fbc.disable_fbc = ilk_fbc_disable;
1085
	} else if (IS_GM45(dev_priv)) {
1086 1087 1088
		dev_priv->fbc.fbc_enabled = g4x_fbc_enabled;
		dev_priv->fbc.enable_fbc = g4x_fbc_enable;
		dev_priv->fbc.disable_fbc = g4x_fbc_disable;
1089
	} else {
1090 1091 1092
		dev_priv->fbc.fbc_enabled = i8xx_fbc_enabled;
		dev_priv->fbc.enable_fbc = i8xx_fbc_enable;
		dev_priv->fbc.disable_fbc = i8xx_fbc_disable;
1093 1094 1095 1096 1097

		/* This value was pulled out of someone's hat */
		I915_WRITE(FBC_CONTROL, 500 << FBC_CTL_INTERVAL_SHIFT);
	}

1098
	dev_priv->fbc.enabled = dev_priv->fbc.fbc_enabled(dev_priv);
1099
}