intel_uncore.c 44.2 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/*
 * Copyright © 2013 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */

#include "i915_drv.h"
#include "intel_drv.h"
26
#include "i915_vgpu.h"
27

28 29
#include <linux/pm_runtime.h>

30
#define FORCEWAKE_ACK_TIMEOUT_MS 50
31

32
#define __raw_posting_read(dev_priv__, reg__) (void)__raw_i915_read32((dev_priv__), (reg__))
33

34 35 36 37 38 39 40
static const char * const forcewake_domain_names[] = {
	"render",
	"blitter",
	"media",
};

const char *
41
intel_uncore_forcewake_domain_to_str(const enum forcewake_domain_id id)
42
{
43
	BUILD_BUG_ON(ARRAY_SIZE(forcewake_domain_names) != FW_DOMAIN_ID_COUNT);
44 45 46 47 48 49 50 51 52 53 54

	if (id >= 0 && id < FW_DOMAIN_ID_COUNT)
		return forcewake_domain_names[id];

	WARN_ON(id);

	return "unknown";
}

static inline void
fw_domain_reset(const struct intel_uncore_forcewake_domain *d)
55
{
56
	WARN_ON(!i915_mmio_reg_valid(d->reg_set));
57
	__raw_i915_write32(d->i915, d->reg_set, d->val_reset);
58 59
}

60 61
static inline void
fw_domain_arm_timer(struct intel_uncore_forcewake_domain *d)
62
{
63
	mod_timer_pinned(&d->timer, jiffies + 1);
64 65
}

66 67
static inline void
fw_domain_wait_ack_clear(const struct intel_uncore_forcewake_domain *d)
68
{
69 70
	if (wait_for_atomic((__raw_i915_read32(d->i915, d->reg_ack) &
			     FORCEWAKE_KERNEL) == 0,
71
			    FORCEWAKE_ACK_TIMEOUT_MS))
72 73 74
		DRM_ERROR("%s: timed out waiting for forcewake ack to clear.\n",
			  intel_uncore_forcewake_domain_to_str(d->id));
}
75

76 77 78 79 80
static inline void
fw_domain_get(const struct intel_uncore_forcewake_domain *d)
{
	__raw_i915_write32(d->i915, d->reg_set, d->val_set);
}
81

82 83 84 85 86
static inline void
fw_domain_wait_ack(const struct intel_uncore_forcewake_domain *d)
{
	if (wait_for_atomic((__raw_i915_read32(d->i915, d->reg_ack) &
			     FORCEWAKE_KERNEL),
87
			    FORCEWAKE_ACK_TIMEOUT_MS))
88 89 90
		DRM_ERROR("%s: timed out waiting for forcewake ack request.\n",
			  intel_uncore_forcewake_domain_to_str(d->id));
}
91

92 93 94 95
static inline void
fw_domain_put(const struct intel_uncore_forcewake_domain *d)
{
	__raw_i915_write32(d->i915, d->reg_set, d->val_clear);
96 97
}

98 99
static inline void
fw_domain_posting_read(const struct intel_uncore_forcewake_domain *d)
100
{
101
	/* something from same cacheline, but not from the set register */
102
	if (i915_mmio_reg_valid(d->reg_post))
103
		__raw_posting_read(d->i915, d->reg_post);
104 105
}

106
static void
107
fw_domains_get(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
108
{
109
	struct intel_uncore_forcewake_domain *d;
110
	enum forcewake_domain_id id;
111

112 113 114 115 116 117
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id) {
		fw_domain_wait_ack_clear(d);
		fw_domain_get(d);
		fw_domain_wait_ack(d);
	}
}
118

119
static void
120
fw_domains_put(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
121 122
{
	struct intel_uncore_forcewake_domain *d;
123
	enum forcewake_domain_id id;
124

125 126 127 128 129
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id) {
		fw_domain_put(d);
		fw_domain_posting_read(d);
	}
}
130

131 132 133 134
static void
fw_domains_posting_read(struct drm_i915_private *dev_priv)
{
	struct intel_uncore_forcewake_domain *d;
135
	enum forcewake_domain_id id;
136 137 138 139 140 141 142 143 144

	/* No need to do for all, just do for first found */
	for_each_fw_domain(d, dev_priv, id) {
		fw_domain_posting_read(d);
		break;
	}
}

static void
145
fw_domains_reset(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
146 147
{
	struct intel_uncore_forcewake_domain *d;
148
	enum forcewake_domain_id id;
149

150 151
	if (dev_priv->uncore.fw_domains == 0)
		return;
152

153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id)
		fw_domain_reset(d);

	fw_domains_posting_read(dev_priv);
}

static void __gen6_gt_wait_for_thread_c0(struct drm_i915_private *dev_priv)
{
	/* w/a for a sporadic read returning 0 by waiting for the GT
	 * thread to wake up.
	 */
	if (wait_for_atomic_us((__raw_i915_read32(dev_priv, GEN6_GT_THREAD_STATUS_REG) &
				GEN6_GT_THREAD_STATUS_CORE_MASK) == 0, 500))
		DRM_ERROR("GT thread status wait timed out\n");
}

static void fw_domains_get_with_thread_status(struct drm_i915_private *dev_priv,
170
					      enum forcewake_domains fw_domains)
171 172
{
	fw_domains_get(dev_priv, fw_domains);
173

174
	/* WaRsForcewakeWaitTC0:snb,ivb,hsw,bdw,vlv */
175
	__gen6_gt_wait_for_thread_c0(dev_priv);
176 177 178 179 180
}

static void gen6_gt_check_fifodbg(struct drm_i915_private *dev_priv)
{
	u32 gtfifodbg;
181 182

	gtfifodbg = __raw_i915_read32(dev_priv, GTFIFODBG);
183 184
	if (WARN(gtfifodbg, "GT wake FIFO error 0x%x\n", gtfifodbg))
		__raw_i915_write32(dev_priv, GTFIFODBG, gtfifodbg);
185 186
}

187
static void fw_domains_put_with_fifo(struct drm_i915_private *dev_priv,
188
				     enum forcewake_domains fw_domains)
189
{
190
	fw_domains_put(dev_priv, fw_domains);
191 192 193
	gen6_gt_check_fifodbg(dev_priv);
}

194 195 196 197 198 199 200
static inline u32 fifo_free_entries(struct drm_i915_private *dev_priv)
{
	u32 count = __raw_i915_read32(dev_priv, GTFIFOCTL);

	return count & GT_FIFO_FREE_ENTRIES_MASK;
}

201 202 203 204
static int __gen6_gt_wait_for_fifo(struct drm_i915_private *dev_priv)
{
	int ret = 0;

205 206 207
	/* On VLV, FIFO will be shared by both SW and HW.
	 * So, we need to read the FREE_ENTRIES everytime */
	if (IS_VALLEYVIEW(dev_priv->dev))
208
		dev_priv->uncore.fifo_count = fifo_free_entries(dev_priv);
209

210 211
	if (dev_priv->uncore.fifo_count < GT_FIFO_NUM_RESERVED_ENTRIES) {
		int loop = 500;
212 213
		u32 fifo = fifo_free_entries(dev_priv);

214 215
		while (fifo <= GT_FIFO_NUM_RESERVED_ENTRIES && loop--) {
			udelay(10);
216
			fifo = fifo_free_entries(dev_priv);
217 218 219 220 221 222 223 224 225 226
		}
		if (WARN_ON(loop < 0 && fifo <= GT_FIFO_NUM_RESERVED_ENTRIES))
			++ret;
		dev_priv->uncore.fifo_count = fifo;
	}
	dev_priv->uncore.fifo_count--;

	return ret;
}

227
static void intel_uncore_fw_release_timer(unsigned long arg)
Z
Zhe Wang 已提交
228
{
229 230
	struct intel_uncore_forcewake_domain *domain = (void *)arg;
	unsigned long irqflags;
Z
Zhe Wang 已提交
231

232
	assert_rpm_device_not_suspended(domain->i915);
Z
Zhe Wang 已提交
233

234 235 236 237 238 239 240 241 242
	spin_lock_irqsave(&domain->i915->uncore.lock, irqflags);
	if (WARN_ON(domain->wake_count == 0))
		domain->wake_count++;

	if (--domain->wake_count == 0)
		domain->i915->uncore.funcs.force_wake_put(domain->i915,
							  1 << domain->id);

	spin_unlock_irqrestore(&domain->i915->uncore.lock, irqflags);
Z
Zhe Wang 已提交
243 244
}

245
void intel_uncore_forcewake_reset(struct drm_device *dev, bool restore)
Z
Zhe Wang 已提交
246
{
247
	struct drm_i915_private *dev_priv = dev->dev_private;
248
	unsigned long irqflags;
249
	struct intel_uncore_forcewake_domain *domain;
250 251 252
	int retry_count = 100;
	enum forcewake_domain_id id;
	enum forcewake_domains fw = 0, active_domains;
Z
Zhe Wang 已提交
253

254 255 256 257 258 259
	/* Hold uncore.lock across reset to prevent any register access
	 * with forcewake not set correctly. Wait until all pending
	 * timers are run before holding.
	 */
	while (1) {
		active_domains = 0;
Z
Zhe Wang 已提交
260

261 262 263
		for_each_fw_domain(domain, dev_priv, id) {
			if (del_timer_sync(&domain->timer) == 0)
				continue;
Z
Zhe Wang 已提交
264

265
			intel_uncore_fw_release_timer((unsigned long)domain);
266
		}
267

268
		spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
269

270 271 272 273
		for_each_fw_domain(domain, dev_priv, id) {
			if (timer_pending(&domain->timer))
				active_domains |= (1 << id);
		}
274

275 276
		if (active_domains == 0)
			break;
277

278 279 280 281
		if (--retry_count == 0) {
			DRM_ERROR("Timed out waiting for forcewake timers to finish\n");
			break;
		}
282

283 284 285
		spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
		cond_resched();
	}
286

287 288 289 290 291 292 293 294
	WARN_ON(active_domains);

	for_each_fw_domain(domain, dev_priv, id)
		if (domain->wake_count)
			fw |= 1 << id;

	if (fw)
		dev_priv->uncore.funcs.force_wake_put(dev_priv, fw);
295

296
	fw_domains_reset(dev_priv, FORCEWAKE_ALL);
Z
Zhe Wang 已提交
297

298 299 300 301 302 303
	if (restore) { /* If reset with a user forcewake, try to restore */
		if (fw)
			dev_priv->uncore.funcs.force_wake_get(dev_priv, fw);

		if (IS_GEN6(dev) || IS_GEN7(dev))
			dev_priv->uncore.fifo_count =
304
				fifo_free_entries(dev_priv);
305 306
	}

307
	if (!restore)
308
		assert_forcewakes_inactive(dev_priv);
309

310
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
311 312
}

313
static void intel_uncore_ellc_detect(struct drm_device *dev)
314 315 316
{
	struct drm_i915_private *dev_priv = dev->dev_private;

317 318
	if ((IS_HASWELL(dev) || IS_BROADWELL(dev) ||
	     INTEL_INFO(dev)->gen >= 9) &&
319
	    (__raw_i915_read32(dev_priv, HSW_EDRAM_PRESENT) & EDRAM_ENABLED)) {
320 321 322 323 324 325 326 327
		/* The docs do not explain exactly how the calculation can be
		 * made. It is somewhat guessable, but for now, it's always
		 * 128MB.
		 * NB: We can't write IDICR yet because we do not have gt funcs
		 * set up */
		dev_priv->ellc_size = 128;
		DRM_INFO("Found %zuMB of eLLC\n", dev_priv->ellc_size);
	}
328 329
}

330
static bool
331
fpga_check_for_unclaimed_mmio(struct drm_i915_private *dev_priv)
332 333 334 335 336 337 338 339 340 341 342 343
{
	u32 dbg;

	dbg = __raw_i915_read32(dev_priv, FPGA_DBG);
	if (likely(!(dbg & FPGA_DBG_RM_NOCLAIM)))
		return false;

	__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);

	return true;
}

344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369
static bool
vlv_check_for_unclaimed_mmio(struct drm_i915_private *dev_priv)
{
	u32 cer;

	cer = __raw_i915_read32(dev_priv, CLAIM_ER);
	if (likely(!(cer & (CLAIM_ER_OVERFLOW | CLAIM_ER_CTR_MASK))))
		return false;

	__raw_i915_write32(dev_priv, CLAIM_ER, CLAIM_ER_CLR);

	return true;
}

static bool
check_for_unclaimed_mmio(struct drm_i915_private *dev_priv)
{
	if (HAS_FPGA_DBG_UNCLAIMED(dev_priv))
		return fpga_check_for_unclaimed_mmio(dev_priv);

	if (IS_VALLEYVIEW(dev_priv) || IS_CHERRYVIEW(dev_priv))
		return vlv_check_for_unclaimed_mmio(dev_priv);

	return false;
}

370 371 372 373 374
static void __intel_uncore_early_sanitize(struct drm_device *dev,
					  bool restore_forcewake)
{
	struct drm_i915_private *dev_priv = dev->dev_private;

375 376 377
	/* clear out unclaimed reg detection bit */
	if (check_for_unclaimed_mmio(dev_priv))
		DRM_DEBUG("unclaimed mmio detected on uncore init, clearing\n");
378

379 380 381 382 383
	/* clear out old GT FIFO errors */
	if (IS_GEN6(dev) || IS_GEN7(dev))
		__raw_i915_write32(dev_priv, GTFIFODBG,
				   __raw_i915_read32(dev_priv, GTFIFODBG));

384 385 386 387 388 389 390 391
	/* WaDisableShadowRegForCpd:chv */
	if (IS_CHERRYVIEW(dev)) {
		__raw_i915_write32(dev_priv, GTFIFOCTL,
				   __raw_i915_read32(dev_priv, GTFIFOCTL) |
				   GT_FIFO_CTL_BLOCK_ALL_POLICY_STALL |
				   GT_FIFO_CTL_RC6_POLICY_STALL);
	}

392
	intel_uncore_forcewake_reset(dev, restore_forcewake);
393 394
}

395 396 397 398 399 400
void intel_uncore_early_sanitize(struct drm_device *dev, bool restore_forcewake)
{
	__intel_uncore_early_sanitize(dev, restore_forcewake);
	i915_check_and_clear_faults(dev);
}

401 402
void intel_uncore_sanitize(struct drm_device *dev)
{
403 404
	i915.enable_rc6 = sanitize_rc6_option(dev, i915.enable_rc6);

405 406 407 408
	/* BIOS often leaves RC6 enabled, but disable it for hw init */
	intel_disable_gt_powersave(dev);
}

409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428
static void __intel_uncore_forcewake_get(struct drm_i915_private *dev_priv,
					 enum forcewake_domains fw_domains)
{
	struct intel_uncore_forcewake_domain *domain;
	enum forcewake_domain_id id;

	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

	fw_domains &= dev_priv->uncore.fw_domains;

	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
		if (domain->wake_count++)
			fw_domains &= ~(1 << id);
	}

	if (fw_domains)
		dev_priv->uncore.funcs.force_wake_get(dev_priv, fw_domains);
}

429 430 431 432 433 434 435 436 437 438 439 440
/**
 * intel_uncore_forcewake_get - grab forcewake domain references
 * @dev_priv: i915 device instance
 * @fw_domains: forcewake domains to get reference on
 *
 * This function can be used get GT's forcewake domain references.
 * Normal register access will handle the forcewake domains automatically.
 * However if some sequence requires the GT to not power down a particular
 * forcewake domains this function should be called at the beginning of the
 * sequence. And subsequently the reference should be dropped by symmetric
 * call to intel_unforce_forcewake_put(). Usually caller wants all the domains
 * to be kept awake so the @fw_domains would be then FORCEWAKE_ALL.
441
 */
442
void intel_uncore_forcewake_get(struct drm_i915_private *dev_priv,
443
				enum forcewake_domains fw_domains)
444 445 446
{
	unsigned long irqflags;

447 448 449
	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

450
	assert_rpm_wakelock_held(dev_priv);
451

452
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
453
	__intel_uncore_forcewake_get(dev_priv, fw_domains);
454 455 456
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
}

457
/**
458
 * intel_uncore_forcewake_get__locked - grab forcewake domain references
459
 * @dev_priv: i915 device instance
460
 * @fw_domains: forcewake domains to get reference on
461
 *
462 463
 * See intel_uncore_forcewake_get(). This variant places the onus
 * on the caller to explicitly handle the dev_priv->uncore.lock spinlock.
464
 */
465 466 467 468 469 470 471 472 473 474 475 476 477
void intel_uncore_forcewake_get__locked(struct drm_i915_private *dev_priv,
					enum forcewake_domains fw_domains)
{
	assert_spin_locked(&dev_priv->uncore.lock);

	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

	__intel_uncore_forcewake_get(dev_priv, fw_domains);
}

static void __intel_uncore_forcewake_put(struct drm_i915_private *dev_priv,
					 enum forcewake_domains fw_domains)
478
{
479
	struct intel_uncore_forcewake_domain *domain;
480
	enum forcewake_domain_id id;
481

482 483 484
	if (!dev_priv->uncore.funcs.force_wake_put)
		return;

485 486 487 488 489 490 491 492 493 494
	fw_domains &= dev_priv->uncore.fw_domains;

	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
		if (WARN_ON(domain->wake_count == 0))
			continue;

		if (--domain->wake_count)
			continue;

		domain->wake_count++;
495
		fw_domain_arm_timer(domain);
496
	}
497
}
498

499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516
/**
 * intel_uncore_forcewake_put - release a forcewake domain reference
 * @dev_priv: i915 device instance
 * @fw_domains: forcewake domains to put references
 *
 * This function drops the device-level forcewakes for specified
 * domains obtained by intel_uncore_forcewake_get().
 */
void intel_uncore_forcewake_put(struct drm_i915_private *dev_priv,
				enum forcewake_domains fw_domains)
{
	unsigned long irqflags;

	if (!dev_priv->uncore.funcs.force_wake_put)
		return;

	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
	__intel_uncore_forcewake_put(dev_priv, fw_domains);
517 518 519
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
}

520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538
/**
 * intel_uncore_forcewake_put__locked - grab forcewake domain references
 * @dev_priv: i915 device instance
 * @fw_domains: forcewake domains to get reference on
 *
 * See intel_uncore_forcewake_put(). This variant places the onus
 * on the caller to explicitly handle the dev_priv->uncore.lock spinlock.
 */
void intel_uncore_forcewake_put__locked(struct drm_i915_private *dev_priv,
					enum forcewake_domains fw_domains)
{
	assert_spin_locked(&dev_priv->uncore.lock);

	if (!dev_priv->uncore.funcs.force_wake_put)
		return;

	__intel_uncore_forcewake_put(dev_priv, fw_domains);
}

539
void assert_forcewakes_inactive(struct drm_i915_private *dev_priv)
540
{
541
	struct intel_uncore_forcewake_domain *domain;
542
	enum forcewake_domain_id id;
543

544 545 546
	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

547
	for_each_fw_domain(domain, dev_priv, id)
548
		WARN_ON(domain->wake_count);
549 550
}

551
/* We give fast paths for the really cool registers */
552
#define NEEDS_FORCE_WAKE(reg) ((reg) < 0x40000)
553

554
#define REG_RANGE(reg, start, end) ((reg) >= (start) && (reg) < (end))
555

556 557 558 559 560 561 562 563 564 565 566 567 568
#define FORCEWAKE_VLV_RENDER_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x2000, 0x4000) || \
	 REG_RANGE((reg), 0x5000, 0x8000) || \
	 REG_RANGE((reg), 0xB000, 0x12000) || \
	 REG_RANGE((reg), 0x2E000, 0x30000))

#define FORCEWAKE_VLV_MEDIA_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x22000, 0x24000) || \
	 REG_RANGE((reg), 0x30000, 0x40000))

#define FORCEWAKE_CHV_RENDER_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x2000, 0x4000) || \
569
	 REG_RANGE((reg), 0x5200, 0x8000) || \
570
	 REG_RANGE((reg), 0x8300, 0x8500) || \
571
	 REG_RANGE((reg), 0xB000, 0xB480) || \
572 573 574 575 576 577 578 579
	 REG_RANGE((reg), 0xE000, 0xE800))

#define FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x8800, 0x8900) || \
	 REG_RANGE((reg), 0xD000, 0xD800) || \
	 REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x1A000, 0x1C000) || \
	 REG_RANGE((reg), 0x1E800, 0x1EA00) || \
580
	 REG_RANGE((reg), 0x30000, 0x38000))
581 582 583 584 585 586

#define FORCEWAKE_CHV_COMMON_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x4000, 0x5000) || \
	 REG_RANGE((reg), 0x8000, 0x8300) || \
	 REG_RANGE((reg), 0x8500, 0x8600) || \
	 REG_RANGE((reg), 0x9000, 0xB000) || \
587
	 REG_RANGE((reg), 0xF000, 0x10000))
588

589
#define FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg) \
590
	REG_RANGE((reg), 0xB00,  0x2000)
591 592

#define FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg) \
593 594
	(REG_RANGE((reg), 0x2000, 0x2700) || \
	 REG_RANGE((reg), 0x3000, 0x4000) || \
595
	 REG_RANGE((reg), 0x5200, 0x8000) || \
596
	 REG_RANGE((reg), 0x8140, 0x8160) || \
597 598 599
	 REG_RANGE((reg), 0x8300, 0x8500) || \
	 REG_RANGE((reg), 0x8C00, 0x8D00) || \
	 REG_RANGE((reg), 0xB000, 0xB480) || \
600 601
	 REG_RANGE((reg), 0xE000, 0xE900) || \
	 REG_RANGE((reg), 0x24400, 0x24800))
602 603

#define FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg) \
604 605
	(REG_RANGE((reg), 0x8130, 0x8140) || \
	 REG_RANGE((reg), 0x8800, 0x8A00) || \
606 607 608 609 610 611 612 613 614
	 REG_RANGE((reg), 0xD000, 0xD800) || \
	 REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x1A000, 0x1EA00) || \
	 REG_RANGE((reg), 0x30000, 0x40000))

#define FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg) \
	REG_RANGE((reg), 0x9400, 0x9800)

#define FORCEWAKE_GEN9_BLITTER_RANGE_OFFSET(reg) \
615
	((reg) < 0x40000 && \
616 617 618 619 620
	 !FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg))

621 622 623 624 625 626
static void
ilk_dummy_write(struct drm_i915_private *dev_priv)
{
	/* WaIssueDummyWriteToWakeupFromRC6:ilk Issue a dummy write to wake up
	 * the chip from rc6 before touching it for real. MI_MODE is masked,
	 * hence harmless to write 0 into. */
627
	__raw_i915_write32(dev_priv, MI_MODE, 0);
628 629 630
}

static void
631 632 633 634
__unclaimed_reg_debug(struct drm_i915_private *dev_priv,
		      const i915_reg_t reg,
		      const bool read,
		      const bool before)
635
{
636 637 638 639 640 641 642 643 644
	/* XXX. We limit the auto arming traces for mmio
	 * debugs on these platforms. There are just too many
	 * revealed by these and CI/Bat suffers from the noise.
	 * Please fix and then re-enable the automatic traces.
	 */
	if (i915.mmio_debug < 2 &&
	    (IS_VALLEYVIEW(dev_priv) || IS_CHERRYVIEW(dev_priv)))
		return;

645 646 647 648 649
	if (WARN(check_for_unclaimed_mmio(dev_priv),
		 "Unclaimed register detected %s %s register 0x%x\n",
		 before ? "before" : "after",
		 read ? "reading" : "writing to",
		 i915_mmio_reg_offset(reg)))
650
		i915.mmio_debug--; /* Only report the first N failures */
651 652
}

653 654 655 656 657 658 659 660 661 662 663 664
static inline void
unclaimed_reg_debug(struct drm_i915_private *dev_priv,
		    const i915_reg_t reg,
		    const bool read,
		    const bool before)
{
	if (likely(!i915.mmio_debug))
		return;

	__unclaimed_reg_debug(dev_priv, reg, read, before);
}

665
#define GEN2_READ_HEADER(x) \
B
Ben Widawsky 已提交
666
	u##x val = 0; \
667
	assert_rpm_wakelock_held(dev_priv);
B
Ben Widawsky 已提交
668

669
#define GEN2_READ_FOOTER \
B
Ben Widawsky 已提交
670 671 672
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

673
#define __gen2_read(x) \
674
static u##x \
675
gen2_read##x(struct drm_i915_private *dev_priv, i915_reg_t reg, bool trace) { \
676
	GEN2_READ_HEADER(x); \
677
	val = __raw_i915_read##x(dev_priv, reg); \
678
	GEN2_READ_FOOTER; \
679 680 681 682
}

#define __gen5_read(x) \
static u##x \
683
gen5_read##x(struct drm_i915_private *dev_priv, i915_reg_t reg, bool trace) { \
684
	GEN2_READ_HEADER(x); \
685 686
	ilk_dummy_write(dev_priv); \
	val = __raw_i915_read##x(dev_priv, reg); \
687
	GEN2_READ_FOOTER; \
688 689
}

690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705
__gen5_read(8)
__gen5_read(16)
__gen5_read(32)
__gen5_read(64)
__gen2_read(8)
__gen2_read(16)
__gen2_read(32)
__gen2_read(64)

#undef __gen5_read
#undef __gen2_read

#undef GEN2_READ_FOOTER
#undef GEN2_READ_HEADER

#define GEN6_READ_HEADER(x) \
706
	u32 offset = i915_mmio_reg_offset(reg); \
707 708
	unsigned long irqflags; \
	u##x val = 0; \
709
	assert_rpm_wakelock_held(dev_priv); \
710 711
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags); \
	unclaimed_reg_debug(dev_priv, reg, true, true)
712 713

#define GEN6_READ_FOOTER \
714
	unclaimed_reg_debug(dev_priv, reg, true, false); \
715 716 717 718
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags); \
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

719
static inline void __force_wake_get(struct drm_i915_private *dev_priv,
720
				    enum forcewake_domains fw_domains)
721 722
{
	struct intel_uncore_forcewake_domain *domain;
723
	enum forcewake_domain_id id;
724 725 726 727 728

	if (WARN_ON(!fw_domains))
		return;

	/* Ideally GCC would be constant-fold and eliminate this loop */
729
	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
730
		if (domain->wake_count) {
731
			fw_domains &= ~(1 << id);
732 733 734 735
			continue;
		}

		domain->wake_count++;
736
		fw_domain_arm_timer(domain);
737 738 739 740 741 742
	}

	if (fw_domains)
		dev_priv->uncore.funcs.force_wake_get(dev_priv, fw_domains);
}

743 744
#define __gen6_read(x) \
static u##x \
745
gen6_read##x(struct drm_i915_private *dev_priv, i915_reg_t reg, bool trace) { \
746
	GEN6_READ_HEADER(x); \
747
	if (NEEDS_FORCE_WAKE(offset)) \
748
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
749
	val = __raw_i915_read##x(dev_priv, reg); \
750
	GEN6_READ_FOOTER; \
751 752
}

753 754
#define __vlv_read(x) \
static u##x \
755
vlv_read##x(struct drm_i915_private *dev_priv, i915_reg_t reg, bool trace) { \
756
	enum forcewake_domains fw_engine = 0; \
757
	GEN6_READ_HEADER(x); \
758
	if (!NEEDS_FORCE_WAKE(offset)) \
759
		fw_engine = 0; \
760
	else if (FORCEWAKE_VLV_RENDER_RANGE_OFFSET(offset)) \
761
		fw_engine = FORCEWAKE_RENDER; \
762
	else if (FORCEWAKE_VLV_MEDIA_RANGE_OFFSET(offset)) \
763 764 765
		fw_engine = FORCEWAKE_MEDIA; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
766
	val = __raw_i915_read##x(dev_priv, reg); \
767
	GEN6_READ_FOOTER; \
768 769
}

770 771
#define __chv_read(x) \
static u##x \
772
chv_read##x(struct drm_i915_private *dev_priv, i915_reg_t reg, bool trace) { \
773
	enum forcewake_domains fw_engine = 0; \
774
	GEN6_READ_HEADER(x); \
775
	if (!NEEDS_FORCE_WAKE(offset)) \
776
		fw_engine = 0; \
777
	else if (FORCEWAKE_CHV_RENDER_RANGE_OFFSET(offset)) \
778
		fw_engine = FORCEWAKE_RENDER; \
779
	else if (FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(offset)) \
780
		fw_engine = FORCEWAKE_MEDIA; \
781
	else if (FORCEWAKE_CHV_COMMON_RANGE_OFFSET(offset)) \
782 783 784
		fw_engine = FORCEWAKE_RENDER | FORCEWAKE_MEDIA; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
785
	val = __raw_i915_read##x(dev_priv, reg); \
786
	GEN6_READ_FOOTER; \
787
}
788

789
#define SKL_NEEDS_FORCE_WAKE(reg) \
790
	((reg) < 0x40000 && !FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg))
791 792 793

#define __gen9_read(x) \
static u##x \
794
gen9_read##x(struct drm_i915_private *dev_priv, i915_reg_t reg, bool trace) { \
795
	enum forcewake_domains fw_engine; \
796
	GEN6_READ_HEADER(x); \
797
	if (!SKL_NEEDS_FORCE_WAKE(offset)) \
798
		fw_engine = 0; \
799
	else if (FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(offset)) \
800
		fw_engine = FORCEWAKE_RENDER; \
801
	else if (FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(offset)) \
802
		fw_engine = FORCEWAKE_MEDIA; \
803
	else if (FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(offset)) \
804 805 806 807 808 809
		fw_engine = FORCEWAKE_RENDER | FORCEWAKE_MEDIA; \
	else \
		fw_engine = FORCEWAKE_BLITTER; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
	val = __raw_i915_read##x(dev_priv, reg); \
810
	GEN6_READ_FOOTER; \
811 812 813 814 815 816
}

__gen9_read(8)
__gen9_read(16)
__gen9_read(32)
__gen9_read(64)
817 818 819 820
__chv_read(8)
__chv_read(16)
__chv_read(32)
__chv_read(64)
821 822 823 824
__vlv_read(8)
__vlv_read(16)
__vlv_read(32)
__vlv_read(64)
825 826 827 828 829
__gen6_read(8)
__gen6_read(16)
__gen6_read(32)
__gen6_read(64)

830
#undef __gen9_read
831
#undef __chv_read
832
#undef __vlv_read
833
#undef __gen6_read
834 835
#undef GEN6_READ_FOOTER
#undef GEN6_READ_HEADER
B
Ben Widawsky 已提交
836

837 838 839
#define VGPU_READ_HEADER(x) \
	unsigned long irqflags; \
	u##x val = 0; \
840
	assert_rpm_device_not_suspended(dev_priv); \
841 842 843 844 845 846 847 848 849
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags)

#define VGPU_READ_FOOTER \
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags); \
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

#define __vgpu_read(x) \
static u##x \
850
vgpu_read##x(struct drm_i915_private *dev_priv, i915_reg_t reg, bool trace) { \
851 852 853 854 855 856 857 858 859 860 861 862 863 864
	VGPU_READ_HEADER(x); \
	val = __raw_i915_read##x(dev_priv, reg); \
	VGPU_READ_FOOTER; \
}

__vgpu_read(8)
__vgpu_read(16)
__vgpu_read(32)
__vgpu_read(64)

#undef __vgpu_read
#undef VGPU_READ_FOOTER
#undef VGPU_READ_HEADER

865
#define GEN2_WRITE_HEADER \
B
Ben Widawsky 已提交
866
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
867
	assert_rpm_wakelock_held(dev_priv); \
868

869
#define GEN2_WRITE_FOOTER
V
Ville Syrjälä 已提交
870

871
#define __gen2_write(x) \
872
static void \
873
gen2_write##x(struct drm_i915_private *dev_priv, i915_reg_t reg, u##x val, bool trace) { \
874
	GEN2_WRITE_HEADER; \
875
	__raw_i915_write##x(dev_priv, reg, val); \
876
	GEN2_WRITE_FOOTER; \
877 878 879 880
}

#define __gen5_write(x) \
static void \
881
gen5_write##x(struct drm_i915_private *dev_priv, i915_reg_t reg, u##x val, bool trace) { \
882
	GEN2_WRITE_HEADER; \
883 884
	ilk_dummy_write(dev_priv); \
	__raw_i915_write##x(dev_priv, reg, val); \
885
	GEN2_WRITE_FOOTER; \
886 887
}

888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903
__gen5_write(8)
__gen5_write(16)
__gen5_write(32)
__gen5_write(64)
__gen2_write(8)
__gen2_write(16)
__gen2_write(32)
__gen2_write(64)

#undef __gen5_write
#undef __gen2_write

#undef GEN2_WRITE_FOOTER
#undef GEN2_WRITE_HEADER

#define GEN6_WRITE_HEADER \
904
	u32 offset = i915_mmio_reg_offset(reg); \
905 906
	unsigned long irqflags; \
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
907
	assert_rpm_wakelock_held(dev_priv); \
908 909
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags); \
	unclaimed_reg_debug(dev_priv, reg, false, true)
910 911

#define GEN6_WRITE_FOOTER \
912
	unclaimed_reg_debug(dev_priv, reg, false, false); \
913 914
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags)

915 916
#define __gen6_write(x) \
static void \
917
gen6_write##x(struct drm_i915_private *dev_priv, i915_reg_t reg, u##x val, bool trace) { \
918
	u32 __fifo_ret = 0; \
919
	GEN6_WRITE_HEADER; \
920
	if (NEEDS_FORCE_WAKE(offset)) { \
921 922 923 924 925 926
		__fifo_ret = __gen6_gt_wait_for_fifo(dev_priv); \
	} \
	__raw_i915_write##x(dev_priv, reg, val); \
	if (unlikely(__fifo_ret)) { \
		gen6_gt_check_fifodbg(dev_priv); \
	} \
927
	GEN6_WRITE_FOOTER; \
928 929 930 931
}

#define __hsw_write(x) \
static void \
932
hsw_write##x(struct drm_i915_private *dev_priv, i915_reg_t reg, u##x val, bool trace) { \
933
	u32 __fifo_ret = 0; \
934
	GEN6_WRITE_HEADER; \
935
	if (NEEDS_FORCE_WAKE(offset)) { \
936 937
		__fifo_ret = __gen6_gt_wait_for_fifo(dev_priv); \
	} \
938
	__raw_i915_write##x(dev_priv, reg, val); \
939 940 941
	if (unlikely(__fifo_ret)) { \
		gen6_gt_check_fifodbg(dev_priv); \
	} \
942
	GEN6_WRITE_FOOTER; \
943
}
944

945
static const i915_reg_t gen8_shadowed_regs[] = {
946 947 948 949 950 951 952 953 954 955
	FORCEWAKE_MT,
	GEN6_RPNSWREQ,
	GEN6_RC_VIDEO_FREQ,
	RING_TAIL(RENDER_RING_BASE),
	RING_TAIL(GEN6_BSD_RING_BASE),
	RING_TAIL(VEBOX_RING_BASE),
	RING_TAIL(BLT_RING_BASE),
	/* TODO: Other registers are not yet used */
};

956 957
static bool is_gen8_shadowed(struct drm_i915_private *dev_priv,
			     i915_reg_t reg)
958 959 960
{
	int i;
	for (i = 0; i < ARRAY_SIZE(gen8_shadowed_regs); i++)
961
		if (i915_mmio_reg_equal(reg, gen8_shadowed_regs[i]))
962 963 964 965 966 967 968
			return true;

	return false;
}

#define __gen8_write(x) \
static void \
969
gen8_write##x(struct drm_i915_private *dev_priv, i915_reg_t reg, u##x val, bool trace) { \
970
	GEN6_WRITE_HEADER; \
971
	if (NEEDS_FORCE_WAKE(offset) && !is_gen8_shadowed(dev_priv, reg)) \
972 973
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
	__raw_i915_write##x(dev_priv, reg, val); \
974
	GEN6_WRITE_FOOTER; \
975 976
}

977 978
#define __chv_write(x) \
static void \
979
chv_write##x(struct drm_i915_private *dev_priv, i915_reg_t reg, u##x val, bool trace) { \
980
	enum forcewake_domains fw_engine = 0; \
981
	GEN6_WRITE_HEADER; \
982
	if (!NEEDS_FORCE_WAKE(offset) || \
983
	    is_gen8_shadowed(dev_priv, reg)) \
984
		fw_engine = 0; \
985
	else if (FORCEWAKE_CHV_RENDER_RANGE_OFFSET(offset)) \
986
		fw_engine = FORCEWAKE_RENDER; \
987
	else if (FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(offset)) \
988
		fw_engine = FORCEWAKE_MEDIA; \
989
	else if (FORCEWAKE_CHV_COMMON_RANGE_OFFSET(offset)) \
990 991 992
		fw_engine = FORCEWAKE_RENDER | FORCEWAKE_MEDIA; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
993
	__raw_i915_write##x(dev_priv, reg, val); \
994
	GEN6_WRITE_FOOTER; \
995 996
}

997
static const i915_reg_t gen9_shadowed_regs[] = {
Z
Zhe Wang 已提交
998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009
	RING_TAIL(RENDER_RING_BASE),
	RING_TAIL(GEN6_BSD_RING_BASE),
	RING_TAIL(VEBOX_RING_BASE),
	RING_TAIL(BLT_RING_BASE),
	FORCEWAKE_BLITTER_GEN9,
	FORCEWAKE_RENDER_GEN9,
	FORCEWAKE_MEDIA_GEN9,
	GEN6_RPNSWREQ,
	GEN6_RC_VIDEO_FREQ,
	/* TODO: Other registers are not yet used */
};

1010 1011
static bool is_gen9_shadowed(struct drm_i915_private *dev_priv,
			     i915_reg_t reg)
Z
Zhe Wang 已提交
1012 1013 1014
{
	int i;
	for (i = 0; i < ARRAY_SIZE(gen9_shadowed_regs); i++)
1015
		if (i915_mmio_reg_equal(reg, gen9_shadowed_regs[i]))
Z
Zhe Wang 已提交
1016 1017 1018 1019 1020
			return true;

	return false;
}

1021 1022
#define __gen9_write(x) \
static void \
1023
gen9_write##x(struct drm_i915_private *dev_priv, i915_reg_t reg, u##x val, \
1024
		bool trace) { \
1025
	enum forcewake_domains fw_engine; \
1026
	GEN6_WRITE_HEADER; \
1027
	if (!SKL_NEEDS_FORCE_WAKE(offset) || \
1028 1029
	    is_gen9_shadowed(dev_priv, reg)) \
		fw_engine = 0; \
1030
	else if (FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(offset)) \
1031
		fw_engine = FORCEWAKE_RENDER; \
1032
	else if (FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(offset)) \
1033
		fw_engine = FORCEWAKE_MEDIA; \
1034
	else if (FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(offset)) \
1035 1036 1037 1038 1039 1040
		fw_engine = FORCEWAKE_RENDER | FORCEWAKE_MEDIA; \
	else \
		fw_engine = FORCEWAKE_BLITTER; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
	__raw_i915_write##x(dev_priv, reg, val); \
1041
	GEN6_WRITE_FOOTER; \
1042 1043 1044 1045 1046 1047
}

__gen9_write(8)
__gen9_write(16)
__gen9_write(32)
__gen9_write(64)
1048 1049 1050 1051
__chv_write(8)
__chv_write(16)
__chv_write(32)
__chv_write(64)
1052 1053 1054 1055
__gen8_write(8)
__gen8_write(16)
__gen8_write(32)
__gen8_write(64)
1056 1057 1058 1059 1060 1061 1062 1063 1064
__hsw_write(8)
__hsw_write(16)
__hsw_write(32)
__hsw_write(64)
__gen6_write(8)
__gen6_write(16)
__gen6_write(32)
__gen6_write(64)

1065
#undef __gen9_write
1066
#undef __chv_write
1067
#undef __gen8_write
1068 1069
#undef __hsw_write
#undef __gen6_write
1070 1071
#undef GEN6_WRITE_FOOTER
#undef GEN6_WRITE_HEADER
1072

1073 1074 1075
#define VGPU_WRITE_HEADER \
	unsigned long irqflags; \
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
1076
	assert_rpm_device_not_suspended(dev_priv); \
1077 1078 1079 1080 1081 1082 1083
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags)

#define VGPU_WRITE_FOOTER \
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags)

#define __vgpu_write(x) \
static void vgpu_write##x(struct drm_i915_private *dev_priv, \
1084
			  i915_reg_t reg, u##x val, bool trace) { \
1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098
	VGPU_WRITE_HEADER; \
	__raw_i915_write##x(dev_priv, reg, val); \
	VGPU_WRITE_FOOTER; \
}

__vgpu_write(8)
__vgpu_write(16)
__vgpu_write(32)
__vgpu_write(64)

#undef __vgpu_write
#undef VGPU_WRITE_FOOTER
#undef VGPU_WRITE_HEADER

1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114
#define ASSIGN_WRITE_MMIO_VFUNCS(x) \
do { \
	dev_priv->uncore.funcs.mmio_writeb = x##_write8; \
	dev_priv->uncore.funcs.mmio_writew = x##_write16; \
	dev_priv->uncore.funcs.mmio_writel = x##_write32; \
	dev_priv->uncore.funcs.mmio_writeq = x##_write64; \
} while (0)

#define ASSIGN_READ_MMIO_VFUNCS(x) \
do { \
	dev_priv->uncore.funcs.mmio_readb = x##_read8; \
	dev_priv->uncore.funcs.mmio_readw = x##_read16; \
	dev_priv->uncore.funcs.mmio_readl = x##_read32; \
	dev_priv->uncore.funcs.mmio_readq = x##_read64; \
} while (0)

1115 1116

static void fw_domain_init(struct drm_i915_private *dev_priv,
1117
			   enum forcewake_domain_id domain_id,
1118 1119
			   i915_reg_t reg_set,
			   i915_reg_t reg_ack)
1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138
{
	struct intel_uncore_forcewake_domain *d;

	if (WARN_ON(domain_id >= FW_DOMAIN_ID_COUNT))
		return;

	d = &dev_priv->uncore.fw_domain[domain_id];

	WARN_ON(d->wake_count);

	d->wake_count = 0;
	d->reg_set = reg_set;
	d->reg_ack = reg_ack;

	if (IS_GEN6(dev_priv)) {
		d->val_reset = 0;
		d->val_set = FORCEWAKE_KERNEL;
		d->val_clear = 0;
	} else {
1139
		/* WaRsClearFWBitsAtReset:bdw,skl */
1140 1141 1142 1143 1144
		d->val_reset = _MASKED_BIT_DISABLE(0xffff);
		d->val_set = _MASKED_BIT_ENABLE(FORCEWAKE_KERNEL);
		d->val_clear = _MASKED_BIT_DISABLE(FORCEWAKE_KERNEL);
	}

1145
	if (IS_VALLEYVIEW(dev_priv) || IS_CHERRYVIEW(dev_priv))
1146 1147 1148 1149 1150 1151 1152
		d->reg_post = FORCEWAKE_ACK_VLV;
	else if (IS_GEN6(dev_priv) || IS_GEN7(dev_priv) || IS_GEN8(dev_priv))
		d->reg_post = ECOBUS;

	d->i915 = dev_priv;
	d->id = domain_id;

1153
	setup_timer(&d->timer, intel_uncore_fw_release_timer, (unsigned long)d);
1154 1155

	dev_priv->uncore.fw_domains |= (1 << domain_id);
1156 1157

	fw_domain_reset(d);
1158 1159
}

1160
static void intel_uncore_fw_domains_init(struct drm_device *dev)
1161 1162 1163
{
	struct drm_i915_private *dev_priv = dev->dev_private;

1164 1165 1166
	if (INTEL_INFO(dev_priv->dev)->gen <= 5)
		return;

Z
Zhe Wang 已提交
1167
	if (IS_GEN9(dev)) {
1168 1169 1170 1171 1172 1173 1174 1175 1176 1177
		dev_priv->uncore.funcs.force_wake_get = fw_domains_get;
		dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_RENDER_GEN9,
			       FORCEWAKE_ACK_RENDER_GEN9);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_BLITTER,
			       FORCEWAKE_BLITTER_GEN9,
			       FORCEWAKE_ACK_BLITTER_GEN9);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_MEDIA,
			       FORCEWAKE_MEDIA_GEN9, FORCEWAKE_ACK_MEDIA_GEN9);
1178
	} else if (IS_VALLEYVIEW(dev) || IS_CHERRYVIEW(dev)) {
1179
		dev_priv->uncore.funcs.force_wake_get = fw_domains_get;
1180 1181 1182 1183 1184
		if (!IS_CHERRYVIEW(dev))
			dev_priv->uncore.funcs.force_wake_put =
				fw_domains_put_with_fifo;
		else
			dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
1185 1186 1187 1188
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_VLV, FORCEWAKE_ACK_VLV);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_MEDIA,
			       FORCEWAKE_MEDIA_VLV, FORCEWAKE_ACK_MEDIA_VLV);
1189
	} else if (IS_HASWELL(dev) || IS_BROADWELL(dev)) {
1190 1191 1192 1193 1194
		dev_priv->uncore.funcs.force_wake_get =
			fw_domains_get_with_thread_status;
		dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_MT, FORCEWAKE_ACK_HSW);
1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206
	} else if (IS_IVYBRIDGE(dev)) {
		u32 ecobus;

		/* IVB configs may use multi-threaded forcewake */

		/* A small trick here - if the bios hasn't configured
		 * MT forcewake, and if the device is in RC6, then
		 * force_wake_mt_get will not wake the device and the
		 * ECOBUS read will return zero. Which will be
		 * (correctly) interpreted by the test below as MT
		 * forcewake being disabled.
		 */
1207 1208 1209 1210 1211
		dev_priv->uncore.funcs.force_wake_get =
			fw_domains_get_with_thread_status;
		dev_priv->uncore.funcs.force_wake_put =
			fw_domains_put_with_fifo;

1212 1213
		/* We need to init first for ECOBUS access and then
		 * determine later if we want to reinit, in case of MT access is
1214 1215 1216
		 * not working. In this stage we don't know which flavour this
		 * ivb is, so it is better to reset also the gen6 fw registers
		 * before the ecobus check.
1217
		 */
1218 1219 1220 1221

		__raw_i915_write32(dev_priv, FORCEWAKE, 0);
		__raw_posting_read(dev_priv, ECOBUS);

1222 1223
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_MT, FORCEWAKE_MT_ACK);
1224

1225
		mutex_lock(&dev->struct_mutex);
1226
		fw_domains_get_with_thread_status(dev_priv, FORCEWAKE_ALL);
1227
		ecobus = __raw_i915_read32(dev_priv, ECOBUS);
1228
		fw_domains_put_with_fifo(dev_priv, FORCEWAKE_ALL);
1229 1230
		mutex_unlock(&dev->struct_mutex);

1231
		if (!(ecobus & FORCEWAKE_MT_ENABLE)) {
1232 1233
			DRM_INFO("No MT forcewake available on Ivybridge, this can result in issues\n");
			DRM_INFO("when using vblank-synced partial screen updates.\n");
1234 1235
			fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
				       FORCEWAKE, FORCEWAKE_ACK);
1236 1237 1238
		}
	} else if (IS_GEN6(dev)) {
		dev_priv->uncore.funcs.force_wake_get =
1239
			fw_domains_get_with_thread_status;
1240
		dev_priv->uncore.funcs.force_wake_put =
1241 1242 1243
			fw_domains_put_with_fifo;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE, FORCEWAKE_ACK);
1244
	}
1245 1246 1247

	/* All future platforms are expected to require complex power gating */
	WARN_ON(dev_priv->uncore.fw_domains == 0);
1248 1249 1250 1251 1252 1253
}

void intel_uncore_init(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;

1254 1255
	i915_check_vgpu(dev);

1256 1257 1258
	intel_uncore_ellc_detect(dev);
	intel_uncore_fw_domains_init(dev);
	__intel_uncore_early_sanitize(dev, false);
1259

1260 1261
	dev_priv->uncore.unclaimed_mmio_check = 1;

1262
	switch (INTEL_INFO(dev)->gen) {
1263
	default:
1264 1265 1266 1267 1268
	case 9:
		ASSIGN_WRITE_MMIO_VFUNCS(gen9);
		ASSIGN_READ_MMIO_VFUNCS(gen9);
		break;
	case 8:
1269
		if (IS_CHERRYVIEW(dev)) {
1270 1271
			ASSIGN_WRITE_MMIO_VFUNCS(chv);
			ASSIGN_READ_MMIO_VFUNCS(chv);
1272 1273

		} else {
1274 1275
			ASSIGN_WRITE_MMIO_VFUNCS(gen8);
			ASSIGN_READ_MMIO_VFUNCS(gen6);
1276
		}
1277
		break;
1278 1279
	case 7:
	case 6:
1280
		if (IS_HASWELL(dev)) {
1281
			ASSIGN_WRITE_MMIO_VFUNCS(hsw);
1282
		} else {
1283
			ASSIGN_WRITE_MMIO_VFUNCS(gen6);
1284
		}
1285 1286

		if (IS_VALLEYVIEW(dev)) {
1287
			ASSIGN_READ_MMIO_VFUNCS(vlv);
1288
		} else {
1289
			ASSIGN_READ_MMIO_VFUNCS(gen6);
1290
		}
1291 1292
		break;
	case 5:
1293 1294
		ASSIGN_WRITE_MMIO_VFUNCS(gen5);
		ASSIGN_READ_MMIO_VFUNCS(gen5);
1295 1296 1297 1298
		break;
	case 4:
	case 3:
	case 2:
1299 1300
		ASSIGN_WRITE_MMIO_VFUNCS(gen2);
		ASSIGN_READ_MMIO_VFUNCS(gen2);
1301 1302
		break;
	}
1303

1304 1305 1306 1307 1308
	if (intel_vgpu_active(dev)) {
		ASSIGN_WRITE_MMIO_VFUNCS(vgpu);
		ASSIGN_READ_MMIO_VFUNCS(vgpu);
	}

1309
	i915_check_and_clear_faults(dev);
1310
}
1311 1312
#undef ASSIGN_WRITE_MMIO_VFUNCS
#undef ASSIGN_READ_MMIO_VFUNCS
1313 1314 1315 1316 1317

void intel_uncore_fini(struct drm_device *dev)
{
	/* Paranoia: make sure we have disabled everything before we exit. */
	intel_uncore_sanitize(dev);
1318
	intel_uncore_forcewake_reset(dev, false);
1319 1320
}

1321 1322
#define GEN_RANGE(l, h) GENMASK(h, l)

1323
static const struct register_whitelist {
1324
	i915_reg_t offset_ldw, offset_udw;
1325
	uint32_t size;
1326 1327
	/* supported gens, 0x10 for 4, 0x30 for 4 and 5, etc. */
	uint32_t gen_bitmask;
1328
} whitelist[] = {
1329 1330 1331
	{ .offset_ldw = RING_TIMESTAMP(RENDER_RING_BASE),
	  .offset_udw = RING_TIMESTAMP_UDW(RENDER_RING_BASE),
	  .size = 8, .gen_bitmask = GEN_RANGE(4, 9) },
1332 1333 1334 1335 1336 1337 1338 1339
};

int i915_reg_read_ioctl(struct drm_device *dev,
			void *data, struct drm_file *file)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_reg_read *reg = data;
	struct register_whitelist const *entry = whitelist;
1340
	unsigned size;
1341
	i915_reg_t offset_ldw, offset_udw;
1342
	int i, ret = 0;
1343 1344

	for (i = 0; i < ARRAY_SIZE(whitelist); i++, entry++) {
1345
		if (i915_mmio_reg_offset(entry->offset_ldw) == (reg->offset & -entry->size) &&
1346 1347 1348 1349 1350 1351 1352
		    (1 << INTEL_INFO(dev)->gen & entry->gen_bitmask))
			break;
	}

	if (i == ARRAY_SIZE(whitelist))
		return -EINVAL;

1353 1354 1355 1356
	/* We use the low bits to encode extra flags as the register should
	 * be naturally aligned (and those that are not so aligned merely
	 * limit the available flags for that register).
	 */
1357 1358
	offset_ldw = entry->offset_ldw;
	offset_udw = entry->offset_udw;
1359
	size = entry->size;
1360
	size |= reg->offset ^ i915_mmio_reg_offset(offset_ldw);
1361

1362 1363
	intel_runtime_pm_get(dev_priv);

1364 1365
	switch (size) {
	case 8 | 1:
1366
		reg->val = I915_READ64_2x32(offset_ldw, offset_udw);
1367
		break;
1368
	case 8:
1369
		reg->val = I915_READ64(offset_ldw);
1370 1371
		break;
	case 4:
1372
		reg->val = I915_READ(offset_ldw);
1373 1374
		break;
	case 2:
1375
		reg->val = I915_READ16(offset_ldw);
1376 1377
		break;
	case 1:
1378
		reg->val = I915_READ8(offset_ldw);
1379 1380
		break;
	default:
1381 1382
		ret = -EINVAL;
		goto out;
1383 1384
	}

1385 1386 1387
out:
	intel_runtime_pm_put(dev_priv);
	return ret;
1388 1389
}

1390 1391 1392 1393 1394 1395
int i915_get_reset_stats_ioctl(struct drm_device *dev,
			       void *data, struct drm_file *file)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_reset_stats *args = data;
	struct i915_ctx_hang_stats *hs;
1396
	struct intel_context *ctx;
1397 1398
	int ret;

1399 1400 1401
	if (args->flags || args->pad)
		return -EINVAL;

1402
	if (args->ctx_id == DEFAULT_CONTEXT_HANDLE && !capable(CAP_SYS_ADMIN))
1403 1404 1405 1406 1407 1408
		return -EPERM;

	ret = mutex_lock_interruptible(&dev->struct_mutex);
	if (ret)
		return ret;

1409 1410
	ctx = i915_gem_context_get(file->driver_priv, args->ctx_id);
	if (IS_ERR(ctx)) {
1411
		mutex_unlock(&dev->struct_mutex);
1412
		return PTR_ERR(ctx);
1413
	}
1414
	hs = &ctx->hang_stats;
1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 1428

	if (capable(CAP_SYS_ADMIN))
		args->reset_count = i915_reset_count(&dev_priv->gpu_error);
	else
		args->reset_count = 0;

	args->batch_active = hs->batch_active;
	args->batch_pending = hs->batch_pending;

	mutex_unlock(&dev->struct_mutex);

	return 0;
}

1429
static int i915_reset_complete(struct drm_device *dev)
1430 1431
{
	u8 gdrst;
1432
	pci_read_config_byte(dev->pdev, I915_GDRST, &gdrst);
V
Ville Syrjälä 已提交
1433
	return (gdrst & GRDOM_RESET_STATUS) == 0;
1434 1435
}

1436
static int i915_do_reset(struct drm_device *dev)
1437
{
V
Ville Syrjälä 已提交
1438
	/* assert reset for at least 20 usec */
1439
	pci_write_config_byte(dev->pdev, I915_GDRST, GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1440
	udelay(20);
1441
	pci_write_config_byte(dev->pdev, I915_GDRST, 0);
1442

1443
	return wait_for(i915_reset_complete(dev), 500);
V
Ville Syrjälä 已提交
1444 1445 1446 1447 1448
}

static int g4x_reset_complete(struct drm_device *dev)
{
	u8 gdrst;
1449
	pci_read_config_byte(dev->pdev, I915_GDRST, &gdrst);
V
Ville Syrjälä 已提交
1450
	return (gdrst & GRDOM_RESET_ENABLE) == 0;
1451 1452
}

1453 1454 1455 1456 1457 1458
static int g33_do_reset(struct drm_device *dev)
{
	pci_write_config_byte(dev->pdev, I915_GDRST, GRDOM_RESET_ENABLE);
	return wait_for(g4x_reset_complete(dev), 500);
}

1459 1460 1461 1462 1463
static int g4x_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int ret;

1464
	pci_write_config_byte(dev->pdev, I915_GDRST,
1465
			      GRDOM_RENDER | GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1466
	ret =  wait_for(g4x_reset_complete(dev), 500);
1467 1468 1469 1470 1471 1472 1473
	if (ret)
		return ret;

	/* WaVcpClkGateDisableForMediaReset:ctg,elk */
	I915_WRITE(VDECCLK_GATE_D, I915_READ(VDECCLK_GATE_D) | VCP_UNIT_CLOCK_GATE_DISABLE);
	POSTING_READ(VDECCLK_GATE_D);

1474
	pci_write_config_byte(dev->pdev, I915_GDRST,
1475
			      GRDOM_MEDIA | GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1476
	ret =  wait_for(g4x_reset_complete(dev), 500);
1477 1478 1479 1480 1481 1482 1483
	if (ret)
		return ret;

	/* WaVcpClkGateDisableForMediaReset:ctg,elk */
	I915_WRITE(VDECCLK_GATE_D, I915_READ(VDECCLK_GATE_D) & ~VCP_UNIT_CLOCK_GATE_DISABLE);
	POSTING_READ(VDECCLK_GATE_D);

1484
	pci_write_config_byte(dev->pdev, I915_GDRST, 0);
1485 1486 1487 1488

	return 0;
}

1489 1490 1491 1492 1493
static int ironlake_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int ret;

1494
	I915_WRITE(ILK_GDSR,
1495
		   ILK_GRDOM_RENDER | ILK_GRDOM_RESET_ENABLE);
1496
	ret = wait_for((I915_READ(ILK_GDSR) &
1497
			ILK_GRDOM_RESET_ENABLE) == 0, 500);
1498 1499 1500
	if (ret)
		return ret;

1501
	I915_WRITE(ILK_GDSR,
1502
		   ILK_GRDOM_MEDIA | ILK_GRDOM_RESET_ENABLE);
1503
	ret = wait_for((I915_READ(ILK_GDSR) &
1504 1505 1506 1507
			ILK_GRDOM_RESET_ENABLE) == 0, 500);
	if (ret)
		return ret;

1508
	I915_WRITE(ILK_GDSR, 0);
1509 1510

	return 0;
1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523
}

static int gen6_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int	ret;

	/* Reset the chip */

	/* GEN6_GDRST is not in the gt power well, no need to check
	 * for fifo space for the write or forcewake the chip for
	 * the read
	 */
1524
	__raw_i915_write32(dev_priv, GEN6_GDRST, GEN6_GRDOM_FULL);
1525 1526

	/* Spin waiting for the device to ack the reset request */
1527
	ret = wait_for((__raw_i915_read32(dev_priv, GEN6_GDRST) & GEN6_GRDOM_FULL) == 0, 500);
1528

1529
	intel_uncore_forcewake_reset(dev, true);
1530

1531 1532 1533
	return ret;
}

1534 1535 1536 1537 1538
static int wait_for_register_fw(struct drm_i915_private *dev_priv,
				i915_reg_t reg,
				const u32 mask,
				const u32 value,
				const unsigned long timeout_ms)
1539
{
1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567
	return wait_for((I915_READ_FW(reg) & mask) == value, timeout_ms);
}

static int gen8_request_engine_reset(struct intel_engine_cs *engine)
{
	int ret;
	struct drm_i915_private *dev_priv = engine->dev->dev_private;

	I915_WRITE_FW(RING_RESET_CTL(engine->mmio_base),
		      _MASKED_BIT_ENABLE(RESET_CTL_REQUEST_RESET));

	ret = wait_for_register_fw(dev_priv,
				   RING_RESET_CTL(engine->mmio_base),
				   RESET_CTL_READY_TO_RESET,
				   RESET_CTL_READY_TO_RESET,
				   700);
	if (ret)
		DRM_ERROR("%s: reset request timeout\n", engine->name);

	return ret;
}

static void gen8_unrequest_engine_reset(struct intel_engine_cs *engine)
{
	struct drm_i915_private *dev_priv = engine->dev->dev_private;

	I915_WRITE_FW(RING_RESET_CTL(engine->mmio_base),
		      _MASKED_BIT_DISABLE(RESET_CTL_REQUEST_RESET));
1568 1569 1570 1571 1572 1573 1574 1575
}

static int gen8_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct intel_engine_cs *engine;
	int i;

1576 1577
	for_each_ring(engine, dev_priv, i)
		if (gen8_request_engine_reset(engine))
1578 1579 1580 1581 1582 1583
			goto not_ready;

	return gen6_do_reset(dev);

not_ready:
	for_each_ring(engine, dev_priv, i)
1584
		gen8_unrequest_engine_reset(engine);
1585 1586 1587 1588

	return -EIO;
}

1589
static int (*intel_get_gpu_reset(struct drm_device *dev))(struct drm_device *)
1590
{
1591 1592 1593
	if (!i915.reset)
		return NULL;

1594 1595 1596
	if (INTEL_INFO(dev)->gen >= 8)
		return gen8_do_reset;
	else if (INTEL_INFO(dev)->gen >= 6)
1597
		return gen6_do_reset;
1598
	else if (IS_GEN5(dev))
1599
		return ironlake_do_reset;
1600
	else if (IS_G4X(dev))
1601
		return g4x_do_reset;
1602
	else if (IS_G33(dev))
1603
		return g33_do_reset;
1604
	else if (INTEL_INFO(dev)->gen >= 3)
1605
		return i915_do_reset;
1606
	else
1607 1608 1609 1610 1611
		return NULL;
}

int intel_gpu_reset(struct drm_device *dev)
{
1612
	struct drm_i915_private *dev_priv = to_i915(dev);
1613
	int (*reset)(struct drm_device *);
1614
	int ret;
1615 1616 1617

	reset = intel_get_gpu_reset(dev);
	if (reset == NULL)
1618
		return -ENODEV;
1619

1620 1621 1622 1623 1624 1625 1626 1627
	/* If the power well sleeps during the reset, the reset
	 * request may be dropped and never completes (causing -EIO).
	 */
	intel_uncore_forcewake_get(dev_priv, FORCEWAKE_ALL);
	ret = reset(dev);
	intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL);

	return ret;
1628 1629 1630 1631 1632
}

bool intel_has_gpu_reset(struct drm_device *dev)
{
	return intel_get_gpu_reset(dev) != NULL;
1633 1634
}

1635
bool intel_uncore_unclaimed_mmio(struct drm_i915_private *dev_priv)
1636
{
1637
	return check_for_unclaimed_mmio(dev_priv);
1638
}
1639

1640
bool
1641 1642 1643 1644
intel_uncore_arm_unclaimed_mmio_detection(struct drm_i915_private *dev_priv)
{
	if (unlikely(i915.mmio_debug ||
		     dev_priv->uncore.unclaimed_mmio_check <= 0))
1645
		return false;
1646 1647 1648 1649 1650 1651 1652

	if (unlikely(intel_uncore_unclaimed_mmio(dev_priv))) {
		DRM_DEBUG("Unclaimed register detected, "
			  "enabling oneshot unclaimed register reporting. "
			  "Please use i915.mmio_debug=N for more information.\n");
		i915.mmio_debug++;
		dev_priv->uncore.unclaimed_mmio_check--;
1653
		return true;
1654
	}
1655 1656

	return false;
1657
}