intel_uncore.c 40.6 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/*
 * Copyright © 2013 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */

#include "i915_drv.h"
#include "intel_drv.h"
26
#include "i915_vgpu.h"
27

28 29
#include <linux/pm_runtime.h>

30 31
#define FORCEWAKE_ACK_TIMEOUT_MS 2

32 33 34 35 36 37 38 39 40 41 42 43 44 45
#define __raw_i915_read8(dev_priv__, reg__) readb((dev_priv__)->regs + (reg__))
#define __raw_i915_write8(dev_priv__, reg__, val__) writeb(val__, (dev_priv__)->regs + (reg__))

#define __raw_i915_read16(dev_priv__, reg__) readw((dev_priv__)->regs + (reg__))
#define __raw_i915_write16(dev_priv__, reg__, val__) writew(val__, (dev_priv__)->regs + (reg__))

#define __raw_i915_read32(dev_priv__, reg__) readl((dev_priv__)->regs + (reg__))
#define __raw_i915_write32(dev_priv__, reg__, val__) writel(val__, (dev_priv__)->regs + (reg__))

#define __raw_i915_read64(dev_priv__, reg__) readq((dev_priv__)->regs + (reg__))
#define __raw_i915_write64(dev_priv__, reg__, val__) writeq(val__, (dev_priv__)->regs + (reg__))

#define __raw_posting_read(dev_priv__, reg__) (void)__raw_i915_read32(dev_priv__, reg__)

46 47 48 49 50 51 52
static const char * const forcewake_domain_names[] = {
	"render",
	"blitter",
	"media",
};

const char *
53
intel_uncore_forcewake_domain_to_str(const enum forcewake_domain_id id)
54 55 56 57 58 59 60 61 62 63 64 65
{
	BUILD_BUG_ON((sizeof(forcewake_domain_names)/sizeof(const char *)) !=
		     FW_DOMAIN_ID_COUNT);

	if (id >= 0 && id < FW_DOMAIN_ID_COUNT)
		return forcewake_domain_names[id];

	WARN_ON(id);

	return "unknown";
}

66 67 68
static void
assert_device_not_suspended(struct drm_i915_private *dev_priv)
{
69 70
	WARN_ONCE(HAS_RUNTIME_PM(dev_priv->dev) && dev_priv->pm.suspended,
		  "Device suspended\n");
71
}
72

73 74
static inline void
fw_domain_reset(const struct intel_uncore_forcewake_domain *d)
75
{
76
	WARN_ON(d->reg_set == 0);
77
	__raw_i915_write32(d->i915, d->reg_set, d->val_reset);
78 79
}

80 81
static inline void
fw_domain_arm_timer(struct intel_uncore_forcewake_domain *d)
82
{
83
	mod_timer_pinned(&d->timer, jiffies + 1);
84 85
}

86 87
static inline void
fw_domain_wait_ack_clear(const struct intel_uncore_forcewake_domain *d)
88
{
89 90
	if (wait_for_atomic((__raw_i915_read32(d->i915, d->reg_ack) &
			     FORCEWAKE_KERNEL) == 0,
91
			    FORCEWAKE_ACK_TIMEOUT_MS))
92 93 94
		DRM_ERROR("%s: timed out waiting for forcewake ack to clear.\n",
			  intel_uncore_forcewake_domain_to_str(d->id));
}
95

96 97 98 99 100
static inline void
fw_domain_get(const struct intel_uncore_forcewake_domain *d)
{
	__raw_i915_write32(d->i915, d->reg_set, d->val_set);
}
101

102 103 104 105 106
static inline void
fw_domain_wait_ack(const struct intel_uncore_forcewake_domain *d)
{
	if (wait_for_atomic((__raw_i915_read32(d->i915, d->reg_ack) &
			     FORCEWAKE_KERNEL),
107
			    FORCEWAKE_ACK_TIMEOUT_MS))
108 109 110
		DRM_ERROR("%s: timed out waiting for forcewake ack request.\n",
			  intel_uncore_forcewake_domain_to_str(d->id));
}
111

112 113 114 115
static inline void
fw_domain_put(const struct intel_uncore_forcewake_domain *d)
{
	__raw_i915_write32(d->i915, d->reg_set, d->val_clear);
116 117
}

118 119
static inline void
fw_domain_posting_read(const struct intel_uncore_forcewake_domain *d)
120
{
121 122 123
	/* something from same cacheline, but not from the set register */
	if (d->reg_post)
		__raw_posting_read(d->i915, d->reg_post);
124 125
}

126
static void
127
fw_domains_get(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
128
{
129
	struct intel_uncore_forcewake_domain *d;
130
	enum forcewake_domain_id id;
131

132 133 134 135 136 137
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id) {
		fw_domain_wait_ack_clear(d);
		fw_domain_get(d);
		fw_domain_wait_ack(d);
	}
}
138

139
static void
140
fw_domains_put(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
141 142
{
	struct intel_uncore_forcewake_domain *d;
143
	enum forcewake_domain_id id;
144

145 146 147 148 149
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id) {
		fw_domain_put(d);
		fw_domain_posting_read(d);
	}
}
150

151 152 153 154
static void
fw_domains_posting_read(struct drm_i915_private *dev_priv)
{
	struct intel_uncore_forcewake_domain *d;
155
	enum forcewake_domain_id id;
156 157 158 159 160 161 162 163 164

	/* No need to do for all, just do for first found */
	for_each_fw_domain(d, dev_priv, id) {
		fw_domain_posting_read(d);
		break;
	}
}

static void
165
fw_domains_reset(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
166 167
{
	struct intel_uncore_forcewake_domain *d;
168
	enum forcewake_domain_id id;
169

170 171
	if (dev_priv->uncore.fw_domains == 0)
		return;
172

173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id)
		fw_domain_reset(d);

	fw_domains_posting_read(dev_priv);
}

static void __gen6_gt_wait_for_thread_c0(struct drm_i915_private *dev_priv)
{
	/* w/a for a sporadic read returning 0 by waiting for the GT
	 * thread to wake up.
	 */
	if (wait_for_atomic_us((__raw_i915_read32(dev_priv, GEN6_GT_THREAD_STATUS_REG) &
				GEN6_GT_THREAD_STATUS_CORE_MASK) == 0, 500))
		DRM_ERROR("GT thread status wait timed out\n");
}

static void fw_domains_get_with_thread_status(struct drm_i915_private *dev_priv,
190
					      enum forcewake_domains fw_domains)
191 192
{
	fw_domains_get(dev_priv, fw_domains);
193

194
	/* WaRsForcewakeWaitTC0:snb,ivb,hsw,bdw,vlv */
195
	__gen6_gt_wait_for_thread_c0(dev_priv);
196 197 198 199 200
}

static void gen6_gt_check_fifodbg(struct drm_i915_private *dev_priv)
{
	u32 gtfifodbg;
201 202

	gtfifodbg = __raw_i915_read32(dev_priv, GTFIFODBG);
203 204
	if (WARN(gtfifodbg, "GT wake FIFO error 0x%x\n", gtfifodbg))
		__raw_i915_write32(dev_priv, GTFIFODBG, gtfifodbg);
205 206
}

207
static void fw_domains_put_with_fifo(struct drm_i915_private *dev_priv,
208
				     enum forcewake_domains fw_domains)
209
{
210
	fw_domains_put(dev_priv, fw_domains);
211 212 213
	gen6_gt_check_fifodbg(dev_priv);
}

214 215 216 217 218 219 220
static inline u32 fifo_free_entries(struct drm_i915_private *dev_priv)
{
	u32 count = __raw_i915_read32(dev_priv, GTFIFOCTL);

	return count & GT_FIFO_FREE_ENTRIES_MASK;
}

221 222 223 224
static int __gen6_gt_wait_for_fifo(struct drm_i915_private *dev_priv)
{
	int ret = 0;

225 226 227
	/* On VLV, FIFO will be shared by both SW and HW.
	 * So, we need to read the FREE_ENTRIES everytime */
	if (IS_VALLEYVIEW(dev_priv->dev))
228
		dev_priv->uncore.fifo_count = fifo_free_entries(dev_priv);
229

230 231
	if (dev_priv->uncore.fifo_count < GT_FIFO_NUM_RESERVED_ENTRIES) {
		int loop = 500;
232 233
		u32 fifo = fifo_free_entries(dev_priv);

234 235
		while (fifo <= GT_FIFO_NUM_RESERVED_ENTRIES && loop--) {
			udelay(10);
236
			fifo = fifo_free_entries(dev_priv);
237 238 239 240 241 242 243 244 245 246
		}
		if (WARN_ON(loop < 0 && fifo <= GT_FIFO_NUM_RESERVED_ENTRIES))
			++ret;
		dev_priv->uncore.fifo_count = fifo;
	}
	dev_priv->uncore.fifo_count--;

	return ret;
}

247
static void intel_uncore_fw_release_timer(unsigned long arg)
Z
Zhe Wang 已提交
248
{
249 250
	struct intel_uncore_forcewake_domain *domain = (void *)arg;
	unsigned long irqflags;
Z
Zhe Wang 已提交
251

252
	assert_device_not_suspended(domain->i915);
Z
Zhe Wang 已提交
253

254 255 256 257 258 259 260 261 262
	spin_lock_irqsave(&domain->i915->uncore.lock, irqflags);
	if (WARN_ON(domain->wake_count == 0))
		domain->wake_count++;

	if (--domain->wake_count == 0)
		domain->i915->uncore.funcs.force_wake_put(domain->i915,
							  1 << domain->id);

	spin_unlock_irqrestore(&domain->i915->uncore.lock, irqflags);
Z
Zhe Wang 已提交
263 264
}

265
void intel_uncore_forcewake_reset(struct drm_device *dev, bool restore)
Z
Zhe Wang 已提交
266
{
267
	struct drm_i915_private *dev_priv = dev->dev_private;
268
	unsigned long irqflags;
269
	struct intel_uncore_forcewake_domain *domain;
270 271 272
	int retry_count = 100;
	enum forcewake_domain_id id;
	enum forcewake_domains fw = 0, active_domains;
Z
Zhe Wang 已提交
273

274 275 276 277 278 279
	/* Hold uncore.lock across reset to prevent any register access
	 * with forcewake not set correctly. Wait until all pending
	 * timers are run before holding.
	 */
	while (1) {
		active_domains = 0;
Z
Zhe Wang 已提交
280

281 282 283
		for_each_fw_domain(domain, dev_priv, id) {
			if (del_timer_sync(&domain->timer) == 0)
				continue;
Z
Zhe Wang 已提交
284

285
			intel_uncore_fw_release_timer((unsigned long)domain);
286
		}
287

288
		spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
289

290 291 292 293
		for_each_fw_domain(domain, dev_priv, id) {
			if (timer_pending(&domain->timer))
				active_domains |= (1 << id);
		}
294

295 296
		if (active_domains == 0)
			break;
297

298 299 300 301
		if (--retry_count == 0) {
			DRM_ERROR("Timed out waiting for forcewake timers to finish\n");
			break;
		}
302

303 304 305
		spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
		cond_resched();
	}
306

307 308 309 310 311 312 313 314
	WARN_ON(active_domains);

	for_each_fw_domain(domain, dev_priv, id)
		if (domain->wake_count)
			fw |= 1 << id;

	if (fw)
		dev_priv->uncore.funcs.force_wake_put(dev_priv, fw);
315

316
	fw_domains_reset(dev_priv, FORCEWAKE_ALL);
Z
Zhe Wang 已提交
317

318 319 320 321 322 323
	if (restore) { /* If reset with a user forcewake, try to restore */
		if (fw)
			dev_priv->uncore.funcs.force_wake_get(dev_priv, fw);

		if (IS_GEN6(dev) || IS_GEN7(dev))
			dev_priv->uncore.fifo_count =
324
				fifo_free_entries(dev_priv);
325 326
	}

327
	if (!restore)
328
		assert_forcewakes_inactive(dev_priv);
329

330
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
331 332
}

333
static void intel_uncore_ellc_detect(struct drm_device *dev)
334 335 336
{
	struct drm_i915_private *dev_priv = dev->dev_private;

337 338
	if ((IS_HASWELL(dev) || IS_BROADWELL(dev) ||
	     INTEL_INFO(dev)->gen >= 9) &&
339
	    (__raw_i915_read32(dev_priv, HSW_EDRAM_PRESENT) & EDRAM_ENABLED)) {
340 341 342 343 344 345 346 347
		/* The docs do not explain exactly how the calculation can be
		 * made. It is somewhat guessable, but for now, it's always
		 * 128MB.
		 * NB: We can't write IDICR yet because we do not have gt funcs
		 * set up */
		dev_priv->ellc_size = 128;
		DRM_INFO("Found %zuMB of eLLC\n", dev_priv->ellc_size);
	}
348 349 350 351 352 353 354 355 356
}

static void __intel_uncore_early_sanitize(struct drm_device *dev,
					  bool restore_forcewake)
{
	struct drm_i915_private *dev_priv = dev->dev_private;

	if (HAS_FPGA_DBG_UNCLAIMED(dev))
		__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
357

358 359 360 361 362
	/* clear out old GT FIFO errors */
	if (IS_GEN6(dev) || IS_GEN7(dev))
		__raw_i915_write32(dev_priv, GTFIFODBG,
				   __raw_i915_read32(dev_priv, GTFIFODBG));

363 364 365 366 367 368 369 370
	/* WaDisableShadowRegForCpd:chv */
	if (IS_CHERRYVIEW(dev)) {
		__raw_i915_write32(dev_priv, GTFIFOCTL,
				   __raw_i915_read32(dev_priv, GTFIFOCTL) |
				   GT_FIFO_CTL_BLOCK_ALL_POLICY_STALL |
				   GT_FIFO_CTL_RC6_POLICY_STALL);
	}

371
	intel_uncore_forcewake_reset(dev, restore_forcewake);
372 373
}

374 375 376 377 378 379
void intel_uncore_early_sanitize(struct drm_device *dev, bool restore_forcewake)
{
	__intel_uncore_early_sanitize(dev, restore_forcewake);
	i915_check_and_clear_faults(dev);
}

380 381
void intel_uncore_sanitize(struct drm_device *dev)
{
382 383 384 385
	/* BIOS often leaves RC6 enabled, but disable it for hw init */
	intel_disable_gt_powersave(dev);
}

386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405
static void __intel_uncore_forcewake_get(struct drm_i915_private *dev_priv,
					 enum forcewake_domains fw_domains)
{
	struct intel_uncore_forcewake_domain *domain;
	enum forcewake_domain_id id;

	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

	fw_domains &= dev_priv->uncore.fw_domains;

	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
		if (domain->wake_count++)
			fw_domains &= ~(1 << id);
	}

	if (fw_domains)
		dev_priv->uncore.funcs.force_wake_get(dev_priv, fw_domains);
}

406 407 408 409 410 411 412 413 414 415 416 417
/**
 * intel_uncore_forcewake_get - grab forcewake domain references
 * @dev_priv: i915 device instance
 * @fw_domains: forcewake domains to get reference on
 *
 * This function can be used get GT's forcewake domain references.
 * Normal register access will handle the forcewake domains automatically.
 * However if some sequence requires the GT to not power down a particular
 * forcewake domains this function should be called at the beginning of the
 * sequence. And subsequently the reference should be dropped by symmetric
 * call to intel_unforce_forcewake_put(). Usually caller wants all the domains
 * to be kept awake so the @fw_domains would be then FORCEWAKE_ALL.
418
 */
419
void intel_uncore_forcewake_get(struct drm_i915_private *dev_priv,
420
				enum forcewake_domains fw_domains)
421 422 423
{
	unsigned long irqflags;

424 425 426
	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

427
	WARN_ON(dev_priv->pm.suspended);
428

429
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
430
	__intel_uncore_forcewake_get(dev_priv, fw_domains);
431 432 433
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
}

434
/**
435
 * intel_uncore_forcewake_get__locked - grab forcewake domain references
436
 * @dev_priv: i915 device instance
437
 * @fw_domains: forcewake domains to get reference on
438
 *
439 440
 * See intel_uncore_forcewake_get(). This variant places the onus
 * on the caller to explicitly handle the dev_priv->uncore.lock spinlock.
441
 */
442 443 444 445 446 447 448 449 450 451 452 453 454
void intel_uncore_forcewake_get__locked(struct drm_i915_private *dev_priv,
					enum forcewake_domains fw_domains)
{
	assert_spin_locked(&dev_priv->uncore.lock);

	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

	__intel_uncore_forcewake_get(dev_priv, fw_domains);
}

static void __intel_uncore_forcewake_put(struct drm_i915_private *dev_priv,
					 enum forcewake_domains fw_domains)
455
{
456
	struct intel_uncore_forcewake_domain *domain;
457
	enum forcewake_domain_id id;
458

459 460 461
	if (!dev_priv->uncore.funcs.force_wake_put)
		return;

462 463 464 465 466 467 468 469 470 471
	fw_domains &= dev_priv->uncore.fw_domains;

	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
		if (WARN_ON(domain->wake_count == 0))
			continue;

		if (--domain->wake_count)
			continue;

		domain->wake_count++;
472
		fw_domain_arm_timer(domain);
473
	}
474
}
475

476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493
/**
 * intel_uncore_forcewake_put - release a forcewake domain reference
 * @dev_priv: i915 device instance
 * @fw_domains: forcewake domains to put references
 *
 * This function drops the device-level forcewakes for specified
 * domains obtained by intel_uncore_forcewake_get().
 */
void intel_uncore_forcewake_put(struct drm_i915_private *dev_priv,
				enum forcewake_domains fw_domains)
{
	unsigned long irqflags;

	if (!dev_priv->uncore.funcs.force_wake_put)
		return;

	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
	__intel_uncore_forcewake_put(dev_priv, fw_domains);
494 495 496
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
}

497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515
/**
 * intel_uncore_forcewake_put__locked - grab forcewake domain references
 * @dev_priv: i915 device instance
 * @fw_domains: forcewake domains to get reference on
 *
 * See intel_uncore_forcewake_put(). This variant places the onus
 * on the caller to explicitly handle the dev_priv->uncore.lock spinlock.
 */
void intel_uncore_forcewake_put__locked(struct drm_i915_private *dev_priv,
					enum forcewake_domains fw_domains)
{
	assert_spin_locked(&dev_priv->uncore.lock);

	if (!dev_priv->uncore.funcs.force_wake_put)
		return;

	__intel_uncore_forcewake_put(dev_priv, fw_domains);
}

516
void assert_forcewakes_inactive(struct drm_i915_private *dev_priv)
517
{
518
	struct intel_uncore_forcewake_domain *domain;
519
	enum forcewake_domain_id id;
520

521 522 523
	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

524
	for_each_fw_domain(domain, dev_priv, id)
525
		WARN_ON(domain->wake_count);
526 527
}

528 529
/* We give fast paths for the really cool registers */
#define NEEDS_FORCE_WAKE(dev_priv, reg) \
530
	 ((reg) < 0x40000 && (reg) != FORCEWAKE)
531

532
#define REG_RANGE(reg, start, end) ((reg) >= (start) && (reg) < (end))
533

534 535 536 537 538 539 540 541 542 543 544 545 546
#define FORCEWAKE_VLV_RENDER_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x2000, 0x4000) || \
	 REG_RANGE((reg), 0x5000, 0x8000) || \
	 REG_RANGE((reg), 0xB000, 0x12000) || \
	 REG_RANGE((reg), 0x2E000, 0x30000))

#define FORCEWAKE_VLV_MEDIA_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x22000, 0x24000) || \
	 REG_RANGE((reg), 0x30000, 0x40000))

#define FORCEWAKE_CHV_RENDER_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x2000, 0x4000) || \
547
	 REG_RANGE((reg), 0x5200, 0x8000) || \
548
	 REG_RANGE((reg), 0x8300, 0x8500) || \
549
	 REG_RANGE((reg), 0xB000, 0xB480) || \
550 551 552 553 554 555 556 557
	 REG_RANGE((reg), 0xE000, 0xE800))

#define FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x8800, 0x8900) || \
	 REG_RANGE((reg), 0xD000, 0xD800) || \
	 REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x1A000, 0x1C000) || \
	 REG_RANGE((reg), 0x1E800, 0x1EA00) || \
558
	 REG_RANGE((reg), 0x30000, 0x38000))
559 560 561 562 563 564

#define FORCEWAKE_CHV_COMMON_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x4000, 0x5000) || \
	 REG_RANGE((reg), 0x8000, 0x8300) || \
	 REG_RANGE((reg), 0x8500, 0x8600) || \
	 REG_RANGE((reg), 0x9000, 0xB000) || \
565
	 REG_RANGE((reg), 0xF000, 0x10000))
566

567
#define FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg) \
568
	REG_RANGE((reg), 0xB00,  0x2000)
569 570

#define FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg) \
571 572
	(REG_RANGE((reg), 0x2000, 0x2700) || \
	 REG_RANGE((reg), 0x3000, 0x4000) || \
573
	 REG_RANGE((reg), 0x5200, 0x8000) || \
574
	 REG_RANGE((reg), 0x8140, 0x8160) || \
575 576 577
	 REG_RANGE((reg), 0x8300, 0x8500) || \
	 REG_RANGE((reg), 0x8C00, 0x8D00) || \
	 REG_RANGE((reg), 0xB000, 0xB480) || \
578 579
	 REG_RANGE((reg), 0xE000, 0xE900) || \
	 REG_RANGE((reg), 0x24400, 0x24800))
580 581

#define FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg) \
582 583
	(REG_RANGE((reg), 0x8130, 0x8140) || \
	 REG_RANGE((reg), 0x8800, 0x8A00) || \
584 585 586 587 588 589 590 591 592 593 594 595 596 597 598
	 REG_RANGE((reg), 0xD000, 0xD800) || \
	 REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x1A000, 0x1EA00) || \
	 REG_RANGE((reg), 0x30000, 0x40000))

#define FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg) \
	REG_RANGE((reg), 0x9400, 0x9800)

#define FORCEWAKE_GEN9_BLITTER_RANGE_OFFSET(reg) \
	((reg) < 0x40000 &&\
	 !FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg))

599 600 601 602 603 604
static void
ilk_dummy_write(struct drm_i915_private *dev_priv)
{
	/* WaIssueDummyWriteToWakeupFromRC6:ilk Issue a dummy write to wake up
	 * the chip from rc6 before touching it for real. MI_MODE is masked,
	 * hence harmless to write 0 into. */
605
	__raw_i915_write32(dev_priv, MI_MODE, 0);
606 607 608
}

static void
609 610
hsw_unclaimed_reg_debug(struct drm_i915_private *dev_priv, u32 reg, bool read,
			bool before)
611
{
612 613 614 615 616 617
	const char *op = read ? "reading" : "writing to";
	const char *when = before ? "before" : "after";

	if (!i915.mmio_debug)
		return;

618
	if (__raw_i915_read32(dev_priv, FPGA_DBG) & FPGA_DBG_RM_NOCLAIM) {
619 620
		WARN(1, "Unclaimed register detected %s %s register 0x%x\n",
		     when, op, reg);
621
		__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
622
		i915.mmio_debug--; /* Only report the first N failures */
623 624 625 626
	}
}

static void
627
hsw_unclaimed_reg_detect(struct drm_i915_private *dev_priv)
628
{
629 630 631
	static bool mmio_debug_once = true;

	if (i915.mmio_debug || !mmio_debug_once)
632 633
		return;

634
	if (__raw_i915_read32(dev_priv, FPGA_DBG) & FPGA_DBG_RM_NOCLAIM) {
635 636 637
		DRM_DEBUG("Unclaimed register detected, "
			  "enabling oneshot unclaimed register reporting. "
			  "Please use i915.mmio_debug=N for more information.\n");
638
		__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
639
		i915.mmio_debug = mmio_debug_once--;
640 641 642
	}
}

643
#define GEN2_READ_HEADER(x) \
B
Ben Widawsky 已提交
644
	u##x val = 0; \
645
	assert_device_not_suspended(dev_priv);
B
Ben Widawsky 已提交
646

647
#define GEN2_READ_FOOTER \
B
Ben Widawsky 已提交
648 649 650
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

651
#define __gen2_read(x) \
652
static u##x \
653 654
gen2_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
	GEN2_READ_HEADER(x); \
655
	val = __raw_i915_read##x(dev_priv, reg); \
656
	GEN2_READ_FOOTER; \
657 658 659 660 661
}

#define __gen5_read(x) \
static u##x \
gen5_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
662
	GEN2_READ_HEADER(x); \
663 664
	ilk_dummy_write(dev_priv); \
	val = __raw_i915_read##x(dev_priv, reg); \
665
	GEN2_READ_FOOTER; \
666 667
}

668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693
__gen5_read(8)
__gen5_read(16)
__gen5_read(32)
__gen5_read(64)
__gen2_read(8)
__gen2_read(16)
__gen2_read(32)
__gen2_read(64)

#undef __gen5_read
#undef __gen2_read

#undef GEN2_READ_FOOTER
#undef GEN2_READ_HEADER

#define GEN6_READ_HEADER(x) \
	unsigned long irqflags; \
	u##x val = 0; \
	assert_device_not_suspended(dev_priv); \
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags)

#define GEN6_READ_FOOTER \
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags); \
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

694
static inline void __force_wake_get(struct drm_i915_private *dev_priv,
695
				    enum forcewake_domains fw_domains)
696 697
{
	struct intel_uncore_forcewake_domain *domain;
698
	enum forcewake_domain_id id;
699 700 701 702 703

	if (WARN_ON(!fw_domains))
		return;

	/* Ideally GCC would be constant-fold and eliminate this loop */
704
	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
705
		if (domain->wake_count) {
706
			fw_domains &= ~(1 << id);
707 708 709 710
			continue;
		}

		domain->wake_count++;
711
		fw_domain_arm_timer(domain);
712 713 714 715 716 717
	}

	if (fw_domains)
		dev_priv->uncore.funcs.force_wake_get(dev_priv, fw_domains);
}

718 719 720 721 722 723 724 725
#define __vgpu_read(x) \
static u##x \
vgpu_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
	GEN6_READ_HEADER(x); \
	val = __raw_i915_read##x(dev_priv, reg); \
	GEN6_READ_FOOTER; \
}

726 727 728
#define __gen6_read(x) \
static u##x \
gen6_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
729
	GEN6_READ_HEADER(x); \
730
	hsw_unclaimed_reg_debug(dev_priv, reg, true, true); \
731 732
	if (NEEDS_FORCE_WAKE((dev_priv), (reg))) \
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
733
	val = __raw_i915_read##x(dev_priv, reg); \
734
	hsw_unclaimed_reg_debug(dev_priv, reg, true, false); \
735
	GEN6_READ_FOOTER; \
736 737
}

738 739 740
#define __vlv_read(x) \
static u##x \
vlv_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
741
	GEN6_READ_HEADER(x); \
742 743 744 745
	if (FORCEWAKE_VLV_RENDER_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
	else if (FORCEWAKE_VLV_MEDIA_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_MEDIA); \
746
	val = __raw_i915_read##x(dev_priv, reg); \
747
	GEN6_READ_FOOTER; \
748 749
}

750 751 752
#define __chv_read(x) \
static u##x \
chv_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
753
	GEN6_READ_HEADER(x); \
754 755 756 757 758 759 760
	if (FORCEWAKE_CHV_RENDER_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
	else if (FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_MEDIA); \
	else if (FORCEWAKE_CHV_COMMON_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, \
				 FORCEWAKE_RENDER | FORCEWAKE_MEDIA); \
761
	val = __raw_i915_read##x(dev_priv, reg); \
762
	GEN6_READ_FOOTER; \
763
}
764

765 766 767 768 769 770
#define SKL_NEEDS_FORCE_WAKE(dev_priv, reg)	\
	 ((reg) < 0x40000 && !FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg))

#define __gen9_read(x) \
static u##x \
gen9_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
771
	enum forcewake_domains fw_engine; \
772
	GEN6_READ_HEADER(x); \
773 774 775 776 777 778 779 780 781 782 783 784 785
	if (!SKL_NEEDS_FORCE_WAKE((dev_priv), (reg)))	\
		fw_engine = 0; \
	else if (FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg))	\
		fw_engine = FORCEWAKE_RENDER; \
	else if (FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_MEDIA; \
	else if (FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_RENDER | FORCEWAKE_MEDIA; \
	else \
		fw_engine = FORCEWAKE_BLITTER; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
	val = __raw_i915_read##x(dev_priv, reg); \
786
	GEN6_READ_FOOTER; \
787 788
}

789 790 791 792
__vgpu_read(8)
__vgpu_read(16)
__vgpu_read(32)
__vgpu_read(64)
793 794 795 796
__gen9_read(8)
__gen9_read(16)
__gen9_read(32)
__gen9_read(64)
797 798 799 800
__chv_read(8)
__chv_read(16)
__chv_read(32)
__chv_read(64)
801 802 803 804
__vlv_read(8)
__vlv_read(16)
__vlv_read(32)
__vlv_read(64)
805 806 807 808 809
__gen6_read(8)
__gen6_read(16)
__gen6_read(32)
__gen6_read(64)

810
#undef __gen9_read
811
#undef __chv_read
812
#undef __vlv_read
813
#undef __gen6_read
814
#undef __vgpu_read
815 816
#undef GEN6_READ_FOOTER
#undef GEN6_READ_HEADER
B
Ben Widawsky 已提交
817

818
#define GEN2_WRITE_HEADER \
B
Ben Widawsky 已提交
819
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
820
	assert_device_not_suspended(dev_priv); \
821

822
#define GEN2_WRITE_FOOTER
V
Ville Syrjälä 已提交
823

824
#define __gen2_write(x) \
825
static void \
826 827
gen2_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
	GEN2_WRITE_HEADER; \
828
	__raw_i915_write##x(dev_priv, reg, val); \
829
	GEN2_WRITE_FOOTER; \
830 831 832 833 834
}

#define __gen5_write(x) \
static void \
gen5_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
835
	GEN2_WRITE_HEADER; \
836 837
	ilk_dummy_write(dev_priv); \
	__raw_i915_write##x(dev_priv, reg, val); \
838
	GEN2_WRITE_FOOTER; \
839 840
}

841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864
__gen5_write(8)
__gen5_write(16)
__gen5_write(32)
__gen5_write(64)
__gen2_write(8)
__gen2_write(16)
__gen2_write(32)
__gen2_write(64)

#undef __gen5_write
#undef __gen2_write

#undef GEN2_WRITE_FOOTER
#undef GEN2_WRITE_HEADER

#define GEN6_WRITE_HEADER \
	unsigned long irqflags; \
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
	assert_device_not_suspended(dev_priv); \
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags)

#define GEN6_WRITE_FOOTER \
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags)

865 866 867 868
#define __gen6_write(x) \
static void \
gen6_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
	u32 __fifo_ret = 0; \
869
	GEN6_WRITE_HEADER; \
870 871 872 873 874 875 876
	if (NEEDS_FORCE_WAKE((dev_priv), (reg))) { \
		__fifo_ret = __gen6_gt_wait_for_fifo(dev_priv); \
	} \
	__raw_i915_write##x(dev_priv, reg, val); \
	if (unlikely(__fifo_ret)) { \
		gen6_gt_check_fifodbg(dev_priv); \
	} \
877
	GEN6_WRITE_FOOTER; \
878 879 880 881 882
}

#define __hsw_write(x) \
static void \
hsw_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
883
	u32 __fifo_ret = 0; \
884
	GEN6_WRITE_HEADER; \
885 886 887
	if (NEEDS_FORCE_WAKE((dev_priv), (reg))) { \
		__fifo_ret = __gen6_gt_wait_for_fifo(dev_priv); \
	} \
888
	hsw_unclaimed_reg_debug(dev_priv, reg, false, true); \
889
	__raw_i915_write##x(dev_priv, reg, val); \
890 891 892
	if (unlikely(__fifo_ret)) { \
		gen6_gt_check_fifodbg(dev_priv); \
	} \
893 894
	hsw_unclaimed_reg_debug(dev_priv, reg, false, false); \
	hsw_unclaimed_reg_detect(dev_priv); \
895
	GEN6_WRITE_FOOTER; \
896
}
897

898 899 900 901 902 903 904 905
#define __vgpu_write(x) \
static void vgpu_write##x(struct drm_i915_private *dev_priv, \
			  off_t reg, u##x val, bool trace) { \
	GEN6_WRITE_HEADER; \
	__raw_i915_write##x(dev_priv, reg, val); \
	GEN6_WRITE_FOOTER; \
}

906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929
static const u32 gen8_shadowed_regs[] = {
	FORCEWAKE_MT,
	GEN6_RPNSWREQ,
	GEN6_RC_VIDEO_FREQ,
	RING_TAIL(RENDER_RING_BASE),
	RING_TAIL(GEN6_BSD_RING_BASE),
	RING_TAIL(VEBOX_RING_BASE),
	RING_TAIL(BLT_RING_BASE),
	/* TODO: Other registers are not yet used */
};

static bool is_gen8_shadowed(struct drm_i915_private *dev_priv, u32 reg)
{
	int i;
	for (i = 0; i < ARRAY_SIZE(gen8_shadowed_regs); i++)
		if (reg == gen8_shadowed_regs[i])
			return true;

	return false;
}

#define __gen8_write(x) \
static void \
gen8_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
930
	GEN6_WRITE_HEADER; \
931
	hsw_unclaimed_reg_debug(dev_priv, reg, false, true); \
932 933 934
	if (reg < 0x40000 && !is_gen8_shadowed(dev_priv, reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
	__raw_i915_write##x(dev_priv, reg, val); \
935 936
	hsw_unclaimed_reg_debug(dev_priv, reg, false, false); \
	hsw_unclaimed_reg_detect(dev_priv); \
937
	GEN6_WRITE_FOOTER; \
938 939
}

940 941 942 943
#define __chv_write(x) \
static void \
chv_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
	bool shadowed = is_gen8_shadowed(dev_priv, reg); \
944
	GEN6_WRITE_HEADER; \
945
	if (!shadowed) { \
946 947 948 949 950 951
		if (FORCEWAKE_CHV_RENDER_RANGE_OFFSET(reg)) \
			__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
		else if (FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(reg)) \
			__force_wake_get(dev_priv, FORCEWAKE_MEDIA); \
		else if (FORCEWAKE_CHV_COMMON_RANGE_OFFSET(reg)) \
			__force_wake_get(dev_priv, FORCEWAKE_RENDER | FORCEWAKE_MEDIA); \
952 953
	} \
	__raw_i915_write##x(dev_priv, reg, val); \
954
	GEN6_WRITE_FOOTER; \
955 956
}

Z
Zhe Wang 已提交
957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979
static const u32 gen9_shadowed_regs[] = {
	RING_TAIL(RENDER_RING_BASE),
	RING_TAIL(GEN6_BSD_RING_BASE),
	RING_TAIL(VEBOX_RING_BASE),
	RING_TAIL(BLT_RING_BASE),
	FORCEWAKE_BLITTER_GEN9,
	FORCEWAKE_RENDER_GEN9,
	FORCEWAKE_MEDIA_GEN9,
	GEN6_RPNSWREQ,
	GEN6_RC_VIDEO_FREQ,
	/* TODO: Other registers are not yet used */
};

static bool is_gen9_shadowed(struct drm_i915_private *dev_priv, u32 reg)
{
	int i;
	for (i = 0; i < ARRAY_SIZE(gen9_shadowed_regs); i++)
		if (reg == gen9_shadowed_regs[i])
			return true;

	return false;
}

980 981 982 983
#define __gen9_write(x) \
static void \
gen9_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, \
		bool trace) { \
984
	enum forcewake_domains fw_engine; \
985
	GEN6_WRITE_HEADER; \
986 987 988 989 990 991 992 993 994 995 996 997 998 999
	if (!SKL_NEEDS_FORCE_WAKE((dev_priv), (reg)) ||	\
	    is_gen9_shadowed(dev_priv, reg)) \
		fw_engine = 0; \
	else if (FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_RENDER; \
	else if (FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_MEDIA; \
	else if (FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_RENDER | FORCEWAKE_MEDIA; \
	else \
		fw_engine = FORCEWAKE_BLITTER; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
	__raw_i915_write##x(dev_priv, reg, val); \
1000
	GEN6_WRITE_FOOTER; \
1001 1002 1003 1004 1005 1006
}

__gen9_write(8)
__gen9_write(16)
__gen9_write(32)
__gen9_write(64)
1007 1008 1009 1010
__chv_write(8)
__chv_write(16)
__chv_write(32)
__chv_write(64)
1011 1012 1013 1014
__gen8_write(8)
__gen8_write(16)
__gen8_write(32)
__gen8_write(64)
1015 1016 1017 1018 1019 1020 1021 1022
__hsw_write(8)
__hsw_write(16)
__hsw_write(32)
__hsw_write(64)
__gen6_write(8)
__gen6_write(16)
__gen6_write(32)
__gen6_write(64)
1023 1024 1025 1026
__vgpu_write(8)
__vgpu_write(16)
__vgpu_write(32)
__vgpu_write(64)
1027

1028
#undef __gen9_write
1029
#undef __chv_write
1030
#undef __gen8_write
1031 1032
#undef __hsw_write
#undef __gen6_write
1033
#undef __vgpu_write
1034 1035
#undef GEN6_WRITE_FOOTER
#undef GEN6_WRITE_HEADER
1036

1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052
#define ASSIGN_WRITE_MMIO_VFUNCS(x) \
do { \
	dev_priv->uncore.funcs.mmio_writeb = x##_write8; \
	dev_priv->uncore.funcs.mmio_writew = x##_write16; \
	dev_priv->uncore.funcs.mmio_writel = x##_write32; \
	dev_priv->uncore.funcs.mmio_writeq = x##_write64; \
} while (0)

#define ASSIGN_READ_MMIO_VFUNCS(x) \
do { \
	dev_priv->uncore.funcs.mmio_readb = x##_read8; \
	dev_priv->uncore.funcs.mmio_readw = x##_read16; \
	dev_priv->uncore.funcs.mmio_readl = x##_read32; \
	dev_priv->uncore.funcs.mmio_readq = x##_read64; \
} while (0)

1053 1054

static void fw_domain_init(struct drm_i915_private *dev_priv,
1055 1056
			   enum forcewake_domain_id domain_id,
			   u32 reg_set, u32 reg_ack)
1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075
{
	struct intel_uncore_forcewake_domain *d;

	if (WARN_ON(domain_id >= FW_DOMAIN_ID_COUNT))
		return;

	d = &dev_priv->uncore.fw_domain[domain_id];

	WARN_ON(d->wake_count);

	d->wake_count = 0;
	d->reg_set = reg_set;
	d->reg_ack = reg_ack;

	if (IS_GEN6(dev_priv)) {
		d->val_reset = 0;
		d->val_set = FORCEWAKE_KERNEL;
		d->val_clear = 0;
	} else {
1076
		/* WaRsClearFWBitsAtReset:bdw,skl */
1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091
		d->val_reset = _MASKED_BIT_DISABLE(0xffff);
		d->val_set = _MASKED_BIT_ENABLE(FORCEWAKE_KERNEL);
		d->val_clear = _MASKED_BIT_DISABLE(FORCEWAKE_KERNEL);
	}

	if (IS_VALLEYVIEW(dev_priv))
		d->reg_post = FORCEWAKE_ACK_VLV;
	else if (IS_GEN6(dev_priv) || IS_GEN7(dev_priv) || IS_GEN8(dev_priv))
		d->reg_post = ECOBUS;
	else
		d->reg_post = 0;

	d->i915 = dev_priv;
	d->id = domain_id;

1092
	setup_timer(&d->timer, intel_uncore_fw_release_timer, (unsigned long)d);
1093 1094

	dev_priv->uncore.fw_domains |= (1 << domain_id);
1095 1096

	fw_domain_reset(d);
1097 1098
}

1099
static void intel_uncore_fw_domains_init(struct drm_device *dev)
1100 1101 1102
{
	struct drm_i915_private *dev_priv = dev->dev_private;

1103 1104 1105
	if (INTEL_INFO(dev_priv->dev)->gen <= 5)
		return;

Z
Zhe Wang 已提交
1106
	if (IS_GEN9(dev)) {
1107 1108 1109 1110 1111 1112 1113 1114 1115 1116
		dev_priv->uncore.funcs.force_wake_get = fw_domains_get;
		dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_RENDER_GEN9,
			       FORCEWAKE_ACK_RENDER_GEN9);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_BLITTER,
			       FORCEWAKE_BLITTER_GEN9,
			       FORCEWAKE_ACK_BLITTER_GEN9);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_MEDIA,
			       FORCEWAKE_MEDIA_GEN9, FORCEWAKE_ACK_MEDIA_GEN9);
Z
Zhe Wang 已提交
1117
	} else if (IS_VALLEYVIEW(dev)) {
1118
		dev_priv->uncore.funcs.force_wake_get = fw_domains_get;
1119 1120 1121 1122 1123
		if (!IS_CHERRYVIEW(dev))
			dev_priv->uncore.funcs.force_wake_put =
				fw_domains_put_with_fifo;
		else
			dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
1124 1125 1126 1127
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_VLV, FORCEWAKE_ACK_VLV);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_MEDIA,
			       FORCEWAKE_MEDIA_VLV, FORCEWAKE_ACK_MEDIA_VLV);
1128
	} else if (IS_HASWELL(dev) || IS_BROADWELL(dev)) {
1129 1130 1131 1132 1133
		dev_priv->uncore.funcs.force_wake_get =
			fw_domains_get_with_thread_status;
		dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_MT, FORCEWAKE_ACK_HSW);
1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145
	} else if (IS_IVYBRIDGE(dev)) {
		u32 ecobus;

		/* IVB configs may use multi-threaded forcewake */

		/* A small trick here - if the bios hasn't configured
		 * MT forcewake, and if the device is in RC6, then
		 * force_wake_mt_get will not wake the device and the
		 * ECOBUS read will return zero. Which will be
		 * (correctly) interpreted by the test below as MT
		 * forcewake being disabled.
		 */
1146 1147 1148 1149 1150
		dev_priv->uncore.funcs.force_wake_get =
			fw_domains_get_with_thread_status;
		dev_priv->uncore.funcs.force_wake_put =
			fw_domains_put_with_fifo;

1151 1152
		/* We need to init first for ECOBUS access and then
		 * determine later if we want to reinit, in case of MT access is
1153 1154 1155
		 * not working. In this stage we don't know which flavour this
		 * ivb is, so it is better to reset also the gen6 fw registers
		 * before the ecobus check.
1156
		 */
1157 1158 1159 1160

		__raw_i915_write32(dev_priv, FORCEWAKE, 0);
		__raw_posting_read(dev_priv, ECOBUS);

1161 1162
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_MT, FORCEWAKE_MT_ACK);
1163

1164
		mutex_lock(&dev->struct_mutex);
1165
		fw_domains_get_with_thread_status(dev_priv, FORCEWAKE_ALL);
1166
		ecobus = __raw_i915_read32(dev_priv, ECOBUS);
1167
		fw_domains_put_with_fifo(dev_priv, FORCEWAKE_ALL);
1168 1169
		mutex_unlock(&dev->struct_mutex);

1170
		if (!(ecobus & FORCEWAKE_MT_ENABLE)) {
1171 1172
			DRM_INFO("No MT forcewake available on Ivybridge, this can result in issues\n");
			DRM_INFO("when using vblank-synced partial screen updates.\n");
1173 1174
			fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
				       FORCEWAKE, FORCEWAKE_ACK);
1175 1176 1177
		}
	} else if (IS_GEN6(dev)) {
		dev_priv->uncore.funcs.force_wake_get =
1178
			fw_domains_get_with_thread_status;
1179
		dev_priv->uncore.funcs.force_wake_put =
1180 1181 1182
			fw_domains_put_with_fifo;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE, FORCEWAKE_ACK);
1183
	}
1184 1185 1186

	/* All future platforms are expected to require complex power gating */
	WARN_ON(dev_priv->uncore.fw_domains == 0);
1187 1188 1189 1190 1191 1192
}

void intel_uncore_init(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;

1193 1194
	i915_check_vgpu(dev);

1195 1196 1197
	intel_uncore_ellc_detect(dev);
	intel_uncore_fw_domains_init(dev);
	__intel_uncore_early_sanitize(dev, false);
1198

1199
	switch (INTEL_INFO(dev)->gen) {
1200
	default:
1201
		MISSING_CASE(INTEL_INFO(dev)->gen);
1202 1203 1204 1205 1206 1207
		return;
	case 9:
		ASSIGN_WRITE_MMIO_VFUNCS(gen9);
		ASSIGN_READ_MMIO_VFUNCS(gen9);
		break;
	case 8:
1208
		if (IS_CHERRYVIEW(dev)) {
1209 1210
			ASSIGN_WRITE_MMIO_VFUNCS(chv);
			ASSIGN_READ_MMIO_VFUNCS(chv);
1211 1212

		} else {
1213 1214
			ASSIGN_WRITE_MMIO_VFUNCS(gen8);
			ASSIGN_READ_MMIO_VFUNCS(gen6);
1215
		}
1216
		break;
1217 1218
	case 7:
	case 6:
1219
		if (IS_HASWELL(dev)) {
1220
			ASSIGN_WRITE_MMIO_VFUNCS(hsw);
1221
		} else {
1222
			ASSIGN_WRITE_MMIO_VFUNCS(gen6);
1223
		}
1224 1225

		if (IS_VALLEYVIEW(dev)) {
1226
			ASSIGN_READ_MMIO_VFUNCS(vlv);
1227
		} else {
1228
			ASSIGN_READ_MMIO_VFUNCS(gen6);
1229
		}
1230 1231
		break;
	case 5:
1232 1233
		ASSIGN_WRITE_MMIO_VFUNCS(gen5);
		ASSIGN_READ_MMIO_VFUNCS(gen5);
1234 1235 1236 1237
		break;
	case 4:
	case 3:
	case 2:
1238 1239
		ASSIGN_WRITE_MMIO_VFUNCS(gen2);
		ASSIGN_READ_MMIO_VFUNCS(gen2);
1240 1241
		break;
	}
1242

1243 1244 1245 1246 1247
	if (intel_vgpu_active(dev)) {
		ASSIGN_WRITE_MMIO_VFUNCS(vgpu);
		ASSIGN_READ_MMIO_VFUNCS(vgpu);
	}

1248
	i915_check_and_clear_faults(dev);
1249
}
1250 1251
#undef ASSIGN_WRITE_MMIO_VFUNCS
#undef ASSIGN_READ_MMIO_VFUNCS
1252 1253 1254 1255 1256

void intel_uncore_fini(struct drm_device *dev)
{
	/* Paranoia: make sure we have disabled everything before we exit. */
	intel_uncore_sanitize(dev);
1257
	intel_uncore_forcewake_reset(dev, false);
1258 1259
}

1260 1261
#define GEN_RANGE(l, h) GENMASK(h, l)

1262 1263 1264
static const struct register_whitelist {
	uint64_t offset;
	uint32_t size;
1265 1266
	/* supported gens, 0x10 for 4, 0x30 for 4 and 5, etc. */
	uint32_t gen_bitmask;
1267
} whitelist[] = {
1268
	{ RING_TIMESTAMP(RENDER_RING_BASE), 8, GEN_RANGE(4, 9) },
1269 1270 1271 1272 1273 1274 1275 1276
};

int i915_reg_read_ioctl(struct drm_device *dev,
			void *data, struct drm_file *file)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_reg_read *reg = data;
	struct register_whitelist const *entry = whitelist;
1277
	int i, ret = 0;
1278 1279 1280 1281 1282 1283 1284 1285 1286 1287

	for (i = 0; i < ARRAY_SIZE(whitelist); i++, entry++) {
		if (entry->offset == reg->offset &&
		    (1 << INTEL_INFO(dev)->gen & entry->gen_bitmask))
			break;
	}

	if (i == ARRAY_SIZE(whitelist))
		return -EINVAL;

1288 1289
	intel_runtime_pm_get(dev_priv);

1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303
	switch (entry->size) {
	case 8:
		reg->val = I915_READ64(reg->offset);
		break;
	case 4:
		reg->val = I915_READ(reg->offset);
		break;
	case 2:
		reg->val = I915_READ16(reg->offset);
		break;
	case 1:
		reg->val = I915_READ8(reg->offset);
		break;
	default:
1304
		MISSING_CASE(entry->size);
1305 1306
		ret = -EINVAL;
		goto out;
1307 1308
	}

1309 1310 1311
out:
	intel_runtime_pm_put(dev_priv);
	return ret;
1312 1313
}

1314 1315 1316 1317 1318 1319
int i915_get_reset_stats_ioctl(struct drm_device *dev,
			       void *data, struct drm_file *file)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_reset_stats *args = data;
	struct i915_ctx_hang_stats *hs;
1320
	struct intel_context *ctx;
1321 1322
	int ret;

1323 1324 1325
	if (args->flags || args->pad)
		return -EINVAL;

1326
	if (args->ctx_id == DEFAULT_CONTEXT_HANDLE && !capable(CAP_SYS_ADMIN))
1327 1328 1329 1330 1331 1332
		return -EPERM;

	ret = mutex_lock_interruptible(&dev->struct_mutex);
	if (ret)
		return ret;

1333 1334
	ctx = i915_gem_context_get(file->driver_priv, args->ctx_id);
	if (IS_ERR(ctx)) {
1335
		mutex_unlock(&dev->struct_mutex);
1336
		return PTR_ERR(ctx);
1337
	}
1338
	hs = &ctx->hang_stats;
1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 1352

	if (capable(CAP_SYS_ADMIN))
		args->reset_count = i915_reset_count(&dev_priv->gpu_error);
	else
		args->reset_count = 0;

	args->batch_active = hs->batch_active;
	args->batch_pending = hs->batch_pending;

	mutex_unlock(&dev->struct_mutex);

	return 0;
}

1353
static int i915_reset_complete(struct drm_device *dev)
1354 1355
{
	u8 gdrst;
1356
	pci_read_config_byte(dev->pdev, I915_GDRST, &gdrst);
V
Ville Syrjälä 已提交
1357
	return (gdrst & GRDOM_RESET_STATUS) == 0;
1358 1359
}

1360
static int i915_do_reset(struct drm_device *dev)
1361
{
V
Ville Syrjälä 已提交
1362
	/* assert reset for at least 20 usec */
1363
	pci_write_config_byte(dev->pdev, I915_GDRST, GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1364
	udelay(20);
1365
	pci_write_config_byte(dev->pdev, I915_GDRST, 0);
1366

1367
	return wait_for(i915_reset_complete(dev), 500);
V
Ville Syrjälä 已提交
1368 1369 1370 1371 1372
}

static int g4x_reset_complete(struct drm_device *dev)
{
	u8 gdrst;
1373
	pci_read_config_byte(dev->pdev, I915_GDRST, &gdrst);
V
Ville Syrjälä 已提交
1374
	return (gdrst & GRDOM_RESET_ENABLE) == 0;
1375 1376
}

1377 1378 1379 1380 1381 1382
static int g33_do_reset(struct drm_device *dev)
{
	pci_write_config_byte(dev->pdev, I915_GDRST, GRDOM_RESET_ENABLE);
	return wait_for(g4x_reset_complete(dev), 500);
}

1383 1384 1385 1386 1387
static int g4x_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int ret;

1388
	pci_write_config_byte(dev->pdev, I915_GDRST,
1389
			      GRDOM_RENDER | GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1390
	ret =  wait_for(g4x_reset_complete(dev), 500);
1391 1392 1393 1394 1395 1396 1397
	if (ret)
		return ret;

	/* WaVcpClkGateDisableForMediaReset:ctg,elk */
	I915_WRITE(VDECCLK_GATE_D, I915_READ(VDECCLK_GATE_D) | VCP_UNIT_CLOCK_GATE_DISABLE);
	POSTING_READ(VDECCLK_GATE_D);

1398
	pci_write_config_byte(dev->pdev, I915_GDRST,
1399
			      GRDOM_MEDIA | GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1400
	ret =  wait_for(g4x_reset_complete(dev), 500);
1401 1402 1403 1404 1405 1406 1407
	if (ret)
		return ret;

	/* WaVcpClkGateDisableForMediaReset:ctg,elk */
	I915_WRITE(VDECCLK_GATE_D, I915_READ(VDECCLK_GATE_D) & ~VCP_UNIT_CLOCK_GATE_DISABLE);
	POSTING_READ(VDECCLK_GATE_D);

1408
	pci_write_config_byte(dev->pdev, I915_GDRST, 0);
1409 1410 1411 1412

	return 0;
}

1413 1414 1415 1416 1417 1418
static int ironlake_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int ret;

	I915_WRITE(MCHBAR_MIRROR_BASE + ILK_GDSR,
1419
		   ILK_GRDOM_RENDER | ILK_GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1420
	ret = wait_for((I915_READ(MCHBAR_MIRROR_BASE + ILK_GDSR) &
1421
			ILK_GRDOM_RESET_ENABLE) == 0, 500);
1422 1423 1424 1425
	if (ret)
		return ret;

	I915_WRITE(MCHBAR_MIRROR_BASE + ILK_GDSR,
1426
		   ILK_GRDOM_MEDIA | ILK_GRDOM_RESET_ENABLE);
1427 1428 1429 1430 1431 1432 1433 1434
	ret = wait_for((I915_READ(MCHBAR_MIRROR_BASE + ILK_GDSR) &
			ILK_GRDOM_RESET_ENABLE) == 0, 500);
	if (ret)
		return ret;

	I915_WRITE(MCHBAR_MIRROR_BASE + ILK_GDSR, 0);

	return 0;
1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447
}

static int gen6_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int	ret;

	/* Reset the chip */

	/* GEN6_GDRST is not in the gt power well, no need to check
	 * for fifo space for the write or forcewake the chip for
	 * the read
	 */
1448
	__raw_i915_write32(dev_priv, GEN6_GDRST, GEN6_GRDOM_FULL);
1449 1450

	/* Spin waiting for the device to ack the reset request */
1451
	ret = wait_for((__raw_i915_read32(dev_priv, GEN6_GDRST) & GEN6_GRDOM_FULL) == 0, 500);
1452

1453
	intel_uncore_forcewake_reset(dev, true);
1454

1455 1456 1457
	return ret;
}

1458
static int (*intel_get_gpu_reset(struct drm_device *dev))(struct drm_device *)
1459
{
1460
	if (INTEL_INFO(dev)->gen >= 6)
1461
		return gen6_do_reset;
1462
	else if (IS_GEN5(dev))
1463
		return ironlake_do_reset;
1464
	else if (IS_G4X(dev))
1465
		return g4x_do_reset;
1466
	else if (IS_G33(dev))
1467
		return g33_do_reset;
1468
	else if (INTEL_INFO(dev)->gen >= 3)
1469
		return i915_do_reset;
1470
	else
1471 1472 1473 1474 1475 1476 1477 1478 1479
		return NULL;
}

int intel_gpu_reset(struct drm_device *dev)
{
	int (*reset)(struct drm_device *);

	reset = intel_get_gpu_reset(dev);
	if (reset == NULL)
1480
		return -ENODEV;
1481 1482 1483 1484 1485 1486 1487

	return reset(dev);
}

bool intel_has_gpu_reset(struct drm_device *dev)
{
	return intel_get_gpu_reset(dev) != NULL;
1488 1489 1490 1491 1492 1493 1494
}

void intel_uncore_check_errors(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;

	if (HAS_FPGA_DBG_UNCLAIMED(dev) &&
1495
	    (__raw_i915_read32(dev_priv, FPGA_DBG) & FPGA_DBG_RM_NOCLAIM)) {
1496
		DRM_ERROR("Unclaimed register before interrupt\n");
1497
		__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
1498 1499
	}
}