intel_uncore.c 38.8 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/*
 * Copyright © 2013 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */

#include "i915_drv.h"
#include "intel_drv.h"
26
#include "i915_vgpu.h"
27

28 29
#include <linux/pm_runtime.h>

30 31
#define FORCEWAKE_ACK_TIMEOUT_MS 2

32 33 34 35 36 37 38 39 40 41 42 43 44 45
#define __raw_i915_read8(dev_priv__, reg__) readb((dev_priv__)->regs + (reg__))
#define __raw_i915_write8(dev_priv__, reg__, val__) writeb(val__, (dev_priv__)->regs + (reg__))

#define __raw_i915_read16(dev_priv__, reg__) readw((dev_priv__)->regs + (reg__))
#define __raw_i915_write16(dev_priv__, reg__, val__) writew(val__, (dev_priv__)->regs + (reg__))

#define __raw_i915_read32(dev_priv__, reg__) readl((dev_priv__)->regs + (reg__))
#define __raw_i915_write32(dev_priv__, reg__, val__) writel(val__, (dev_priv__)->regs + (reg__))

#define __raw_i915_read64(dev_priv__, reg__) readq((dev_priv__)->regs + (reg__))
#define __raw_i915_write64(dev_priv__, reg__, val__) writeq(val__, (dev_priv__)->regs + (reg__))

#define __raw_posting_read(dev_priv__, reg__) (void)__raw_i915_read32(dev_priv__, reg__)

46 47 48 49 50 51 52
static const char * const forcewake_domain_names[] = {
	"render",
	"blitter",
	"media",
};

const char *
53
intel_uncore_forcewake_domain_to_str(const enum forcewake_domain_id id)
54 55 56 57 58 59 60 61 62 63 64 65
{
	BUILD_BUG_ON((sizeof(forcewake_domain_names)/sizeof(const char *)) !=
		     FW_DOMAIN_ID_COUNT);

	if (id >= 0 && id < FW_DOMAIN_ID_COUNT)
		return forcewake_domain_names[id];

	WARN_ON(id);

	return "unknown";
}

66 67 68
static void
assert_device_not_suspended(struct drm_i915_private *dev_priv)
{
69 70
	WARN_ONCE(HAS_RUNTIME_PM(dev_priv->dev) && dev_priv->pm.suspended,
		  "Device suspended\n");
71
}
72

73 74
static inline void
fw_domain_reset(const struct intel_uncore_forcewake_domain *d)
75
{
76
	WARN_ON(d->reg_set == 0);
77
	__raw_i915_write32(d->i915, d->reg_set, d->val_reset);
78 79
}

80 81
static inline void
fw_domain_arm_timer(struct intel_uncore_forcewake_domain *d)
82
{
83
	mod_timer_pinned(&d->timer, jiffies + 1);
84 85
}

86 87
static inline void
fw_domain_wait_ack_clear(const struct intel_uncore_forcewake_domain *d)
88
{
89 90
	if (wait_for_atomic((__raw_i915_read32(d->i915, d->reg_ack) &
			     FORCEWAKE_KERNEL) == 0,
91
			    FORCEWAKE_ACK_TIMEOUT_MS))
92 93 94
		DRM_ERROR("%s: timed out waiting for forcewake ack to clear.\n",
			  intel_uncore_forcewake_domain_to_str(d->id));
}
95

96 97 98 99 100
static inline void
fw_domain_get(const struct intel_uncore_forcewake_domain *d)
{
	__raw_i915_write32(d->i915, d->reg_set, d->val_set);
}
101

102 103 104 105 106
static inline void
fw_domain_wait_ack(const struct intel_uncore_forcewake_domain *d)
{
	if (wait_for_atomic((__raw_i915_read32(d->i915, d->reg_ack) &
			     FORCEWAKE_KERNEL),
107
			    FORCEWAKE_ACK_TIMEOUT_MS))
108 109 110
		DRM_ERROR("%s: timed out waiting for forcewake ack request.\n",
			  intel_uncore_forcewake_domain_to_str(d->id));
}
111

112 113 114 115
static inline void
fw_domain_put(const struct intel_uncore_forcewake_domain *d)
{
	__raw_i915_write32(d->i915, d->reg_set, d->val_clear);
116 117
}

118 119
static inline void
fw_domain_posting_read(const struct intel_uncore_forcewake_domain *d)
120
{
121 122 123
	/* something from same cacheline, but not from the set register */
	if (d->reg_post)
		__raw_posting_read(d->i915, d->reg_post);
124 125
}

126
static void
127
fw_domains_get(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
128
{
129
	struct intel_uncore_forcewake_domain *d;
130
	enum forcewake_domain_id id;
131

132 133 134 135 136 137
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id) {
		fw_domain_wait_ack_clear(d);
		fw_domain_get(d);
		fw_domain_wait_ack(d);
	}
}
138

139
static void
140
fw_domains_put(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
141 142
{
	struct intel_uncore_forcewake_domain *d;
143
	enum forcewake_domain_id id;
144

145 146 147 148 149
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id) {
		fw_domain_put(d);
		fw_domain_posting_read(d);
	}
}
150

151 152 153 154
static void
fw_domains_posting_read(struct drm_i915_private *dev_priv)
{
	struct intel_uncore_forcewake_domain *d;
155
	enum forcewake_domain_id id;
156 157 158 159 160 161 162 163 164

	/* No need to do for all, just do for first found */
	for_each_fw_domain(d, dev_priv, id) {
		fw_domain_posting_read(d);
		break;
	}
}

static void
165
fw_domains_reset(struct drm_i915_private *dev_priv, enum forcewake_domains fw_domains)
166 167
{
	struct intel_uncore_forcewake_domain *d;
168
	enum forcewake_domain_id id;
169

170 171
	if (dev_priv->uncore.fw_domains == 0)
		return;
172

173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189
	for_each_fw_domain_mask(d, fw_domains, dev_priv, id)
		fw_domain_reset(d);

	fw_domains_posting_read(dev_priv);
}

static void __gen6_gt_wait_for_thread_c0(struct drm_i915_private *dev_priv)
{
	/* w/a for a sporadic read returning 0 by waiting for the GT
	 * thread to wake up.
	 */
	if (wait_for_atomic_us((__raw_i915_read32(dev_priv, GEN6_GT_THREAD_STATUS_REG) &
				GEN6_GT_THREAD_STATUS_CORE_MASK) == 0, 500))
		DRM_ERROR("GT thread status wait timed out\n");
}

static void fw_domains_get_with_thread_status(struct drm_i915_private *dev_priv,
190
					      enum forcewake_domains fw_domains)
191 192
{
	fw_domains_get(dev_priv, fw_domains);
193

194
	/* WaRsForcewakeWaitTC0:snb,ivb,hsw,bdw,vlv */
195
	__gen6_gt_wait_for_thread_c0(dev_priv);
196 197 198 199 200
}

static void gen6_gt_check_fifodbg(struct drm_i915_private *dev_priv)
{
	u32 gtfifodbg;
201 202

	gtfifodbg = __raw_i915_read32(dev_priv, GTFIFODBG);
203 204
	if (WARN(gtfifodbg, "GT wake FIFO error 0x%x\n", gtfifodbg))
		__raw_i915_write32(dev_priv, GTFIFODBG, gtfifodbg);
205 206
}

207
static void fw_domains_put_with_fifo(struct drm_i915_private *dev_priv,
208
				     enum forcewake_domains fw_domains)
209
{
210
	fw_domains_put(dev_priv, fw_domains);
211 212 213
	gen6_gt_check_fifodbg(dev_priv);
}

214 215 216 217 218 219 220
static inline u32 fifo_free_entries(struct drm_i915_private *dev_priv)
{
	u32 count = __raw_i915_read32(dev_priv, GTFIFOCTL);

	return count & GT_FIFO_FREE_ENTRIES_MASK;
}

221 222 223 224
static int __gen6_gt_wait_for_fifo(struct drm_i915_private *dev_priv)
{
	int ret = 0;

225 226 227
	/* On VLV, FIFO will be shared by both SW and HW.
	 * So, we need to read the FREE_ENTRIES everytime */
	if (IS_VALLEYVIEW(dev_priv->dev))
228
		dev_priv->uncore.fifo_count = fifo_free_entries(dev_priv);
229

230 231
	if (dev_priv->uncore.fifo_count < GT_FIFO_NUM_RESERVED_ENTRIES) {
		int loop = 500;
232 233
		u32 fifo = fifo_free_entries(dev_priv);

234 235
		while (fifo <= GT_FIFO_NUM_RESERVED_ENTRIES && loop--) {
			udelay(10);
236
			fifo = fifo_free_entries(dev_priv);
237 238 239 240 241 242 243 244 245 246
		}
		if (WARN_ON(loop < 0 && fifo <= GT_FIFO_NUM_RESERVED_ENTRIES))
			++ret;
		dev_priv->uncore.fifo_count = fifo;
	}
	dev_priv->uncore.fifo_count--;

	return ret;
}

247
static void intel_uncore_fw_release_timer(unsigned long arg)
Z
Zhe Wang 已提交
248
{
249 250
	struct intel_uncore_forcewake_domain *domain = (void *)arg;
	unsigned long irqflags;
Z
Zhe Wang 已提交
251

252
	assert_device_not_suspended(domain->i915);
Z
Zhe Wang 已提交
253

254 255 256 257 258 259 260 261 262
	spin_lock_irqsave(&domain->i915->uncore.lock, irqflags);
	if (WARN_ON(domain->wake_count == 0))
		domain->wake_count++;

	if (--domain->wake_count == 0)
		domain->i915->uncore.funcs.force_wake_put(domain->i915,
							  1 << domain->id);

	spin_unlock_irqrestore(&domain->i915->uncore.lock, irqflags);
Z
Zhe Wang 已提交
263 264
}

265
void intel_uncore_forcewake_reset(struct drm_device *dev, bool restore)
Z
Zhe Wang 已提交
266
{
267
	struct drm_i915_private *dev_priv = dev->dev_private;
268
	unsigned long irqflags;
269
	struct intel_uncore_forcewake_domain *domain;
270 271 272
	int retry_count = 100;
	enum forcewake_domain_id id;
	enum forcewake_domains fw = 0, active_domains;
Z
Zhe Wang 已提交
273

274 275 276 277 278 279
	/* Hold uncore.lock across reset to prevent any register access
	 * with forcewake not set correctly. Wait until all pending
	 * timers are run before holding.
	 */
	while (1) {
		active_domains = 0;
Z
Zhe Wang 已提交
280

281 282 283
		for_each_fw_domain(domain, dev_priv, id) {
			if (del_timer_sync(&domain->timer) == 0)
				continue;
Z
Zhe Wang 已提交
284

285
			intel_uncore_fw_release_timer((unsigned long)domain);
286
		}
287

288
		spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
289

290 291 292 293
		for_each_fw_domain(domain, dev_priv, id) {
			if (timer_pending(&domain->timer))
				active_domains |= (1 << id);
		}
294

295 296
		if (active_domains == 0)
			break;
297

298 299 300 301
		if (--retry_count == 0) {
			DRM_ERROR("Timed out waiting for forcewake timers to finish\n");
			break;
		}
302

303 304 305
		spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
		cond_resched();
	}
306

307 308 309 310 311 312 313 314
	WARN_ON(active_domains);

	for_each_fw_domain(domain, dev_priv, id)
		if (domain->wake_count)
			fw |= 1 << id;

	if (fw)
		dev_priv->uncore.funcs.force_wake_put(dev_priv, fw);
315

316
	fw_domains_reset(dev_priv, FORCEWAKE_ALL);
Z
Zhe Wang 已提交
317

318 319 320 321 322 323
	if (restore) { /* If reset with a user forcewake, try to restore */
		if (fw)
			dev_priv->uncore.funcs.force_wake_get(dev_priv, fw);

		if (IS_GEN6(dev) || IS_GEN7(dev))
			dev_priv->uncore.fifo_count =
324
				fifo_free_entries(dev_priv);
325 326
	}

327
	if (!restore)
328
		assert_forcewakes_inactive(dev_priv);
329

330
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
331 332
}

333
static void intel_uncore_ellc_detect(struct drm_device *dev)
334 335 336
{
	struct drm_i915_private *dev_priv = dev->dev_private;

337 338
	if ((IS_HASWELL(dev) || IS_BROADWELL(dev) ||
	     INTEL_INFO(dev)->gen >= 9) &&
339
	    (__raw_i915_read32(dev_priv, HSW_EDRAM_PRESENT) & EDRAM_ENABLED)) {
340 341 342 343 344 345 346 347
		/* The docs do not explain exactly how the calculation can be
		 * made. It is somewhat guessable, but for now, it's always
		 * 128MB.
		 * NB: We can't write IDICR yet because we do not have gt funcs
		 * set up */
		dev_priv->ellc_size = 128;
		DRM_INFO("Found %zuMB of eLLC\n", dev_priv->ellc_size);
	}
348 349 350 351 352 353 354 355 356
}

static void __intel_uncore_early_sanitize(struct drm_device *dev,
					  bool restore_forcewake)
{
	struct drm_i915_private *dev_priv = dev->dev_private;

	if (HAS_FPGA_DBG_UNCLAIMED(dev))
		__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
357

358 359 360 361 362
	/* clear out old GT FIFO errors */
	if (IS_GEN6(dev) || IS_GEN7(dev))
		__raw_i915_write32(dev_priv, GTFIFODBG,
				   __raw_i915_read32(dev_priv, GTFIFODBG));

363 364 365 366 367 368 369 370
	/* WaDisableShadowRegForCpd:chv */
	if (IS_CHERRYVIEW(dev)) {
		__raw_i915_write32(dev_priv, GTFIFOCTL,
				   __raw_i915_read32(dev_priv, GTFIFOCTL) |
				   GT_FIFO_CTL_BLOCK_ALL_POLICY_STALL |
				   GT_FIFO_CTL_RC6_POLICY_STALL);
	}

371
	intel_uncore_forcewake_reset(dev, restore_forcewake);
372 373
}

374 375 376 377 378 379
void intel_uncore_early_sanitize(struct drm_device *dev, bool restore_forcewake)
{
	__intel_uncore_early_sanitize(dev, restore_forcewake);
	i915_check_and_clear_faults(dev);
}

380 381
void intel_uncore_sanitize(struct drm_device *dev)
{
382 383 384 385
	/* BIOS often leaves RC6 enabled, but disable it for hw init */
	intel_disable_gt_powersave(dev);
}

386 387 388 389 390 391 392 393 394 395 396 397
/**
 * intel_uncore_forcewake_get - grab forcewake domain references
 * @dev_priv: i915 device instance
 * @fw_domains: forcewake domains to get reference on
 *
 * This function can be used get GT's forcewake domain references.
 * Normal register access will handle the forcewake domains automatically.
 * However if some sequence requires the GT to not power down a particular
 * forcewake domains this function should be called at the beginning of the
 * sequence. And subsequently the reference should be dropped by symmetric
 * call to intel_unforce_forcewake_put(). Usually caller wants all the domains
 * to be kept awake so the @fw_domains would be then FORCEWAKE_ALL.
398
 */
399
void intel_uncore_forcewake_get(struct drm_i915_private *dev_priv,
400
				enum forcewake_domains fw_domains)
401 402
{
	unsigned long irqflags;
403
	struct intel_uncore_forcewake_domain *domain;
404
	enum forcewake_domain_id id;
405

406 407 408
	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

409
	WARN_ON(dev_priv->pm.suspended);
410

411 412
	fw_domains &= dev_priv->uncore.fw_domains;

413
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);
Z
Zhe Wang 已提交
414

415 416 417
	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
		if (domain->wake_count++)
			fw_domains &= ~(1 << id);
418
	}
419

420 421 422
	if (fw_domains)
		dev_priv->uncore.funcs.force_wake_get(dev_priv, fw_domains);

423 424 425
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
}

426 427 428 429 430 431 432
/**
 * intel_uncore_forcewake_put - release a forcewake domain reference
 * @dev_priv: i915 device instance
 * @fw_domains: forcewake domains to put references
 *
 * This function drops the device-level forcewakes for specified
 * domains obtained by intel_uncore_forcewake_get().
433
 */
434
void intel_uncore_forcewake_put(struct drm_i915_private *dev_priv,
435
				enum forcewake_domains fw_domains)
436 437
{
	unsigned long irqflags;
438
	struct intel_uncore_forcewake_domain *domain;
439
	enum forcewake_domain_id id;
440

441 442 443
	if (!dev_priv->uncore.funcs.force_wake_put)
		return;

444 445
	fw_domains &= dev_priv->uncore.fw_domains;

446 447
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags);

448 449 450 451 452 453 454 455
	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
		if (WARN_ON(domain->wake_count == 0))
			continue;

		if (--domain->wake_count)
			continue;

		domain->wake_count++;
456
		fw_domain_arm_timer(domain);
457
	}
458

459 460 461
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags);
}

462
void assert_forcewakes_inactive(struct drm_i915_private *dev_priv)
463
{
464
	struct intel_uncore_forcewake_domain *domain;
465
	enum forcewake_domain_id id;
466

467 468 469
	if (!dev_priv->uncore.funcs.force_wake_get)
		return;

470
	for_each_fw_domain(domain, dev_priv, id)
471
		WARN_ON(domain->wake_count);
472 473
}

474 475
/* We give fast paths for the really cool registers */
#define NEEDS_FORCE_WAKE(dev_priv, reg) \
476
	 ((reg) < 0x40000 && (reg) != FORCEWAKE)
477

478
#define REG_RANGE(reg, start, end) ((reg) >= (start) && (reg) < (end))
479

480 481 482 483 484 485 486 487 488 489 490 491 492
#define FORCEWAKE_VLV_RENDER_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x2000, 0x4000) || \
	 REG_RANGE((reg), 0x5000, 0x8000) || \
	 REG_RANGE((reg), 0xB000, 0x12000) || \
	 REG_RANGE((reg), 0x2E000, 0x30000))

#define FORCEWAKE_VLV_MEDIA_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x22000, 0x24000) || \
	 REG_RANGE((reg), 0x30000, 0x40000))

#define FORCEWAKE_CHV_RENDER_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x2000, 0x4000) || \
493
	 REG_RANGE((reg), 0x5200, 0x8000) || \
494
	 REG_RANGE((reg), 0x8300, 0x8500) || \
495
	 REG_RANGE((reg), 0xB000, 0xB480) || \
496 497 498 499 500 501 502 503
	 REG_RANGE((reg), 0xE000, 0xE800))

#define FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x8800, 0x8900) || \
	 REG_RANGE((reg), 0xD000, 0xD800) || \
	 REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x1A000, 0x1C000) || \
	 REG_RANGE((reg), 0x1E800, 0x1EA00) || \
504
	 REG_RANGE((reg), 0x30000, 0x38000))
505 506 507 508 509 510

#define FORCEWAKE_CHV_COMMON_RANGE_OFFSET(reg) \
	(REG_RANGE((reg), 0x4000, 0x5000) || \
	 REG_RANGE((reg), 0x8000, 0x8300) || \
	 REG_RANGE((reg), 0x8500, 0x8600) || \
	 REG_RANGE((reg), 0x9000, 0xB000) || \
511
	 REG_RANGE((reg), 0xF000, 0x10000))
512

513
#define FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg) \
514
	REG_RANGE((reg), 0xB00,  0x2000)
515 516

#define FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg) \
517 518
	(REG_RANGE((reg), 0x2000, 0x2700) || \
	 REG_RANGE((reg), 0x3000, 0x4000) || \
519
	 REG_RANGE((reg), 0x5200, 0x8000) || \
520
	 REG_RANGE((reg), 0x8140, 0x8160) || \
521 522 523
	 REG_RANGE((reg), 0x8300, 0x8500) || \
	 REG_RANGE((reg), 0x8C00, 0x8D00) || \
	 REG_RANGE((reg), 0xB000, 0xB480) || \
524 525
	 REG_RANGE((reg), 0xE000, 0xE900) || \
	 REG_RANGE((reg), 0x24400, 0x24800))
526 527

#define FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg) \
528 529
	(REG_RANGE((reg), 0x8130, 0x8140) || \
	 REG_RANGE((reg), 0x8800, 0x8A00) || \
530 531 532 533 534 535 536 537 538 539 540 541 542 543 544
	 REG_RANGE((reg), 0xD000, 0xD800) || \
	 REG_RANGE((reg), 0x12000, 0x14000) || \
	 REG_RANGE((reg), 0x1A000, 0x1EA00) || \
	 REG_RANGE((reg), 0x30000, 0x40000))

#define FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg) \
	REG_RANGE((reg), 0x9400, 0x9800)

#define FORCEWAKE_GEN9_BLITTER_RANGE_OFFSET(reg) \
	((reg) < 0x40000 &&\
	 !FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg) && \
	 !FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg))

545 546 547 548 549 550
static void
ilk_dummy_write(struct drm_i915_private *dev_priv)
{
	/* WaIssueDummyWriteToWakeupFromRC6:ilk Issue a dummy write to wake up
	 * the chip from rc6 before touching it for real. MI_MODE is masked,
	 * hence harmless to write 0 into. */
551
	__raw_i915_write32(dev_priv, MI_MODE, 0);
552 553 554
}

static void
555 556
hsw_unclaimed_reg_debug(struct drm_i915_private *dev_priv, u32 reg, bool read,
			bool before)
557
{
558 559 560 561 562 563
	const char *op = read ? "reading" : "writing to";
	const char *when = before ? "before" : "after";

	if (!i915.mmio_debug)
		return;

564
	if (__raw_i915_read32(dev_priv, FPGA_DBG) & FPGA_DBG_RM_NOCLAIM) {
565 566
		WARN(1, "Unclaimed register detected %s %s register 0x%x\n",
		     when, op, reg);
567
		__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
568
		i915.mmio_debug--; /* Only report the first N failures */
569 570 571 572
	}
}

static void
573
hsw_unclaimed_reg_detect(struct drm_i915_private *dev_priv)
574
{
575 576 577
	static bool mmio_debug_once = true;

	if (i915.mmio_debug || !mmio_debug_once)
578 579
		return;

580
	if (__raw_i915_read32(dev_priv, FPGA_DBG) & FPGA_DBG_RM_NOCLAIM) {
581 582 583
		DRM_DEBUG("Unclaimed register detected, "
			  "enabling oneshot unclaimed register reporting. "
			  "Please use i915.mmio_debug=N for more information.\n");
584
		__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
585
		i915.mmio_debug = mmio_debug_once--;
586 587 588
	}
}

589
#define GEN2_READ_HEADER(x) \
B
Ben Widawsky 已提交
590
	u##x val = 0; \
591
	assert_device_not_suspended(dev_priv);
B
Ben Widawsky 已提交
592

593
#define GEN2_READ_FOOTER \
B
Ben Widawsky 已提交
594 595 596
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

597
#define __gen2_read(x) \
598
static u##x \
599 600
gen2_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
	GEN2_READ_HEADER(x); \
601
	val = __raw_i915_read##x(dev_priv, reg); \
602
	GEN2_READ_FOOTER; \
603 604 605 606 607
}

#define __gen5_read(x) \
static u##x \
gen5_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
608
	GEN2_READ_HEADER(x); \
609 610
	ilk_dummy_write(dev_priv); \
	val = __raw_i915_read##x(dev_priv, reg); \
611
	GEN2_READ_FOOTER; \
612 613
}

614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639
__gen5_read(8)
__gen5_read(16)
__gen5_read(32)
__gen5_read(64)
__gen2_read(8)
__gen2_read(16)
__gen2_read(32)
__gen2_read(64)

#undef __gen5_read
#undef __gen2_read

#undef GEN2_READ_FOOTER
#undef GEN2_READ_HEADER

#define GEN6_READ_HEADER(x) \
	unsigned long irqflags; \
	u##x val = 0; \
	assert_device_not_suspended(dev_priv); \
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags)

#define GEN6_READ_FOOTER \
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags); \
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

640
static inline void __force_wake_get(struct drm_i915_private *dev_priv,
641
				    enum forcewake_domains fw_domains)
642 643
{
	struct intel_uncore_forcewake_domain *domain;
644
	enum forcewake_domain_id id;
645 646 647 648 649

	if (WARN_ON(!fw_domains))
		return;

	/* Ideally GCC would be constant-fold and eliminate this loop */
650
	for_each_fw_domain_mask(domain, fw_domains, dev_priv, id) {
651
		if (domain->wake_count) {
652
			fw_domains &= ~(1 << id);
653 654 655 656
			continue;
		}

		domain->wake_count++;
657
		fw_domain_arm_timer(domain);
658 659 660 661 662 663
	}

	if (fw_domains)
		dev_priv->uncore.funcs.force_wake_get(dev_priv, fw_domains);
}

664 665 666 667 668 669 670 671
#define __vgpu_read(x) \
static u##x \
vgpu_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
	GEN6_READ_HEADER(x); \
	val = __raw_i915_read##x(dev_priv, reg); \
	GEN6_READ_FOOTER; \
}

672 673 674
#define __gen6_read(x) \
static u##x \
gen6_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
675
	GEN6_READ_HEADER(x); \
676
	hsw_unclaimed_reg_debug(dev_priv, reg, true, true); \
677 678
	if (NEEDS_FORCE_WAKE((dev_priv), (reg))) \
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
679
	val = __raw_i915_read##x(dev_priv, reg); \
680
	hsw_unclaimed_reg_debug(dev_priv, reg, true, false); \
681
	GEN6_READ_FOOTER; \
682 683
}

684 685 686
#define __vlv_read(x) \
static u##x \
vlv_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
687
	GEN6_READ_HEADER(x); \
688 689 690 691
	if (FORCEWAKE_VLV_RENDER_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
	else if (FORCEWAKE_VLV_MEDIA_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_MEDIA); \
692
	val = __raw_i915_read##x(dev_priv, reg); \
693
	GEN6_READ_FOOTER; \
694 695
}

696 697 698
#define __chv_read(x) \
static u##x \
chv_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
699
	GEN6_READ_HEADER(x); \
700 701 702 703 704 705 706
	if (FORCEWAKE_CHV_RENDER_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
	else if (FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_MEDIA); \
	else if (FORCEWAKE_CHV_COMMON_RANGE_OFFSET(reg)) \
		__force_wake_get(dev_priv, \
				 FORCEWAKE_RENDER | FORCEWAKE_MEDIA); \
707
	val = __raw_i915_read##x(dev_priv, reg); \
708
	GEN6_READ_FOOTER; \
709
}
710

711 712 713 714 715 716
#define SKL_NEEDS_FORCE_WAKE(dev_priv, reg)	\
	 ((reg) < 0x40000 && !FORCEWAKE_GEN9_UNCORE_RANGE_OFFSET(reg))

#define __gen9_read(x) \
static u##x \
gen9_read##x(struct drm_i915_private *dev_priv, off_t reg, bool trace) { \
717
	enum forcewake_domains fw_engine; \
718
	GEN6_READ_HEADER(x); \
719 720 721 722 723 724 725 726 727 728 729 730 731
	if (!SKL_NEEDS_FORCE_WAKE((dev_priv), (reg)))	\
		fw_engine = 0; \
	else if (FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg))	\
		fw_engine = FORCEWAKE_RENDER; \
	else if (FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_MEDIA; \
	else if (FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_RENDER | FORCEWAKE_MEDIA; \
	else \
		fw_engine = FORCEWAKE_BLITTER; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
	val = __raw_i915_read##x(dev_priv, reg); \
732
	GEN6_READ_FOOTER; \
733 734
}

735 736 737 738
__vgpu_read(8)
__vgpu_read(16)
__vgpu_read(32)
__vgpu_read(64)
739 740 741 742
__gen9_read(8)
__gen9_read(16)
__gen9_read(32)
__gen9_read(64)
743 744 745 746
__chv_read(8)
__chv_read(16)
__chv_read(32)
__chv_read(64)
747 748 749 750
__vlv_read(8)
__vlv_read(16)
__vlv_read(32)
__vlv_read(64)
751 752 753 754 755
__gen6_read(8)
__gen6_read(16)
__gen6_read(32)
__gen6_read(64)

756
#undef __gen9_read
757
#undef __chv_read
758
#undef __vlv_read
759
#undef __gen6_read
760
#undef __vgpu_read
761 762
#undef GEN6_READ_FOOTER
#undef GEN6_READ_HEADER
B
Ben Widawsky 已提交
763

764
#define GEN2_WRITE_HEADER \
B
Ben Widawsky 已提交
765
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
766
	assert_device_not_suspended(dev_priv); \
767

768
#define GEN2_WRITE_FOOTER
V
Ville Syrjälä 已提交
769

770
#define __gen2_write(x) \
771
static void \
772 773
gen2_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
	GEN2_WRITE_HEADER; \
774
	__raw_i915_write##x(dev_priv, reg, val); \
775
	GEN2_WRITE_FOOTER; \
776 777 778 779 780
}

#define __gen5_write(x) \
static void \
gen5_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
781
	GEN2_WRITE_HEADER; \
782 783
	ilk_dummy_write(dev_priv); \
	__raw_i915_write##x(dev_priv, reg, val); \
784
	GEN2_WRITE_FOOTER; \
785 786
}

787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810
__gen5_write(8)
__gen5_write(16)
__gen5_write(32)
__gen5_write(64)
__gen2_write(8)
__gen2_write(16)
__gen2_write(32)
__gen2_write(64)

#undef __gen5_write
#undef __gen2_write

#undef GEN2_WRITE_FOOTER
#undef GEN2_WRITE_HEADER

#define GEN6_WRITE_HEADER \
	unsigned long irqflags; \
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
	assert_device_not_suspended(dev_priv); \
	spin_lock_irqsave(&dev_priv->uncore.lock, irqflags)

#define GEN6_WRITE_FOOTER \
	spin_unlock_irqrestore(&dev_priv->uncore.lock, irqflags)

811 812 813 814
#define __gen6_write(x) \
static void \
gen6_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
	u32 __fifo_ret = 0; \
815
	GEN6_WRITE_HEADER; \
816 817 818 819 820 821 822
	if (NEEDS_FORCE_WAKE((dev_priv), (reg))) { \
		__fifo_ret = __gen6_gt_wait_for_fifo(dev_priv); \
	} \
	__raw_i915_write##x(dev_priv, reg, val); \
	if (unlikely(__fifo_ret)) { \
		gen6_gt_check_fifodbg(dev_priv); \
	} \
823
	GEN6_WRITE_FOOTER; \
824 825 826 827 828
}

#define __hsw_write(x) \
static void \
hsw_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
829
	u32 __fifo_ret = 0; \
830
	GEN6_WRITE_HEADER; \
831 832 833
	if (NEEDS_FORCE_WAKE((dev_priv), (reg))) { \
		__fifo_ret = __gen6_gt_wait_for_fifo(dev_priv); \
	} \
834
	hsw_unclaimed_reg_debug(dev_priv, reg, false, true); \
835
	__raw_i915_write##x(dev_priv, reg, val); \
836 837 838
	if (unlikely(__fifo_ret)) { \
		gen6_gt_check_fifodbg(dev_priv); \
	} \
839 840
	hsw_unclaimed_reg_debug(dev_priv, reg, false, false); \
	hsw_unclaimed_reg_detect(dev_priv); \
841
	GEN6_WRITE_FOOTER; \
842
}
843

844 845 846 847 848 849 850 851
#define __vgpu_write(x) \
static void vgpu_write##x(struct drm_i915_private *dev_priv, \
			  off_t reg, u##x val, bool trace) { \
	GEN6_WRITE_HEADER; \
	__raw_i915_write##x(dev_priv, reg, val); \
	GEN6_WRITE_FOOTER; \
}

852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875
static const u32 gen8_shadowed_regs[] = {
	FORCEWAKE_MT,
	GEN6_RPNSWREQ,
	GEN6_RC_VIDEO_FREQ,
	RING_TAIL(RENDER_RING_BASE),
	RING_TAIL(GEN6_BSD_RING_BASE),
	RING_TAIL(VEBOX_RING_BASE),
	RING_TAIL(BLT_RING_BASE),
	/* TODO: Other registers are not yet used */
};

static bool is_gen8_shadowed(struct drm_i915_private *dev_priv, u32 reg)
{
	int i;
	for (i = 0; i < ARRAY_SIZE(gen8_shadowed_regs); i++)
		if (reg == gen8_shadowed_regs[i])
			return true;

	return false;
}

#define __gen8_write(x) \
static void \
gen8_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
876
	GEN6_WRITE_HEADER; \
877
	hsw_unclaimed_reg_debug(dev_priv, reg, false, true); \
878 879 880
	if (reg < 0x40000 && !is_gen8_shadowed(dev_priv, reg)) \
		__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
	__raw_i915_write##x(dev_priv, reg, val); \
881 882
	hsw_unclaimed_reg_debug(dev_priv, reg, false, false); \
	hsw_unclaimed_reg_detect(dev_priv); \
883
	GEN6_WRITE_FOOTER; \
884 885
}

886 887 888 889
#define __chv_write(x) \
static void \
chv_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, bool trace) { \
	bool shadowed = is_gen8_shadowed(dev_priv, reg); \
890
	GEN6_WRITE_HEADER; \
891
	if (!shadowed) { \
892 893 894 895 896 897
		if (FORCEWAKE_CHV_RENDER_RANGE_OFFSET(reg)) \
			__force_wake_get(dev_priv, FORCEWAKE_RENDER); \
		else if (FORCEWAKE_CHV_MEDIA_RANGE_OFFSET(reg)) \
			__force_wake_get(dev_priv, FORCEWAKE_MEDIA); \
		else if (FORCEWAKE_CHV_COMMON_RANGE_OFFSET(reg)) \
			__force_wake_get(dev_priv, FORCEWAKE_RENDER | FORCEWAKE_MEDIA); \
898 899
	} \
	__raw_i915_write##x(dev_priv, reg, val); \
900
	GEN6_WRITE_FOOTER; \
901 902
}

Z
Zhe Wang 已提交
903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925
static const u32 gen9_shadowed_regs[] = {
	RING_TAIL(RENDER_RING_BASE),
	RING_TAIL(GEN6_BSD_RING_BASE),
	RING_TAIL(VEBOX_RING_BASE),
	RING_TAIL(BLT_RING_BASE),
	FORCEWAKE_BLITTER_GEN9,
	FORCEWAKE_RENDER_GEN9,
	FORCEWAKE_MEDIA_GEN9,
	GEN6_RPNSWREQ,
	GEN6_RC_VIDEO_FREQ,
	/* TODO: Other registers are not yet used */
};

static bool is_gen9_shadowed(struct drm_i915_private *dev_priv, u32 reg)
{
	int i;
	for (i = 0; i < ARRAY_SIZE(gen9_shadowed_regs); i++)
		if (reg == gen9_shadowed_regs[i])
			return true;

	return false;
}

926 927 928 929
#define __gen9_write(x) \
static void \
gen9_write##x(struct drm_i915_private *dev_priv, off_t reg, u##x val, \
		bool trace) { \
930
	enum forcewake_domains fw_engine; \
931
	GEN6_WRITE_HEADER; \
932 933 934 935 936 937 938 939 940 941 942 943 944 945
	if (!SKL_NEEDS_FORCE_WAKE((dev_priv), (reg)) ||	\
	    is_gen9_shadowed(dev_priv, reg)) \
		fw_engine = 0; \
	else if (FORCEWAKE_GEN9_RENDER_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_RENDER; \
	else if (FORCEWAKE_GEN9_MEDIA_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_MEDIA; \
	else if (FORCEWAKE_GEN9_COMMON_RANGE_OFFSET(reg)) \
		fw_engine = FORCEWAKE_RENDER | FORCEWAKE_MEDIA; \
	else \
		fw_engine = FORCEWAKE_BLITTER; \
	if (fw_engine) \
		__force_wake_get(dev_priv, fw_engine); \
	__raw_i915_write##x(dev_priv, reg, val); \
946
	GEN6_WRITE_FOOTER; \
947 948 949 950 951 952
}

__gen9_write(8)
__gen9_write(16)
__gen9_write(32)
__gen9_write(64)
953 954 955 956
__chv_write(8)
__chv_write(16)
__chv_write(32)
__chv_write(64)
957 958 959 960
__gen8_write(8)
__gen8_write(16)
__gen8_write(32)
__gen8_write(64)
961 962 963 964 965 966 967 968
__hsw_write(8)
__hsw_write(16)
__hsw_write(32)
__hsw_write(64)
__gen6_write(8)
__gen6_write(16)
__gen6_write(32)
__gen6_write(64)
969 970 971 972
__vgpu_write(8)
__vgpu_write(16)
__vgpu_write(32)
__vgpu_write(64)
973

974
#undef __gen9_write
975
#undef __chv_write
976
#undef __gen8_write
977 978
#undef __hsw_write
#undef __gen6_write
979
#undef __vgpu_write
980 981
#undef GEN6_WRITE_FOOTER
#undef GEN6_WRITE_HEADER
982

983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998
#define ASSIGN_WRITE_MMIO_VFUNCS(x) \
do { \
	dev_priv->uncore.funcs.mmio_writeb = x##_write8; \
	dev_priv->uncore.funcs.mmio_writew = x##_write16; \
	dev_priv->uncore.funcs.mmio_writel = x##_write32; \
	dev_priv->uncore.funcs.mmio_writeq = x##_write64; \
} while (0)

#define ASSIGN_READ_MMIO_VFUNCS(x) \
do { \
	dev_priv->uncore.funcs.mmio_readb = x##_read8; \
	dev_priv->uncore.funcs.mmio_readw = x##_read16; \
	dev_priv->uncore.funcs.mmio_readl = x##_read32; \
	dev_priv->uncore.funcs.mmio_readq = x##_read64; \
} while (0)

999 1000

static void fw_domain_init(struct drm_i915_private *dev_priv,
1001 1002
			   enum forcewake_domain_id domain_id,
			   u32 reg_set, u32 reg_ack)
1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021
{
	struct intel_uncore_forcewake_domain *d;

	if (WARN_ON(domain_id >= FW_DOMAIN_ID_COUNT))
		return;

	d = &dev_priv->uncore.fw_domain[domain_id];

	WARN_ON(d->wake_count);

	d->wake_count = 0;
	d->reg_set = reg_set;
	d->reg_ack = reg_ack;

	if (IS_GEN6(dev_priv)) {
		d->val_reset = 0;
		d->val_set = FORCEWAKE_KERNEL;
		d->val_clear = 0;
	} else {
1022
		/* WaRsClearFWBitsAtReset:bdw,skl */
1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037
		d->val_reset = _MASKED_BIT_DISABLE(0xffff);
		d->val_set = _MASKED_BIT_ENABLE(FORCEWAKE_KERNEL);
		d->val_clear = _MASKED_BIT_DISABLE(FORCEWAKE_KERNEL);
	}

	if (IS_VALLEYVIEW(dev_priv))
		d->reg_post = FORCEWAKE_ACK_VLV;
	else if (IS_GEN6(dev_priv) || IS_GEN7(dev_priv) || IS_GEN8(dev_priv))
		d->reg_post = ECOBUS;
	else
		d->reg_post = 0;

	d->i915 = dev_priv;
	d->id = domain_id;

1038
	setup_timer(&d->timer, intel_uncore_fw_release_timer, (unsigned long)d);
1039 1040

	dev_priv->uncore.fw_domains |= (1 << domain_id);
1041 1042

	fw_domain_reset(d);
1043 1044
}

1045
static void intel_uncore_fw_domains_init(struct drm_device *dev)
1046 1047 1048
{
	struct drm_i915_private *dev_priv = dev->dev_private;

1049 1050 1051
	if (INTEL_INFO(dev_priv->dev)->gen <= 5)
		return;

Z
Zhe Wang 已提交
1052
	if (IS_GEN9(dev)) {
1053 1054 1055 1056 1057 1058 1059 1060 1061 1062
		dev_priv->uncore.funcs.force_wake_get = fw_domains_get;
		dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_RENDER_GEN9,
			       FORCEWAKE_ACK_RENDER_GEN9);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_BLITTER,
			       FORCEWAKE_BLITTER_GEN9,
			       FORCEWAKE_ACK_BLITTER_GEN9);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_MEDIA,
			       FORCEWAKE_MEDIA_GEN9, FORCEWAKE_ACK_MEDIA_GEN9);
Z
Zhe Wang 已提交
1063
	} else if (IS_VALLEYVIEW(dev)) {
1064
		dev_priv->uncore.funcs.force_wake_get = fw_domains_get;
1065 1066 1067 1068 1069
		if (!IS_CHERRYVIEW(dev))
			dev_priv->uncore.funcs.force_wake_put =
				fw_domains_put_with_fifo;
		else
			dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
1070 1071 1072 1073
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_VLV, FORCEWAKE_ACK_VLV);
		fw_domain_init(dev_priv, FW_DOMAIN_ID_MEDIA,
			       FORCEWAKE_MEDIA_VLV, FORCEWAKE_ACK_MEDIA_VLV);
1074
	} else if (IS_HASWELL(dev) || IS_BROADWELL(dev)) {
1075 1076 1077 1078 1079
		dev_priv->uncore.funcs.force_wake_get =
			fw_domains_get_with_thread_status;
		dev_priv->uncore.funcs.force_wake_put = fw_domains_put;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_MT, FORCEWAKE_ACK_HSW);
1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091
	} else if (IS_IVYBRIDGE(dev)) {
		u32 ecobus;

		/* IVB configs may use multi-threaded forcewake */

		/* A small trick here - if the bios hasn't configured
		 * MT forcewake, and if the device is in RC6, then
		 * force_wake_mt_get will not wake the device and the
		 * ECOBUS read will return zero. Which will be
		 * (correctly) interpreted by the test below as MT
		 * forcewake being disabled.
		 */
1092 1093 1094 1095 1096
		dev_priv->uncore.funcs.force_wake_get =
			fw_domains_get_with_thread_status;
		dev_priv->uncore.funcs.force_wake_put =
			fw_domains_put_with_fifo;

1097 1098
		/* We need to init first for ECOBUS access and then
		 * determine later if we want to reinit, in case of MT access is
1099 1100 1101
		 * not working. In this stage we don't know which flavour this
		 * ivb is, so it is better to reset also the gen6 fw registers
		 * before the ecobus check.
1102
		 */
1103 1104 1105 1106

		__raw_i915_write32(dev_priv, FORCEWAKE, 0);
		__raw_posting_read(dev_priv, ECOBUS);

1107 1108
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE_MT, FORCEWAKE_MT_ACK);
1109

1110
		mutex_lock(&dev->struct_mutex);
1111
		fw_domains_get_with_thread_status(dev_priv, FORCEWAKE_ALL);
1112
		ecobus = __raw_i915_read32(dev_priv, ECOBUS);
1113
		fw_domains_put_with_fifo(dev_priv, FORCEWAKE_ALL);
1114 1115
		mutex_unlock(&dev->struct_mutex);

1116
		if (!(ecobus & FORCEWAKE_MT_ENABLE)) {
1117 1118
			DRM_INFO("No MT forcewake available on Ivybridge, this can result in issues\n");
			DRM_INFO("when using vblank-synced partial screen updates.\n");
1119 1120
			fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
				       FORCEWAKE, FORCEWAKE_ACK);
1121 1122 1123
		}
	} else if (IS_GEN6(dev)) {
		dev_priv->uncore.funcs.force_wake_get =
1124
			fw_domains_get_with_thread_status;
1125
		dev_priv->uncore.funcs.force_wake_put =
1126 1127 1128
			fw_domains_put_with_fifo;
		fw_domain_init(dev_priv, FW_DOMAIN_ID_RENDER,
			       FORCEWAKE, FORCEWAKE_ACK);
1129
	}
1130 1131 1132

	/* All future platforms are expected to require complex power gating */
	WARN_ON(dev_priv->uncore.fw_domains == 0);
1133 1134 1135 1136 1137 1138
}

void intel_uncore_init(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;

1139 1140
	i915_check_vgpu(dev);

1141 1142 1143
	intel_uncore_ellc_detect(dev);
	intel_uncore_fw_domains_init(dev);
	__intel_uncore_early_sanitize(dev, false);
1144

1145
	switch (INTEL_INFO(dev)->gen) {
1146
	default:
1147
		MISSING_CASE(INTEL_INFO(dev)->gen);
1148 1149 1150 1151 1152 1153
		return;
	case 9:
		ASSIGN_WRITE_MMIO_VFUNCS(gen9);
		ASSIGN_READ_MMIO_VFUNCS(gen9);
		break;
	case 8:
1154
		if (IS_CHERRYVIEW(dev)) {
1155 1156
			ASSIGN_WRITE_MMIO_VFUNCS(chv);
			ASSIGN_READ_MMIO_VFUNCS(chv);
1157 1158

		} else {
1159 1160
			ASSIGN_WRITE_MMIO_VFUNCS(gen8);
			ASSIGN_READ_MMIO_VFUNCS(gen6);
1161
		}
1162
		break;
1163 1164
	case 7:
	case 6:
1165
		if (IS_HASWELL(dev)) {
1166
			ASSIGN_WRITE_MMIO_VFUNCS(hsw);
1167
		} else {
1168
			ASSIGN_WRITE_MMIO_VFUNCS(gen6);
1169
		}
1170 1171

		if (IS_VALLEYVIEW(dev)) {
1172
			ASSIGN_READ_MMIO_VFUNCS(vlv);
1173
		} else {
1174
			ASSIGN_READ_MMIO_VFUNCS(gen6);
1175
		}
1176 1177
		break;
	case 5:
1178 1179
		ASSIGN_WRITE_MMIO_VFUNCS(gen5);
		ASSIGN_READ_MMIO_VFUNCS(gen5);
1180 1181 1182 1183
		break;
	case 4:
	case 3:
	case 2:
1184 1185
		ASSIGN_WRITE_MMIO_VFUNCS(gen2);
		ASSIGN_READ_MMIO_VFUNCS(gen2);
1186 1187
		break;
	}
1188

1189 1190 1191 1192 1193
	if (intel_vgpu_active(dev)) {
		ASSIGN_WRITE_MMIO_VFUNCS(vgpu);
		ASSIGN_READ_MMIO_VFUNCS(vgpu);
	}

1194
	i915_check_and_clear_faults(dev);
1195
}
1196 1197
#undef ASSIGN_WRITE_MMIO_VFUNCS
#undef ASSIGN_READ_MMIO_VFUNCS
1198 1199 1200 1201 1202

void intel_uncore_fini(struct drm_device *dev)
{
	/* Paranoia: make sure we have disabled everything before we exit. */
	intel_uncore_sanitize(dev);
1203
	intel_uncore_forcewake_reset(dev, false);
1204 1205
}

1206 1207
#define GEN_RANGE(l, h) GENMASK(h, l)

1208 1209 1210
static const struct register_whitelist {
	uint64_t offset;
	uint32_t size;
1211 1212
	/* supported gens, 0x10 for 4, 0x30 for 4 and 5, etc. */
	uint32_t gen_bitmask;
1213
} whitelist[] = {
1214
	{ RING_TIMESTAMP(RENDER_RING_BASE), 8, GEN_RANGE(4, 9) },
1215 1216 1217 1218 1219 1220 1221 1222
};

int i915_reg_read_ioctl(struct drm_device *dev,
			void *data, struct drm_file *file)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_reg_read *reg = data;
	struct register_whitelist const *entry = whitelist;
1223
	int i, ret = 0;
1224 1225 1226 1227 1228 1229 1230 1231 1232 1233

	for (i = 0; i < ARRAY_SIZE(whitelist); i++, entry++) {
		if (entry->offset == reg->offset &&
		    (1 << INTEL_INFO(dev)->gen & entry->gen_bitmask))
			break;
	}

	if (i == ARRAY_SIZE(whitelist))
		return -EINVAL;

1234 1235
	intel_runtime_pm_get(dev_priv);

1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249
	switch (entry->size) {
	case 8:
		reg->val = I915_READ64(reg->offset);
		break;
	case 4:
		reg->val = I915_READ(reg->offset);
		break;
	case 2:
		reg->val = I915_READ16(reg->offset);
		break;
	case 1:
		reg->val = I915_READ8(reg->offset);
		break;
	default:
1250
		MISSING_CASE(entry->size);
1251 1252
		ret = -EINVAL;
		goto out;
1253 1254
	}

1255 1256 1257
out:
	intel_runtime_pm_put(dev_priv);
	return ret;
1258 1259
}

1260 1261 1262 1263 1264 1265
int i915_get_reset_stats_ioctl(struct drm_device *dev,
			       void *data, struct drm_file *file)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_reset_stats *args = data;
	struct i915_ctx_hang_stats *hs;
1266
	struct intel_context *ctx;
1267 1268
	int ret;

1269 1270 1271
	if (args->flags || args->pad)
		return -EINVAL;

1272
	if (args->ctx_id == DEFAULT_CONTEXT_HANDLE && !capable(CAP_SYS_ADMIN))
1273 1274 1275 1276 1277 1278
		return -EPERM;

	ret = mutex_lock_interruptible(&dev->struct_mutex);
	if (ret)
		return ret;

1279 1280
	ctx = i915_gem_context_get(file->driver_priv, args->ctx_id);
	if (IS_ERR(ctx)) {
1281
		mutex_unlock(&dev->struct_mutex);
1282
		return PTR_ERR(ctx);
1283
	}
1284
	hs = &ctx->hang_stats;
1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298

	if (capable(CAP_SYS_ADMIN))
		args->reset_count = i915_reset_count(&dev_priv->gpu_error);
	else
		args->reset_count = 0;

	args->batch_active = hs->batch_active;
	args->batch_pending = hs->batch_pending;

	mutex_unlock(&dev->struct_mutex);

	return 0;
}

1299
static int i915_reset_complete(struct drm_device *dev)
1300 1301
{
	u8 gdrst;
1302
	pci_read_config_byte(dev->pdev, I915_GDRST, &gdrst);
V
Ville Syrjälä 已提交
1303
	return (gdrst & GRDOM_RESET_STATUS) == 0;
1304 1305
}

1306
static int i915_do_reset(struct drm_device *dev)
1307
{
V
Ville Syrjälä 已提交
1308
	/* assert reset for at least 20 usec */
1309
	pci_write_config_byte(dev->pdev, I915_GDRST, GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1310
	udelay(20);
1311
	pci_write_config_byte(dev->pdev, I915_GDRST, 0);
1312

1313
	return wait_for(i915_reset_complete(dev), 500);
V
Ville Syrjälä 已提交
1314 1315 1316 1317 1318
}

static int g4x_reset_complete(struct drm_device *dev)
{
	u8 gdrst;
1319
	pci_read_config_byte(dev->pdev, I915_GDRST, &gdrst);
V
Ville Syrjälä 已提交
1320
	return (gdrst & GRDOM_RESET_ENABLE) == 0;
1321 1322
}

1323 1324 1325 1326 1327 1328
static int g33_do_reset(struct drm_device *dev)
{
	pci_write_config_byte(dev->pdev, I915_GDRST, GRDOM_RESET_ENABLE);
	return wait_for(g4x_reset_complete(dev), 500);
}

1329 1330 1331 1332 1333
static int g4x_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int ret;

1334
	pci_write_config_byte(dev->pdev, I915_GDRST,
1335
			      GRDOM_RENDER | GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1336
	ret =  wait_for(g4x_reset_complete(dev), 500);
1337 1338 1339 1340 1341 1342 1343
	if (ret)
		return ret;

	/* WaVcpClkGateDisableForMediaReset:ctg,elk */
	I915_WRITE(VDECCLK_GATE_D, I915_READ(VDECCLK_GATE_D) | VCP_UNIT_CLOCK_GATE_DISABLE);
	POSTING_READ(VDECCLK_GATE_D);

1344
	pci_write_config_byte(dev->pdev, I915_GDRST,
1345
			      GRDOM_MEDIA | GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1346
	ret =  wait_for(g4x_reset_complete(dev), 500);
1347 1348 1349 1350 1351 1352 1353
	if (ret)
		return ret;

	/* WaVcpClkGateDisableForMediaReset:ctg,elk */
	I915_WRITE(VDECCLK_GATE_D, I915_READ(VDECCLK_GATE_D) & ~VCP_UNIT_CLOCK_GATE_DISABLE);
	POSTING_READ(VDECCLK_GATE_D);

1354
	pci_write_config_byte(dev->pdev, I915_GDRST, 0);
1355 1356 1357 1358

	return 0;
}

1359 1360 1361 1362 1363 1364
static int ironlake_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int ret;

	I915_WRITE(MCHBAR_MIRROR_BASE + ILK_GDSR,
1365
		   ILK_GRDOM_RENDER | ILK_GRDOM_RESET_ENABLE);
V
Ville Syrjälä 已提交
1366
	ret = wait_for((I915_READ(MCHBAR_MIRROR_BASE + ILK_GDSR) &
1367
			ILK_GRDOM_RESET_ENABLE) == 0, 500);
1368 1369 1370 1371
	if (ret)
		return ret;

	I915_WRITE(MCHBAR_MIRROR_BASE + ILK_GDSR,
1372
		   ILK_GRDOM_MEDIA | ILK_GRDOM_RESET_ENABLE);
1373 1374 1375 1376 1377 1378 1379 1380
	ret = wait_for((I915_READ(MCHBAR_MIRROR_BASE + ILK_GDSR) &
			ILK_GRDOM_RESET_ENABLE) == 0, 500);
	if (ret)
		return ret;

	I915_WRITE(MCHBAR_MIRROR_BASE + ILK_GDSR, 0);

	return 0;
1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393
}

static int gen6_do_reset(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	int	ret;

	/* Reset the chip */

	/* GEN6_GDRST is not in the gt power well, no need to check
	 * for fifo space for the write or forcewake the chip for
	 * the read
	 */
1394
	__raw_i915_write32(dev_priv, GEN6_GDRST, GEN6_GRDOM_FULL);
1395 1396

	/* Spin waiting for the device to ack the reset request */
1397
	ret = wait_for((__raw_i915_read32(dev_priv, GEN6_GDRST) & GEN6_GRDOM_FULL) == 0, 500);
1398

1399
	intel_uncore_forcewake_reset(dev, true);
1400

1401 1402 1403 1404 1405
	return ret;
}

int intel_gpu_reset(struct drm_device *dev)
{
1406 1407 1408 1409 1410 1411
	if (INTEL_INFO(dev)->gen >= 6)
		return gen6_do_reset(dev);
	else if (IS_GEN5(dev))
		return ironlake_do_reset(dev);
	else if (IS_G4X(dev))
		return g4x_do_reset(dev);
1412 1413 1414
	else if (IS_G33(dev))
		return g33_do_reset(dev);
	else if (INTEL_INFO(dev)->gen >= 3)
1415
		return i915_do_reset(dev);
1416 1417
	else
		return -ENODEV;
1418 1419 1420 1421 1422 1423 1424
}

void intel_uncore_check_errors(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;

	if (HAS_FPGA_DBG_UNCLAIMED(dev) &&
1425
	    (__raw_i915_read32(dev_priv, FPGA_DBG) & FPGA_DBG_RM_NOCLAIM)) {
1426
		DRM_ERROR("Unclaimed register before interrupt\n");
1427
		__raw_i915_write32(dev_priv, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
1428 1429
	}
}