intel_uncore.c 57.8 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * Copyright © 2013 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */

24 25 26
#include <linux/pm_runtime.h>
#include <asm/iosf_mbi.h>

27
#include "i915_drv.h"
28
#include "i915_trace.h"
29
#include "i915_vgpu.h"
30
#include "intel_pm.h"
31

32
#define FORCEWAKE_ACK_TIMEOUT_MS 50
33
#define GT_FIFO_TIMEOUT_MS	 10
34

35
#define __raw_posting_read(...) ((void)__raw_uncore_read32(__VA_ARGS__))
36

37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62
void
intel_uncore_mmio_debug_init_early(struct intel_uncore_mmio_debug *mmio_debug)
{
	spin_lock_init(&mmio_debug->lock);
	mmio_debug->unclaimed_mmio_check = 1;
}

static void mmio_debug_suspend(struct intel_uncore_mmio_debug *mmio_debug)
{
	lockdep_assert_held(&mmio_debug->lock);

	/* Save and disable mmio debugging for the user bypass */
	if (!mmio_debug->suspend_count++) {
		mmio_debug->saved_mmio_check = mmio_debug->unclaimed_mmio_check;
		mmio_debug->unclaimed_mmio_check = 0;
	}
}

static void mmio_debug_resume(struct intel_uncore_mmio_debug *mmio_debug)
{
	lockdep_assert_held(&mmio_debug->lock);

	if (!--mmio_debug->suspend_count)
		mmio_debug->unclaimed_mmio_check = mmio_debug->saved_mmio_check;
}

63 64 65 66
static const char * const forcewake_domain_names[] = {
	"render",
	"blitter",
	"media",
67 68 69 70 71 72
	"vdbox0",
	"vdbox1",
	"vdbox2",
	"vdbox3",
	"vebox0",
	"vebox1",
73 74 75
};

const char *
76
intel_uncore_forcewake_domain_to_str(const enum forcewake_domain_id id)
77
{
78
	BUILD_BUG_ON(ARRAY_SIZE(forcewake_domain_names) != FW_DOMAIN_ID_COUNT);
79 80 81 82 83 84 85 86 87

	if (id >= 0 && id < FW_DOMAIN_ID_COUNT)
		return forcewake_domain_names[id];

	WARN_ON(id);

	return "unknown";
}

88
#define fw_ack(d) readl((d)->reg_ack)
89 90
#define fw_set(d, val) writel(_MASKED_BIT_ENABLE((val)), (d)->reg_set)
#define fw_clear(d, val) writel(_MASKED_BIT_DISABLE((val)), (d)->reg_set)
91

92
static inline void
93
fw_domain_reset(const struct intel_uncore_forcewake_domain *d)
94
{
95 96 97 98 99
	/*
	 * We don't really know if the powerwell for the forcewake domain we are
	 * trying to reset here does exist at this point (engines could be fused
	 * off in ICL+), so no waiting for acks
	 */
100 101
	/* WaRsClearFWBitsAtReset:bdw,skl */
	fw_clear(d, 0xffff);
102 103
}

104 105
static inline void
fw_domain_arm_timer(struct intel_uncore_forcewake_domain *d)
106
{
107 108
	GEM_BUG_ON(d->uncore->fw_domains_timer & d->mask);
	d->uncore->fw_domains_timer |= d->mask;
109 110
	d->wake_count++;
	hrtimer_start_range_ns(&d->timer,
T
Thomas Gleixner 已提交
111
			       NSEC_PER_MSEC,
112 113
			       NSEC_PER_MSEC,
			       HRTIMER_MODE_REL);
114 115
}

116
static inline int
117
__wait_for_ack(const struct intel_uncore_forcewake_domain *d,
118 119 120
	       const u32 ack,
	       const u32 value)
{
121
	return wait_for_atomic((fw_ack(d) & ack) == value,
122 123 124 125
			       FORCEWAKE_ACK_TIMEOUT_MS);
}

static inline int
126
wait_ack_clear(const struct intel_uncore_forcewake_domain *d,
127 128
	       const u32 ack)
{
129
	return __wait_for_ack(d, ack, 0);
130 131 132
}

static inline int
133
wait_ack_set(const struct intel_uncore_forcewake_domain *d,
134 135
	     const u32 ack)
{
136
	return __wait_for_ack(d, ack, ack);
137 138
}

139
static inline void
140
fw_domain_wait_ack_clear(const struct intel_uncore_forcewake_domain *d)
141
{
142
	if (wait_ack_clear(d, FORCEWAKE_KERNEL)) {
143 144
		DRM_ERROR("%s: timed out waiting for forcewake ack to clear.\n",
			  intel_uncore_forcewake_domain_to_str(d->id));
145 146
		add_taint_for_CI(TAINT_WARN); /* CI now unreliable */
	}
147
}
148

149 150 151 152 153 154
enum ack_type {
	ACK_CLEAR = 0,
	ACK_SET
};

static int
155
fw_domain_wait_ack_with_fallback(const struct intel_uncore_forcewake_domain *d,
156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171
				 const enum ack_type type)
{
	const u32 ack_bit = FORCEWAKE_KERNEL;
	const u32 value = type == ACK_SET ? ack_bit : 0;
	unsigned int pass;
	bool ack_detected;

	/*
	 * There is a possibility of driver's wake request colliding
	 * with hardware's own wake requests and that can cause
	 * hardware to not deliver the driver's ack message.
	 *
	 * Use a fallback bit toggle to kick the gpu state machine
	 * in the hope that the original ack will be delivered along with
	 * the fallback ack.
	 *
172 173 174
	 * This workaround is described in HSDES #1604254524 and it's known as:
	 * WaRsForcewakeAddDelayForAck:skl,bxt,kbl,glk,cfl,cnl,icl
	 * although the name is a bit misleading.
175 176 177 178
	 */

	pass = 1;
	do {
179
		wait_ack_clear(d, FORCEWAKE_KERNEL_FALLBACK);
180

181
		fw_set(d, FORCEWAKE_KERNEL_FALLBACK);
182 183
		/* Give gt some time to relax before the polling frenzy */
		udelay(10 * pass);
184
		wait_ack_set(d, FORCEWAKE_KERNEL_FALLBACK);
185

186
		ack_detected = (fw_ack(d) & ack_bit) == value;
187

188
		fw_clear(d, FORCEWAKE_KERNEL_FALLBACK);
189 190 191 192 193
	} while (!ack_detected && pass++ < 10);

	DRM_DEBUG_DRIVER("%s had to use fallback to %s ack, 0x%x (passes %u)\n",
			 intel_uncore_forcewake_domain_to_str(d->id),
			 type == ACK_SET ? "set" : "clear",
194
			 fw_ack(d),
195 196 197 198 199 200
			 pass);

	return ack_detected ? 0 : -ETIMEDOUT;
}

static inline void
201
fw_domain_wait_ack_clear_fallback(const struct intel_uncore_forcewake_domain *d)
202
{
203
	if (likely(!wait_ack_clear(d, FORCEWAKE_KERNEL)))
204 205
		return;

206 207
	if (fw_domain_wait_ack_with_fallback(d, ACK_CLEAR))
		fw_domain_wait_ack_clear(d);
208 209
}

210
static inline void
211
fw_domain_get(const struct intel_uncore_forcewake_domain *d)
212
{
213
	fw_set(d, FORCEWAKE_KERNEL);
214
}
215

216
static inline void
217
fw_domain_wait_ack_set(const struct intel_uncore_forcewake_domain *d)
218
{
219
	if (wait_ack_set(d, FORCEWAKE_KERNEL)) {
220 221
		DRM_ERROR("%s: timed out waiting for forcewake ack request.\n",
			  intel_uncore_forcewake_domain_to_str(d->id));
222 223
		add_taint_for_CI(TAINT_WARN); /* CI now unreliable */
	}
224
}
225

226
static inline void
227
fw_domain_wait_ack_set_fallback(const struct intel_uncore_forcewake_domain *d)
228
{
229
	if (likely(!wait_ack_set(d, FORCEWAKE_KERNEL)))
230 231
		return;

232 233
	if (fw_domain_wait_ack_with_fallback(d, ACK_SET))
		fw_domain_wait_ack_set(d);
234 235
}

236
static inline void
237
fw_domain_put(const struct intel_uncore_forcewake_domain *d)
238
{
239
	fw_clear(d, FORCEWAKE_KERNEL);
240 241
}

242
static void
243
fw_domains_get(struct intel_uncore *uncore, enum forcewake_domains fw_domains)
244
{
245
	struct intel_uncore_forcewake_domain *d;
C
Chris Wilson 已提交
246
	unsigned int tmp;
247

248
	GEM_BUG_ON(fw_domains & ~uncore->fw_domains);
C
Chris Wilson 已提交
249

250
	for_each_fw_domain_masked(d, fw_domains, uncore, tmp) {
251
		fw_domain_wait_ack_clear(d);
252
		fw_domain_get(d);
253
	}
254

255
	for_each_fw_domain_masked(d, fw_domains, uncore, tmp)
256
		fw_domain_wait_ack_set(d);
257

258
	uncore->fw_domains_active |= fw_domains;
259 260 261
}

static void
262
fw_domains_get_with_fallback(struct intel_uncore *uncore,
263 264 265 266 267
			     enum forcewake_domains fw_domains)
{
	struct intel_uncore_forcewake_domain *d;
	unsigned int tmp;

268
	GEM_BUG_ON(fw_domains & ~uncore->fw_domains);
269

270
	for_each_fw_domain_masked(d, fw_domains, uncore, tmp) {
271
		fw_domain_wait_ack_clear_fallback(d);
272
		fw_domain_get(d);
273 274
	}

275
	for_each_fw_domain_masked(d, fw_domains, uncore, tmp)
276
		fw_domain_wait_ack_set_fallback(d);
277

278
	uncore->fw_domains_active |= fw_domains;
279
}
280

281
static void
282
fw_domains_put(struct intel_uncore *uncore, enum forcewake_domains fw_domains)
283 284
{
	struct intel_uncore_forcewake_domain *d;
C
Chris Wilson 已提交
285 286
	unsigned int tmp;

287
	GEM_BUG_ON(fw_domains & ~uncore->fw_domains);
288

289
	for_each_fw_domain_masked(d, fw_domains, uncore, tmp)
290
		fw_domain_put(d);
291

292
	uncore->fw_domains_active &= ~fw_domains;
293
}
294

295
static void
296
fw_domains_reset(struct intel_uncore *uncore,
297
		 enum forcewake_domains fw_domains)
298 299
{
	struct intel_uncore_forcewake_domain *d;
C
Chris Wilson 已提交
300
	unsigned int tmp;
301

C
Chris Wilson 已提交
302
	if (!fw_domains)
303
		return;
304

305
	GEM_BUG_ON(fw_domains & ~uncore->fw_domains);
C
Chris Wilson 已提交
306

307
	for_each_fw_domain_masked(d, fw_domains, uncore, tmp)
308
		fw_domain_reset(d);
309 310
}

311
static inline u32 gt_thread_status(struct intel_uncore *uncore)
312 313 314
{
	u32 val;

315
	val = __raw_uncore_read32(uncore, GEN6_GT_THREAD_STATUS_REG);
316 317 318 319 320
	val &= GEN6_GT_THREAD_STATUS_CORE_MASK;

	return val;
}

321
static void __gen6_gt_wait_for_thread_c0(struct intel_uncore *uncore)
322
{
323 324
	/*
	 * w/a for a sporadic read returning 0 by waiting for the GT
325 326
	 * thread to wake up.
	 */
327
	WARN_ONCE(wait_for_atomic_us(gt_thread_status(uncore) == 0, 5000),
328
		  "GT thread status wait timed out\n");
329 330
}

331
static void fw_domains_get_with_thread_status(struct intel_uncore *uncore,
332
					      enum forcewake_domains fw_domains)
333
{
334
	fw_domains_get(uncore, fw_domains);
335

336
	/* WaRsForcewakeWaitTC0:snb,ivb,hsw,bdw,vlv */
337
	__gen6_gt_wait_for_thread_c0(uncore);
338 339
}

340
static inline u32 fifo_free_entries(struct intel_uncore *uncore)
341
{
342
	u32 count = __raw_uncore_read32(uncore, GTFIFOCTL);
343 344 345 346

	return count & GT_FIFO_FREE_ENTRIES_MASK;
}

347
static void __gen6_gt_wait_for_fifo(struct intel_uncore *uncore)
348
{
349
	u32 n;
350

351 352
	/* On VLV, FIFO will be shared by both SW and HW.
	 * So, we need to read the FREE_ENTRIES everytime */
353
	if (IS_VALLEYVIEW(uncore->i915))
354
		n = fifo_free_entries(uncore);
355
	else
356
		n = uncore->fifo_count;
357 358

	if (n <= GT_FIFO_NUM_RESERVED_ENTRIES) {
359
		if (wait_for_atomic((n = fifo_free_entries(uncore)) >
360 361 362 363
				    GT_FIFO_NUM_RESERVED_ENTRIES,
				    GT_FIFO_TIMEOUT_MS)) {
			DRM_DEBUG("GT_FIFO timeout, entries: %u\n", n);
			return;
364 365 366
		}
	}

367
	uncore->fifo_count = n - 1;
368 369
}

370 371
static enum hrtimer_restart
intel_uncore_fw_release_timer(struct hrtimer *timer)
Z
Zhe Wang 已提交
372
{
373 374
	struct intel_uncore_forcewake_domain *domain =
	       container_of(timer, struct intel_uncore_forcewake_domain, timer);
375
	struct intel_uncore *uncore = domain->uncore;
376
	unsigned long irqflags;
Z
Zhe Wang 已提交
377

378
	assert_rpm_device_not_suspended(uncore->rpm);
Z
Zhe Wang 已提交
379

380 381 382
	if (xchg(&domain->active, false))
		return HRTIMER_RESTART;

383
	spin_lock_irqsave(&uncore->lock, irqflags);
384

385 386 387
	uncore->fw_domains_timer &= ~domain->mask;

	GEM_BUG_ON(!domain->wake_count);
388
	if (--domain->wake_count == 0)
389
		uncore->funcs.force_wake_put(uncore, domain->mask);
390

391
	spin_unlock_irqrestore(&uncore->lock, irqflags);
392 393

	return HRTIMER_NORESTART;
Z
Zhe Wang 已提交
394 395
}

396
/* Note callers must have acquired the PUNIT->PMIC bus, before calling this. */
397
static unsigned int
398
intel_uncore_forcewake_reset(struct intel_uncore *uncore)
Z
Zhe Wang 已提交
399
{
400
	unsigned long irqflags;
401
	struct intel_uncore_forcewake_domain *domain;
402
	int retry_count = 100;
403
	enum forcewake_domains fw, active_domains;
Z
Zhe Wang 已提交
404

405 406
	iosf_mbi_assert_punit_acquired();

407 408 409 410 411
	/* Hold uncore.lock across reset to prevent any register access
	 * with forcewake not set correctly. Wait until all pending
	 * timers are run before holding.
	 */
	while (1) {
C
Chris Wilson 已提交
412 413
		unsigned int tmp;

414
		active_domains = 0;
Z
Zhe Wang 已提交
415

416
		for_each_fw_domain(domain, uncore, tmp) {
417
			smp_store_mb(domain->active, false);
418
			if (hrtimer_cancel(&domain->timer) == 0)
419
				continue;
Z
Zhe Wang 已提交
420

421
			intel_uncore_fw_release_timer(&domain->timer);
422
		}
423

424
		spin_lock_irqsave(&uncore->lock, irqflags);
425

426
		for_each_fw_domain(domain, uncore, tmp) {
427
			if (hrtimer_active(&domain->timer))
428
				active_domains |= domain->mask;
429
		}
430

431 432
		if (active_domains == 0)
			break;
433

434 435 436 437
		if (--retry_count == 0) {
			DRM_ERROR("Timed out waiting for forcewake timers to finish\n");
			break;
		}
438

439
		spin_unlock_irqrestore(&uncore->lock, irqflags);
440 441
		cond_resched();
	}
442

443 444
	WARN_ON(active_domains);

445
	fw = uncore->fw_domains_active;
446
	if (fw)
447
		uncore->funcs.force_wake_put(uncore, fw);
448

449 450
	fw_domains_reset(uncore, uncore->fw_domains);
	assert_forcewakes_inactive(uncore);
451

452
	spin_unlock_irqrestore(&uncore->lock, irqflags);
453 454

	return fw; /* track the lost user forcewake domains */
455 456
}

457
static bool
458
fpga_check_for_unclaimed_mmio(struct intel_uncore *uncore)
459 460 461
{
	u32 dbg;

462
	dbg = __raw_uncore_read32(uncore, FPGA_DBG);
463 464 465
	if (likely(!(dbg & FPGA_DBG_RM_NOCLAIM)))
		return false;

466
	__raw_uncore_write32(uncore, FPGA_DBG, FPGA_DBG_RM_NOCLAIM);
467 468 469 470

	return true;
}

471
static bool
472
vlv_check_for_unclaimed_mmio(struct intel_uncore *uncore)
473 474 475
{
	u32 cer;

476
	cer = __raw_uncore_read32(uncore, CLAIM_ER);
477 478 479
	if (likely(!(cer & (CLAIM_ER_OVERFLOW | CLAIM_ER_CTR_MASK))))
		return false;

480
	__raw_uncore_write32(uncore, CLAIM_ER, CLAIM_ER_CLR);
481 482 483 484

	return true;
}

485
static bool
486
gen6_check_for_fifo_debug(struct intel_uncore *uncore)
487 488 489
{
	u32 fifodbg;

490
	fifodbg = __raw_uncore_read32(uncore, GTFIFODBG);
491 492 493

	if (unlikely(fifodbg)) {
		DRM_DEBUG_DRIVER("GTFIFODBG = 0x08%x\n", fifodbg);
494
		__raw_uncore_write32(uncore, GTFIFODBG, fifodbg);
495 496 497 498 499
	}

	return fifodbg;
}

500
static bool
501
check_for_unclaimed_mmio(struct intel_uncore *uncore)
502
{
503 504
	bool ret = false;

505 506 507 508 509
	lockdep_assert_held(&uncore->debug->lock);

	if (uncore->debug->suspend_count)
		return false;

510
	if (intel_uncore_has_fpga_dbg_unclaimed(uncore))
511
		ret |= fpga_check_for_unclaimed_mmio(uncore);
512

513
	if (intel_uncore_has_dbg_unclaimed(uncore))
514
		ret |= vlv_check_for_unclaimed_mmio(uncore);
515

516
	if (intel_uncore_has_fifo(uncore))
517
		ret |= gen6_check_for_fifo_debug(uncore);
518

519
	return ret;
520 521
}

522 523
static void forcewake_early_sanitize(struct intel_uncore *uncore,
				     unsigned int restore_forcewake)
524
{
525
	GEM_BUG_ON(!intel_uncore_has_forcewake(uncore));
526

527
	/* WaDisableShadowRegForCpd:chv */
528
	if (IS_CHERRYVIEW(uncore->i915)) {
529 530 531 532
		__raw_uncore_write32(uncore, GTFIFOCTL,
				     __raw_uncore_read32(uncore, GTFIFOCTL) |
				     GT_FIFO_CTL_BLOCK_ALL_POLICY_STALL |
				     GT_FIFO_CTL_RC6_POLICY_STALL);
533 534
	}

535
	iosf_mbi_punit_acquire();
536
	intel_uncore_forcewake_reset(uncore);
537
	if (restore_forcewake) {
538 539 540
		spin_lock_irq(&uncore->lock);
		uncore->funcs.force_wake_get(uncore, restore_forcewake);

541
		if (intel_uncore_has_fifo(uncore))
542
			uncore->fifo_count = fifo_free_entries(uncore);
543
		spin_unlock_irq(&uncore->lock);
544
	}
545
	iosf_mbi_punit_release();
546 547
}

548
void intel_uncore_suspend(struct intel_uncore *uncore)
549
{
550 551 552
	if (!intel_uncore_has_forcewake(uncore))
		return;

553 554
	iosf_mbi_punit_acquire();
	iosf_mbi_unregister_pmic_bus_access_notifier_unlocked(
555 556
		&uncore->pmic_bus_access_nb);
	uncore->fw_domains_saved = intel_uncore_forcewake_reset(uncore);
557
	iosf_mbi_punit_release();
558 559
}

560
void intel_uncore_resume_early(struct intel_uncore *uncore)
561
{
562 563
	unsigned int restore_forcewake;

564 565 566 567 568 569
	if (intel_uncore_unclaimed_mmio(uncore))
		DRM_DEBUG("unclaimed mmio detected on resume, clearing\n");

	if (!intel_uncore_has_forcewake(uncore))
		return;

570
	restore_forcewake = fetch_and_zero(&uncore->fw_domains_saved);
571
	forcewake_early_sanitize(uncore, restore_forcewake);
572

573
	iosf_mbi_register_pmic_bus_access_notifier(&uncore->pmic_bus_access_nb);
574 575
}

576
void intel_uncore_runtime_resume(struct intel_uncore *uncore)
577
{
578 579 580
	if (!intel_uncore_has_forcewake(uncore))
		return;

581
	iosf_mbi_register_pmic_bus_access_notifier(&uncore->pmic_bus_access_nb);
582 583
}

584
static void __intel_uncore_forcewake_get(struct intel_uncore *uncore,
585 586 587
					 enum forcewake_domains fw_domains)
{
	struct intel_uncore_forcewake_domain *domain;
C
Chris Wilson 已提交
588
	unsigned int tmp;
589

590
	fw_domains &= uncore->fw_domains;
591

592
	for_each_fw_domain_masked(domain, fw_domains, uncore, tmp) {
593
		if (domain->wake_count++) {
594
			fw_domains &= ~domain->mask;
595 596 597
			domain->active = true;
		}
	}
598

599
	if (fw_domains)
600
		uncore->funcs.force_wake_get(uncore, fw_domains);
601 602
}

603 604
/**
 * intel_uncore_forcewake_get - grab forcewake domain references
605
 * @uncore: the intel_uncore structure
606 607 608 609 610 611 612 613 614
 * @fw_domains: forcewake domains to get reference on
 *
 * This function can be used get GT's forcewake domain references.
 * Normal register access will handle the forcewake domains automatically.
 * However if some sequence requires the GT to not power down a particular
 * forcewake domains this function should be called at the beginning of the
 * sequence. And subsequently the reference should be dropped by symmetric
 * call to intel_unforce_forcewake_put(). Usually caller wants all the domains
 * to be kept awake so the @fw_domains would be then FORCEWAKE_ALL.
615
 */
616
void intel_uncore_forcewake_get(struct intel_uncore *uncore,
617
				enum forcewake_domains fw_domains)
618 619 620
{
	unsigned long irqflags;

621
	if (!uncore->funcs.force_wake_get)
622 623
		return;

624
	assert_rpm_wakelock_held(uncore->rpm);
625

626 627 628
	spin_lock_irqsave(&uncore->lock, irqflags);
	__intel_uncore_forcewake_get(uncore, fw_domains);
	spin_unlock_irqrestore(&uncore->lock, irqflags);
629 630
}

631 632
/**
 * intel_uncore_forcewake_user_get - claim forcewake on behalf of userspace
633
 * @uncore: the intel_uncore structure
634 635 636 637 638
 *
 * This function is a wrapper around intel_uncore_forcewake_get() to acquire
 * the GT powerwell and in the process disable our debugging for the
 * duration of userspace's bypass.
 */
639
void intel_uncore_forcewake_user_get(struct intel_uncore *uncore)
640
{
641
	spin_lock_irq(&uncore->lock);
642
	if (!uncore->user_forcewake_count++) {
643
		intel_uncore_forcewake_get__locked(uncore, FORCEWAKE_ALL);
644 645 646
		spin_lock(&uncore->debug->lock);
		mmio_debug_suspend(uncore->debug);
		spin_unlock(&uncore->debug->lock);
647
	}
648
	spin_unlock_irq(&uncore->lock);
649 650 651 652
}

/**
 * intel_uncore_forcewake_user_put - release forcewake on behalf of userspace
653
 * @uncore: the intel_uncore structure
654 655 656 657
 *
 * This function complements intel_uncore_forcewake_user_get() and releases
 * the GT powerwell taken on behalf of the userspace bypass.
 */
658
void intel_uncore_forcewake_user_put(struct intel_uncore *uncore)
659
{
660
	spin_lock_irq(&uncore->lock);
661 662 663 664 665
	if (!--uncore->user_forcewake_count) {
		spin_lock(&uncore->debug->lock);
		mmio_debug_resume(uncore->debug);

		if (check_for_unclaimed_mmio(uncore))
666
			dev_info(uncore->i915->drm.dev,
667
				 "Invalid mmio detected during user access\n");
668
		spin_unlock(&uncore->debug->lock);
669

670
		intel_uncore_forcewake_put__locked(uncore, FORCEWAKE_ALL);
671
	}
672
	spin_unlock_irq(&uncore->lock);
673 674
}

675
/**
676
 * intel_uncore_forcewake_get__locked - grab forcewake domain references
677
 * @uncore: the intel_uncore structure
678
 * @fw_domains: forcewake domains to get reference on
679
 *
680 681
 * See intel_uncore_forcewake_get(). This variant places the onus
 * on the caller to explicitly handle the dev_priv->uncore.lock spinlock.
682
 */
683
void intel_uncore_forcewake_get__locked(struct intel_uncore *uncore,
684 685
					enum forcewake_domains fw_domains)
{
686 687 688
	lockdep_assert_held(&uncore->lock);

	if (!uncore->funcs.force_wake_get)
689 690
		return;

691
	__intel_uncore_forcewake_get(uncore, fw_domains);
692 693
}

694
static void __intel_uncore_forcewake_put(struct intel_uncore *uncore,
695
					 enum forcewake_domains fw_domains)
696
{
697
	struct intel_uncore_forcewake_domain *domain;
C
Chris Wilson 已提交
698
	unsigned int tmp;
699

700
	fw_domains &= uncore->fw_domains;
701

702
	for_each_fw_domain_masked(domain, fw_domains, uncore, tmp) {
703
		GEM_BUG_ON(!domain->wake_count);
704

705 706
		if (--domain->wake_count) {
			domain->active = true;
707
			continue;
708
		}
709

710
		fw_domain_arm_timer(domain);
711
	}
712
}
713

714 715
/**
 * intel_uncore_forcewake_put - release a forcewake domain reference
716
 * @uncore: the intel_uncore structure
717 718 719 720 721
 * @fw_domains: forcewake domains to put references
 *
 * This function drops the device-level forcewakes for specified
 * domains obtained by intel_uncore_forcewake_get().
 */
722
void intel_uncore_forcewake_put(struct intel_uncore *uncore,
723 724 725 726
				enum forcewake_domains fw_domains)
{
	unsigned long irqflags;

727
	if (!uncore->funcs.force_wake_put)
728 729
		return;

730 731 732
	spin_lock_irqsave(&uncore->lock, irqflags);
	__intel_uncore_forcewake_put(uncore, fw_domains);
	spin_unlock_irqrestore(&uncore->lock, irqflags);
733 734
}

735 736
/**
 * intel_uncore_forcewake_put__locked - grab forcewake domain references
737
 * @uncore: the intel_uncore structure
738 739 740 741 742
 * @fw_domains: forcewake domains to get reference on
 *
 * See intel_uncore_forcewake_put(). This variant places the onus
 * on the caller to explicitly handle the dev_priv->uncore.lock spinlock.
 */
743
void intel_uncore_forcewake_put__locked(struct intel_uncore *uncore,
744 745
					enum forcewake_domains fw_domains)
{
746 747 748
	lockdep_assert_held(&uncore->lock);

	if (!uncore->funcs.force_wake_put)
749 750
		return;

751
	__intel_uncore_forcewake_put(uncore, fw_domains);
752 753
}

754
void assert_forcewakes_inactive(struct intel_uncore *uncore)
755
{
756
	if (!uncore->funcs.force_wake_get)
757 758
		return;

759
	WARN(uncore->fw_domains_active,
760
	     "Expected all fw_domains to be inactive, but %08x are still on\n",
761
	     uncore->fw_domains_active);
762 763
}

764
void assert_forcewakes_active(struct intel_uncore *uncore,
765 766
			      enum forcewake_domains fw_domains)
{
767 768 769 770 771 772
	struct intel_uncore_forcewake_domain *domain;
	unsigned int tmp;

	if (!IS_ENABLED(CONFIG_DRM_I915_DEBUG_RUNTIME_PM))
		return;

773
	if (!uncore->funcs.force_wake_get)
774 775
		return;

776 777
	spin_lock_irq(&uncore->lock);

778
	assert_rpm_wakelock_held(uncore->rpm);
779

780 781
	fw_domains &= uncore->fw_domains;
	WARN(fw_domains & ~uncore->fw_domains_active,
782
	     "Expected %08x fw_domains to be active, but %08x are off\n",
783
	     fw_domains, fw_domains & ~uncore->fw_domains_active);
784 785 786 787 788 789

	/*
	 * Check that the caller has an explicit wakeref and we don't mistake
	 * it for the auto wakeref.
	 */
	for_each_fw_domain_masked(domain, fw_domains, uncore, tmp) {
790
		unsigned int actual = READ_ONCE(domain->wake_count);
791 792
		unsigned int expect = 1;

793
		if (uncore->fw_domains_timer & domain->mask)
794 795
			expect++; /* pending automatic release */

796
		if (WARN(actual < expect,
797
			 "Expected domain %d to be held awake by caller, count=%d\n",
798
			 domain->id, actual))
799 800
			break;
	}
801 802

	spin_unlock_irq(&uncore->lock);
803 804
}

805
/* We give fast paths for the really cool registers */
806
#define NEEDS_FORCE_WAKE(reg) ((reg) < 0x40000)
807

808
#define __gen6_reg_read_fw_domains(uncore, offset) \
809 810 811 812 813 814 815 816 817
({ \
	enum forcewake_domains __fwd; \
	if (NEEDS_FORCE_WAKE(offset)) \
		__fwd = FORCEWAKE_RENDER; \
	else \
		__fwd = 0; \
	__fwd; \
})

T
Tvrtko Ursulin 已提交
818
static int fw_range_cmp(u32 offset, const struct intel_forcewake_range *entry)
819 820 821 822 823 824 825 826 827
{
	if (offset < entry->start)
		return -1;
	else if (offset > entry->end)
		return 1;
	else
		return 0;
}

T
Tvrtko Ursulin 已提交
828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846
/* Copied and "macroized" from lib/bsearch.c */
#define BSEARCH(key, base, num, cmp) ({                                 \
	unsigned int start__ = 0, end__ = (num);                        \
	typeof(base) result__ = NULL;                                   \
	while (start__ < end__) {                                       \
		unsigned int mid__ = start__ + (end__ - start__) / 2;   \
		int ret__ = (cmp)((key), (base) + mid__);               \
		if (ret__ < 0) {                                        \
			end__ = mid__;                                  \
		} else if (ret__ > 0) {                                 \
			start__ = mid__ + 1;                            \
		} else {                                                \
			result__ = (base) + mid__;                      \
			break;                                          \
		}                                                       \
	}                                                               \
	result__;                                                       \
})

847
static enum forcewake_domains
848
find_fw_domain(struct intel_uncore *uncore, u32 offset)
849
{
T
Tvrtko Ursulin 已提交
850
	const struct intel_forcewake_range *entry;
851

T
Tvrtko Ursulin 已提交
852
	entry = BSEARCH(offset,
853 854
			uncore->fw_domains_table,
			uncore->fw_domains_table_entries,
855
			fw_range_cmp);
856

857 858 859
	if (!entry)
		return 0;

860 861 862 863 864 865
	/*
	 * The list of FW domains depends on the SKU in gen11+ so we
	 * can't determine it statically. We use FORCEWAKE_ALL and
	 * translate it here to the list of available domains.
	 */
	if (entry->domains == FORCEWAKE_ALL)
866
		return uncore->fw_domains;
867

868
	WARN(entry->domains & ~uncore->fw_domains,
869
	     "Uninitialized forcewake domain(s) 0x%x accessed at 0x%x\n",
870
	     entry->domains & ~uncore->fw_domains, offset);
871 872

	return entry->domains;
873 874 875 876
}

#define GEN_FW_RANGE(s, e, d) \
	{ .start = (s), .end = (e), .domains = (d) }
877

T
Tvrtko Ursulin 已提交
878
#define HAS_FWTABLE(dev_priv) \
879
	(INTEL_GEN(dev_priv) >= 9 || \
T
Tvrtko Ursulin 已提交
880 881 882
	 IS_CHERRYVIEW(dev_priv) || \
	 IS_VALLEYVIEW(dev_priv))

883
/* *Must* be sorted by offset ranges! See intel_fw_table_check(). */
884 885 886 887 888 889
static const struct intel_forcewake_range __vlv_fw_ranges[] = {
	GEN_FW_RANGE(0x2000, 0x3fff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x5000, 0x7fff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0xb000, 0x11fff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x12000, 0x13fff, FORCEWAKE_MEDIA),
	GEN_FW_RANGE(0x22000, 0x23fff, FORCEWAKE_MEDIA),
890
	GEN_FW_RANGE(0x2e000, 0x2ffff, FORCEWAKE_RENDER),
891 892
	GEN_FW_RANGE(0x30000, 0x3ffff, FORCEWAKE_MEDIA),
};
893

894
#define __fwtable_reg_read_fw_domains(uncore, offset) \
895 896
({ \
	enum forcewake_domains __fwd = 0; \
897
	if (NEEDS_FORCE_WAKE((offset))) \
898
		__fwd = find_fw_domain(uncore, offset); \
899 900 901
	__fwd; \
})

902
#define __gen11_fwtable_reg_read_fw_domains(uncore, offset) \
903
	find_fw_domain(uncore, offset)
904

905
/* *Must* be sorted by offset! See intel_shadow_table_check(). */
906
static const i915_reg_t gen8_shadowed_regs[] = {
907 908 909 910 911 912
	RING_TAIL(RENDER_RING_BASE),	/* 0x2000 (base) */
	GEN6_RPNSWREQ,			/* 0xA008 */
	GEN6_RC_VIDEO_FREQ,		/* 0xA00C */
	RING_TAIL(GEN6_BSD_RING_BASE),	/* 0x12000 (base) */
	RING_TAIL(VEBOX_RING_BASE),	/* 0x1a000 (base) */
	RING_TAIL(BLT_RING_BASE),	/* 0x22000 (base) */
913 914 915
	/* TODO: Other registers are not yet used */
};

916 917 918 919 920 921 922 923 924 925 926 927 928 929
static const i915_reg_t gen11_shadowed_regs[] = {
	RING_TAIL(RENDER_RING_BASE),		/* 0x2000 (base) */
	GEN6_RPNSWREQ,				/* 0xA008 */
	GEN6_RC_VIDEO_FREQ,			/* 0xA00C */
	RING_TAIL(BLT_RING_BASE),		/* 0x22000 (base) */
	RING_TAIL(GEN11_BSD_RING_BASE),		/* 0x1C0000 (base) */
	RING_TAIL(GEN11_BSD2_RING_BASE),	/* 0x1C4000 (base) */
	RING_TAIL(GEN11_VEBOX_RING_BASE),	/* 0x1C8000 (base) */
	RING_TAIL(GEN11_BSD3_RING_BASE),	/* 0x1D0000 (base) */
	RING_TAIL(GEN11_BSD4_RING_BASE),	/* 0x1D4000 (base) */
	RING_TAIL(GEN11_VEBOX2_RING_BASE),	/* 0x1D8000 (base) */
	/* TODO: Other registers are not yet used */
};

T
Tvrtko Ursulin 已提交
930
static int mmio_reg_cmp(u32 key, const i915_reg_t *reg)
931
{
T
Tvrtko Ursulin 已提交
932
	u32 offset = i915_mmio_reg_offset(*reg);
933

T
Tvrtko Ursulin 已提交
934
	if (key < offset)
935
		return -1;
T
Tvrtko Ursulin 已提交
936
	else if (key > offset)
937 938 939 940 941
		return 1;
	else
		return 0;
}

942 943 944 945 946 947
#define __is_genX_shadowed(x) \
static bool is_gen##x##_shadowed(u32 offset) \
{ \
	const i915_reg_t *regs = gen##x##_shadowed_regs; \
	return BSEARCH(offset, regs, ARRAY_SIZE(gen##x##_shadowed_regs), \
		       mmio_reg_cmp); \
948 949
}

950 951 952
__is_genX_shadowed(8)
__is_genX_shadowed(11)

953 954 955 956 957 958
static enum forcewake_domains
gen6_reg_write_fw_domains(struct intel_uncore *uncore, i915_reg_t reg)
{
	return FORCEWAKE_RENDER;
}

959
#define __gen8_reg_write_fw_domains(uncore, offset) \
960 961 962 963 964 965 966 967 968
({ \
	enum forcewake_domains __fwd; \
	if (NEEDS_FORCE_WAKE(offset) && !is_gen8_shadowed(offset)) \
		__fwd = FORCEWAKE_RENDER; \
	else \
		__fwd = 0; \
	__fwd; \
})

969
/* *Must* be sorted by offset ranges! See intel_fw_table_check(). */
970 971
static const struct intel_forcewake_range __chv_fw_ranges[] = {
	GEN_FW_RANGE(0x2000, 0x3fff, FORCEWAKE_RENDER),
972
	GEN_FW_RANGE(0x4000, 0x4fff, FORCEWAKE_RENDER | FORCEWAKE_MEDIA),
973
	GEN_FW_RANGE(0x5200, 0x7fff, FORCEWAKE_RENDER),
974
	GEN_FW_RANGE(0x8000, 0x82ff, FORCEWAKE_RENDER | FORCEWAKE_MEDIA),
975
	GEN_FW_RANGE(0x8300, 0x84ff, FORCEWAKE_RENDER),
976
	GEN_FW_RANGE(0x8500, 0x85ff, FORCEWAKE_RENDER | FORCEWAKE_MEDIA),
977
	GEN_FW_RANGE(0x8800, 0x88ff, FORCEWAKE_MEDIA),
978 979
	GEN_FW_RANGE(0x9000, 0xafff, FORCEWAKE_RENDER | FORCEWAKE_MEDIA),
	GEN_FW_RANGE(0xb000, 0xb47f, FORCEWAKE_RENDER),
980
	GEN_FW_RANGE(0xd000, 0xd7ff, FORCEWAKE_MEDIA),
981 982
	GEN_FW_RANGE(0xe000, 0xe7ff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0xf000, 0xffff, FORCEWAKE_RENDER | FORCEWAKE_MEDIA),
983 984 985 986 987
	GEN_FW_RANGE(0x12000, 0x13fff, FORCEWAKE_MEDIA),
	GEN_FW_RANGE(0x1a000, 0x1bfff, FORCEWAKE_MEDIA),
	GEN_FW_RANGE(0x1e800, 0x1e9ff, FORCEWAKE_MEDIA),
	GEN_FW_RANGE(0x30000, 0x37fff, FORCEWAKE_MEDIA),
};
988

989
#define __fwtable_reg_write_fw_domains(uncore, offset) \
990 991
({ \
	enum forcewake_domains __fwd = 0; \
992
	if (NEEDS_FORCE_WAKE((offset)) && !is_gen8_shadowed(offset)) \
993
		__fwd = find_fw_domain(uncore, offset); \
994 995 996
	__fwd; \
})

997
#define __gen11_fwtable_reg_write_fw_domains(uncore, offset) \
998 999
({ \
	enum forcewake_domains __fwd = 0; \
1000 1001 1002
	const u32 __offset = (offset); \
	if (!is_gen11_shadowed(__offset)) \
		__fwd = find_fw_domain(uncore, __offset); \
1003 1004 1005
	__fwd; \
})

1006
/* *Must* be sorted by offset ranges! See intel_fw_table_check(). */
1007
static const struct intel_forcewake_range __gen9_fw_ranges[] = {
1008
	GEN_FW_RANGE(0x0, 0xaff, FORCEWAKE_BLITTER),
1009 1010
	GEN_FW_RANGE(0xb00, 0x1fff, 0), /* uncore range */
	GEN_FW_RANGE(0x2000, 0x26ff, FORCEWAKE_RENDER),
1011
	GEN_FW_RANGE(0x2700, 0x2fff, FORCEWAKE_BLITTER),
1012
	GEN_FW_RANGE(0x3000, 0x3fff, FORCEWAKE_RENDER),
1013
	GEN_FW_RANGE(0x4000, 0x51ff, FORCEWAKE_BLITTER),
1014
	GEN_FW_RANGE(0x5200, 0x7fff, FORCEWAKE_RENDER),
1015
	GEN_FW_RANGE(0x8000, 0x812f, FORCEWAKE_BLITTER),
1016
	GEN_FW_RANGE(0x8130, 0x813f, FORCEWAKE_MEDIA),
1017
	GEN_FW_RANGE(0x8140, 0x815f, FORCEWAKE_RENDER),
1018
	GEN_FW_RANGE(0x8160, 0x82ff, FORCEWAKE_BLITTER),
1019
	GEN_FW_RANGE(0x8300, 0x84ff, FORCEWAKE_RENDER),
1020
	GEN_FW_RANGE(0x8500, 0x87ff, FORCEWAKE_BLITTER),
1021
	GEN_FW_RANGE(0x8800, 0x89ff, FORCEWAKE_MEDIA),
1022
	GEN_FW_RANGE(0x8a00, 0x8bff, FORCEWAKE_BLITTER),
1023
	GEN_FW_RANGE(0x8c00, 0x8cff, FORCEWAKE_RENDER),
1024
	GEN_FW_RANGE(0x8d00, 0x93ff, FORCEWAKE_BLITTER),
1025
	GEN_FW_RANGE(0x9400, 0x97ff, FORCEWAKE_RENDER | FORCEWAKE_MEDIA),
1026
	GEN_FW_RANGE(0x9800, 0xafff, FORCEWAKE_BLITTER),
1027
	GEN_FW_RANGE(0xb000, 0xb47f, FORCEWAKE_RENDER),
1028
	GEN_FW_RANGE(0xb480, 0xcfff, FORCEWAKE_BLITTER),
1029
	GEN_FW_RANGE(0xd000, 0xd7ff, FORCEWAKE_MEDIA),
1030
	GEN_FW_RANGE(0xd800, 0xdfff, FORCEWAKE_BLITTER),
1031
	GEN_FW_RANGE(0xe000, 0xe8ff, FORCEWAKE_RENDER),
1032
	GEN_FW_RANGE(0xe900, 0x11fff, FORCEWAKE_BLITTER),
1033
	GEN_FW_RANGE(0x12000, 0x13fff, FORCEWAKE_MEDIA),
1034
	GEN_FW_RANGE(0x14000, 0x19fff, FORCEWAKE_BLITTER),
1035
	GEN_FW_RANGE(0x1a000, 0x1e9ff, FORCEWAKE_MEDIA),
1036
	GEN_FW_RANGE(0x1ea00, 0x243ff, FORCEWAKE_BLITTER),
1037
	GEN_FW_RANGE(0x24400, 0x247ff, FORCEWAKE_RENDER),
1038
	GEN_FW_RANGE(0x24800, 0x2ffff, FORCEWAKE_BLITTER),
1039 1040
	GEN_FW_RANGE(0x30000, 0x3ffff, FORCEWAKE_MEDIA),
};
1041

1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060
/* *Must* be sorted by offset ranges! See intel_fw_table_check(). */
static const struct intel_forcewake_range __gen11_fw_ranges[] = {
	GEN_FW_RANGE(0x0, 0xaff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0xb00, 0x1fff, 0), /* uncore range */
	GEN_FW_RANGE(0x2000, 0x26ff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x2700, 0x2fff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x3000, 0x3fff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x4000, 0x51ff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x5200, 0x7fff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x8000, 0x813f, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x8140, 0x815f, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x8160, 0x82ff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x8300, 0x84ff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x8500, 0x8bff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x8c00, 0x8cff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x8d00, 0x93ff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x9400, 0x97ff, FORCEWAKE_ALL),
	GEN_FW_RANGE(0x9800, 0xafff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0xb000, 0xb47f, FORCEWAKE_RENDER),
1061 1062 1063 1064 1065
	GEN_FW_RANGE(0xb480, 0xdeff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0xdf00, 0xe8ff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0xe900, 0x16dff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x16e00, 0x19fff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x1a000, 0x243ff, FORCEWAKE_BLITTER),
1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077
	GEN_FW_RANGE(0x24400, 0x247ff, FORCEWAKE_RENDER),
	GEN_FW_RANGE(0x24800, 0x3ffff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x40000, 0x1bffff, 0),
	GEN_FW_RANGE(0x1c0000, 0x1c3fff, FORCEWAKE_MEDIA_VDBOX0),
	GEN_FW_RANGE(0x1c4000, 0x1c7fff, FORCEWAKE_MEDIA_VDBOX1),
	GEN_FW_RANGE(0x1c8000, 0x1cbfff, FORCEWAKE_MEDIA_VEBOX0),
	GEN_FW_RANGE(0x1cc000, 0x1cffff, FORCEWAKE_BLITTER),
	GEN_FW_RANGE(0x1d0000, 0x1d3fff, FORCEWAKE_MEDIA_VDBOX2),
	GEN_FW_RANGE(0x1d4000, 0x1d7fff, FORCEWAKE_MEDIA_VDBOX3),
	GEN_FW_RANGE(0x1d8000, 0x1dbfff, FORCEWAKE_MEDIA_VEBOX1)
};

1078
static void
1079
ilk_dummy_write(struct intel_uncore *uncore)
1080 1081 1082 1083
{
	/* WaIssueDummyWriteToWakeupFromRC6:ilk Issue a dummy write to wake up
	 * the chip from rc6 before touching it for real. MI_MODE is masked,
	 * hence harmless to write 0 into. */
1084
	__raw_uncore_write32(uncore, MI_MODE, 0);
1085 1086 1087
}

static void
1088
__unclaimed_reg_debug(struct intel_uncore *uncore,
1089 1090 1091
		      const i915_reg_t reg,
		      const bool read,
		      const bool before)
1092
{
1093
	if (WARN(check_for_unclaimed_mmio(uncore) && !before,
1094 1095
		 "Unclaimed %s register 0x%x\n",
		 read ? "read from" : "write to",
1096
		 i915_mmio_reg_offset(reg)))
1097 1098
		/* Only report the first N failures */
		i915_modparams.mmio_debug--;
1099 1100
}

1101
static inline void
1102
unclaimed_reg_debug(struct intel_uncore *uncore,
1103 1104 1105 1106
		    const i915_reg_t reg,
		    const bool read,
		    const bool before)
{
1107
	if (likely(!i915_modparams.mmio_debug))
1108 1109
		return;

1110 1111 1112 1113 1114 1115
	/* interrupts are disabled and re-enabled around uncore->lock usage */
	lockdep_assert_held(&uncore->lock);

	if (before)
		spin_lock(&uncore->debug->lock);

1116
	__unclaimed_reg_debug(uncore, reg, read, before);
1117 1118 1119

	if (!before)
		spin_unlock(&uncore->debug->lock);
1120 1121
}

1122
#define GEN2_READ_HEADER(x) \
B
Ben Widawsky 已提交
1123
	u##x val = 0; \
1124
	assert_rpm_wakelock_held(uncore->rpm);
B
Ben Widawsky 已提交
1125

1126
#define GEN2_READ_FOOTER \
B
Ben Widawsky 已提交
1127 1128 1129
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

1130
#define __gen2_read(x) \
1131
static u##x \
1132
gen2_read##x(struct intel_uncore *uncore, i915_reg_t reg, bool trace) { \
1133
	GEN2_READ_HEADER(x); \
1134
	val = __raw_uncore_read##x(uncore, reg); \
1135
	GEN2_READ_FOOTER; \
1136 1137 1138 1139
}

#define __gen5_read(x) \
static u##x \
1140
gen5_read##x(struct intel_uncore *uncore, i915_reg_t reg, bool trace) { \
1141
	GEN2_READ_HEADER(x); \
1142
	ilk_dummy_write(uncore); \
1143
	val = __raw_uncore_read##x(uncore, reg); \
1144
	GEN2_READ_FOOTER; \
1145 1146
}

1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162
__gen5_read(8)
__gen5_read(16)
__gen5_read(32)
__gen5_read(64)
__gen2_read(8)
__gen2_read(16)
__gen2_read(32)
__gen2_read(64)

#undef __gen5_read
#undef __gen2_read

#undef GEN2_READ_FOOTER
#undef GEN2_READ_HEADER

#define GEN6_READ_HEADER(x) \
1163
	u32 offset = i915_mmio_reg_offset(reg); \
1164 1165
	unsigned long irqflags; \
	u##x val = 0; \
1166
	assert_rpm_wakelock_held(uncore->rpm); \
1167
	spin_lock_irqsave(&uncore->lock, irqflags); \
1168
	unclaimed_reg_debug(uncore, reg, true, true)
1169 1170

#define GEN6_READ_FOOTER \
1171
	unclaimed_reg_debug(uncore, reg, true, false); \
1172
	spin_unlock_irqrestore(&uncore->lock, irqflags); \
1173 1174 1175
	trace_i915_reg_rw(false, reg, val, sizeof(val), trace); \
	return val

1176
static noinline void ___force_wake_auto(struct intel_uncore *uncore,
1177
					enum forcewake_domains fw_domains)
1178 1179
{
	struct intel_uncore_forcewake_domain *domain;
C
Chris Wilson 已提交
1180 1181
	unsigned int tmp;

1182
	GEM_BUG_ON(fw_domains & ~uncore->fw_domains);
1183

1184
	for_each_fw_domain_masked(domain, fw_domains, uncore, tmp)
1185 1186
		fw_domain_arm_timer(domain);

1187
	uncore->funcs.force_wake_get(uncore, fw_domains);
1188 1189
}

1190
static inline void __force_wake_auto(struct intel_uncore *uncore,
1191 1192
				     enum forcewake_domains fw_domains)
{
1193
	GEM_BUG_ON(!fw_domains);
1194

1195
	/* Turn on all requested but inactive supported forcewake domains. */
1196 1197
	fw_domains &= uncore->fw_domains;
	fw_domains &= ~uncore->fw_domains_active;
1198

1199
	if (fw_domains)
1200
		___force_wake_auto(uncore, fw_domains);
1201 1202
}

1203
#define __gen_read(func, x) \
1204
static u##x \
1205
func##_read##x(struct intel_uncore *uncore, i915_reg_t reg, bool trace) { \
1206
	enum forcewake_domains fw_engine; \
1207
	GEN6_READ_HEADER(x); \
1208
	fw_engine = __##func##_reg_read_fw_domains(uncore, offset); \
1209
	if (fw_engine) \
1210
		__force_wake_auto(uncore, fw_engine); \
1211
	val = __raw_uncore_read##x(uncore, reg); \
1212
	GEN6_READ_FOOTER; \
1213
}
1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230

#define __gen_reg_read_funcs(func) \
static enum forcewake_domains \
func##_reg_read_fw_domains(struct intel_uncore *uncore, i915_reg_t reg) { \
	return __##func##_reg_read_fw_domains(uncore, i915_mmio_reg_offset(reg)); \
} \
\
__gen_read(func, 8) \
__gen_read(func, 16) \
__gen_read(func, 32) \
__gen_read(func, 64)

__gen_reg_read_funcs(gen11_fwtable);
__gen_reg_read_funcs(fwtable);
__gen_reg_read_funcs(gen6);

#undef __gen_reg_read_funcs
1231 1232
#undef GEN6_READ_FOOTER
#undef GEN6_READ_HEADER
B
Ben Widawsky 已提交
1233

1234
#define GEN2_WRITE_HEADER \
B
Ben Widawsky 已提交
1235
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
1236
	assert_rpm_wakelock_held(uncore->rpm); \
1237

1238
#define GEN2_WRITE_FOOTER
V
Ville Syrjälä 已提交
1239

1240
#define __gen2_write(x) \
1241
static void \
1242
gen2_write##x(struct intel_uncore *uncore, i915_reg_t reg, u##x val, bool trace) { \
1243
	GEN2_WRITE_HEADER; \
1244
	__raw_uncore_write##x(uncore, reg, val); \
1245
	GEN2_WRITE_FOOTER; \
1246 1247 1248 1249
}

#define __gen5_write(x) \
static void \
1250
gen5_write##x(struct intel_uncore *uncore, i915_reg_t reg, u##x val, bool trace) { \
1251
	GEN2_WRITE_HEADER; \
1252
	ilk_dummy_write(uncore); \
1253
	__raw_uncore_write##x(uncore, reg, val); \
1254
	GEN2_WRITE_FOOTER; \
1255 1256
}

1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270
__gen5_write(8)
__gen5_write(16)
__gen5_write(32)
__gen2_write(8)
__gen2_write(16)
__gen2_write(32)

#undef __gen5_write
#undef __gen2_write

#undef GEN2_WRITE_FOOTER
#undef GEN2_WRITE_HEADER

#define GEN6_WRITE_HEADER \
1271
	u32 offset = i915_mmio_reg_offset(reg); \
1272 1273
	unsigned long irqflags; \
	trace_i915_reg_rw(true, reg, val, sizeof(val), trace); \
1274
	assert_rpm_wakelock_held(uncore->rpm); \
1275
	spin_lock_irqsave(&uncore->lock, irqflags); \
1276
	unclaimed_reg_debug(uncore, reg, false, true)
1277 1278

#define GEN6_WRITE_FOOTER \
1279
	unclaimed_reg_debug(uncore, reg, false, false); \
1280
	spin_unlock_irqrestore(&uncore->lock, irqflags)
1281

1282 1283
#define __gen6_write(x) \
static void \
1284
gen6_write##x(struct intel_uncore *uncore, i915_reg_t reg, u##x val, bool trace) { \
1285
	GEN6_WRITE_HEADER; \
1286
	if (NEEDS_FORCE_WAKE(offset)) \
1287
		__gen6_gt_wait_for_fifo(uncore); \
1288
	__raw_uncore_write##x(uncore, reg, val); \
1289
	GEN6_WRITE_FOOTER; \
1290
}
1291 1292 1293
__gen6_write(8)
__gen6_write(16)
__gen6_write(32)
1294

1295
#define __gen_write(func, x) \
1296
static void \
1297
func##_write##x(struct intel_uncore *uncore, i915_reg_t reg, u##x val, bool trace) { \
1298
	enum forcewake_domains fw_engine; \
1299
	GEN6_WRITE_HEADER; \
1300
	fw_engine = __##func##_reg_write_fw_domains(uncore, offset); \
1301
	if (fw_engine) \
1302
		__force_wake_auto(uncore, fw_engine); \
1303
	__raw_uncore_write##x(uncore, reg, val); \
1304
	GEN6_WRITE_FOOTER; \
1305
}
1306

1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321
#define __gen_reg_write_funcs(func) \
static enum forcewake_domains \
func##_reg_write_fw_domains(struct intel_uncore *uncore, i915_reg_t reg) { \
	return __##func##_reg_write_fw_domains(uncore, i915_mmio_reg_offset(reg)); \
} \
\
__gen_write(func, 8) \
__gen_write(func, 16) \
__gen_write(func, 32)

__gen_reg_write_funcs(gen11_fwtable);
__gen_reg_write_funcs(fwtable);
__gen_reg_write_funcs(gen8);

#undef __gen_reg_write_funcs
1322 1323
#undef GEN6_WRITE_FOOTER
#undef GEN6_WRITE_HEADER
1324

1325
#define ASSIGN_RAW_WRITE_MMIO_VFUNCS(uncore, x) \
1326
do { \
1327 1328 1329
	(uncore)->funcs.mmio_writeb = x##_write8; \
	(uncore)->funcs.mmio_writew = x##_write16; \
	(uncore)->funcs.mmio_writel = x##_write32; \
1330 1331
} while (0)

1332
#define ASSIGN_RAW_READ_MMIO_VFUNCS(uncore, x) \
1333
do { \
1334 1335 1336 1337
	(uncore)->funcs.mmio_readb = x##_read8; \
	(uncore)->funcs.mmio_readw = x##_read16; \
	(uncore)->funcs.mmio_readl = x##_read32; \
	(uncore)->funcs.mmio_readq = x##_read64; \
1338 1339
} while (0)

1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350
#define ASSIGN_WRITE_MMIO_VFUNCS(uncore, x) \
do { \
	ASSIGN_RAW_WRITE_MMIO_VFUNCS((uncore), x); \
	(uncore)->funcs.write_fw_domains = x##_reg_write_fw_domains; \
} while (0)

#define ASSIGN_READ_MMIO_VFUNCS(uncore, x) \
do { \
	ASSIGN_RAW_READ_MMIO_VFUNCS(uncore, x); \
	(uncore)->funcs.read_fw_domains = x##_reg_read_fw_domains; \
} while (0)
1351

1352 1353 1354 1355
static int __fw_domain_init(struct intel_uncore *uncore,
			    enum forcewake_domain_id domain_id,
			    i915_reg_t reg_set,
			    i915_reg_t reg_ack)
1356 1357 1358
{
	struct intel_uncore_forcewake_domain *d;

1359 1360
	GEM_BUG_ON(domain_id >= FW_DOMAIN_ID_COUNT);
	GEM_BUG_ON(uncore->fw_domain[domain_id]);
1361

1362
	if (i915_inject_probe_failure(uncore->i915))
1363
		return -ENOMEM;
1364

1365 1366 1367
	d = kzalloc(sizeof(*d), GFP_KERNEL);
	if (!d)
		return -ENOMEM;
1368

1369 1370 1371
	WARN_ON(!i915_mmio_reg_valid(reg_set));
	WARN_ON(!i915_mmio_reg_valid(reg_ack));

1372
	d->uncore = uncore;
1373
	d->wake_count = 0;
1374 1375
	d->reg_set = uncore->regs + i915_mmio_reg_offset(reg_set);
	d->reg_ack = uncore->regs + i915_mmio_reg_offset(reg_ack);
1376 1377 1378

	d->id = domain_id;

1379 1380 1381
	BUILD_BUG_ON(FORCEWAKE_RENDER != (1 << FW_DOMAIN_ID_RENDER));
	BUILD_BUG_ON(FORCEWAKE_BLITTER != (1 << FW_DOMAIN_ID_BLITTER));
	BUILD_BUG_ON(FORCEWAKE_MEDIA != (1 << FW_DOMAIN_ID_MEDIA));
1382 1383 1384 1385 1386 1387 1388
	BUILD_BUG_ON(FORCEWAKE_MEDIA_VDBOX0 != (1 << FW_DOMAIN_ID_MEDIA_VDBOX0));
	BUILD_BUG_ON(FORCEWAKE_MEDIA_VDBOX1 != (1 << FW_DOMAIN_ID_MEDIA_VDBOX1));
	BUILD_BUG_ON(FORCEWAKE_MEDIA_VDBOX2 != (1 << FW_DOMAIN_ID_MEDIA_VDBOX2));
	BUILD_BUG_ON(FORCEWAKE_MEDIA_VDBOX3 != (1 << FW_DOMAIN_ID_MEDIA_VDBOX3));
	BUILD_BUG_ON(FORCEWAKE_MEDIA_VEBOX0 != (1 << FW_DOMAIN_ID_MEDIA_VEBOX0));
	BUILD_BUG_ON(FORCEWAKE_MEDIA_VEBOX1 != (1 << FW_DOMAIN_ID_MEDIA_VEBOX1));

C
Chris Wilson 已提交
1389
	d->mask = BIT(domain_id);
1390

1391 1392
	hrtimer_init(&d->timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
	d->timer.function = intel_uncore_fw_release_timer;
1393

1394
	uncore->fw_domains |= BIT(domain_id);
1395

1396
	fw_domain_reset(d);
1397 1398 1399 1400

	uncore->fw_domain[domain_id] = d;

	return 0;
1401 1402
}

1403
static void fw_domain_fini(struct intel_uncore *uncore,
1404 1405 1406 1407
			   enum forcewake_domain_id domain_id)
{
	struct intel_uncore_forcewake_domain *d;

1408
	GEM_BUG_ON(domain_id >= FW_DOMAIN_ID_COUNT);
1409

1410 1411 1412
	d = fetch_and_zero(&uncore->fw_domain[domain_id]);
	if (!d)
		return;
1413

1414
	uncore->fw_domains &= ~BIT(domain_id);
1415 1416
	WARN_ON(d->wake_count);
	WARN_ON(hrtimer_cancel(&d->timer));
1417 1418
	kfree(d);
}
1419

1420 1421 1422 1423 1424 1425 1426
static void intel_uncore_fw_domains_fini(struct intel_uncore *uncore)
{
	struct intel_uncore_forcewake_domain *d;
	int tmp;

	for_each_fw_domain(d, uncore, tmp)
		fw_domain_fini(uncore, d->id);
1427 1428
}

1429
static int intel_uncore_fw_domains_init(struct intel_uncore *uncore)
1430
{
1431
	struct drm_i915_private *i915 = uncore->i915;
1432
	int ret = 0;
1433

1434
	GEM_BUG_ON(!intel_uncore_has_forcewake(uncore));
1435

1436 1437 1438
#define fw_domain_init(uncore__, id__, set__, ack__) \
	(ret ?: (ret = __fw_domain_init((uncore__), (id__), (set__), (ack__))))

1439
	if (INTEL_GEN(i915) >= 11) {
1440 1441
		int i;

1442
		uncore->funcs.force_wake_get = fw_domains_get_with_fallback;
1443 1444
		uncore->funcs.force_wake_put = fw_domains_put;
		fw_domain_init(uncore, FW_DOMAIN_ID_RENDER,
1445 1446
			       FORCEWAKE_RENDER_GEN9,
			       FORCEWAKE_ACK_RENDER_GEN9);
1447
		fw_domain_init(uncore, FW_DOMAIN_ID_BLITTER,
1448 1449
			       FORCEWAKE_BLITTER_GEN9,
			       FORCEWAKE_ACK_BLITTER_GEN9);
1450

1451
		for (i = 0; i < I915_MAX_VCS; i++) {
1452
			if (!HAS_ENGINE(i915, _VCS(i)))
1453 1454
				continue;

1455
			fw_domain_init(uncore, FW_DOMAIN_ID_MEDIA_VDBOX0 + i,
1456 1457 1458 1459
				       FORCEWAKE_MEDIA_VDBOX_GEN11(i),
				       FORCEWAKE_ACK_MEDIA_VDBOX_GEN11(i));
		}
		for (i = 0; i < I915_MAX_VECS; i++) {
1460
			if (!HAS_ENGINE(i915, _VECS(i)))
1461 1462
				continue;

1463
			fw_domain_init(uncore, FW_DOMAIN_ID_MEDIA_VEBOX0 + i,
1464 1465 1466
				       FORCEWAKE_MEDIA_VEBOX_GEN11(i),
				       FORCEWAKE_ACK_MEDIA_VEBOX_GEN11(i));
		}
1467
	} else if (IS_GEN_RANGE(i915, 9, 10)) {
1468
		uncore->funcs.force_wake_get = fw_domains_get_with_fallback;
1469 1470
		uncore->funcs.force_wake_put = fw_domains_put;
		fw_domain_init(uncore, FW_DOMAIN_ID_RENDER,
1471 1472
			       FORCEWAKE_RENDER_GEN9,
			       FORCEWAKE_ACK_RENDER_GEN9);
1473
		fw_domain_init(uncore, FW_DOMAIN_ID_BLITTER,
1474 1475
			       FORCEWAKE_BLITTER_GEN9,
			       FORCEWAKE_ACK_BLITTER_GEN9);
1476
		fw_domain_init(uncore, FW_DOMAIN_ID_MEDIA,
1477
			       FORCEWAKE_MEDIA_GEN9, FORCEWAKE_ACK_MEDIA_GEN9);
1478 1479 1480 1481
	} else if (IS_VALLEYVIEW(i915) || IS_CHERRYVIEW(i915)) {
		uncore->funcs.force_wake_get = fw_domains_get;
		uncore->funcs.force_wake_put = fw_domains_put;
		fw_domain_init(uncore, FW_DOMAIN_ID_RENDER,
1482
			       FORCEWAKE_VLV, FORCEWAKE_ACK_VLV);
1483
		fw_domain_init(uncore, FW_DOMAIN_ID_MEDIA,
1484
			       FORCEWAKE_MEDIA_VLV, FORCEWAKE_ACK_MEDIA_VLV);
1485 1486
	} else if (IS_HASWELL(i915) || IS_BROADWELL(i915)) {
		uncore->funcs.force_wake_get =
1487
			fw_domains_get_with_thread_status;
1488 1489
		uncore->funcs.force_wake_put = fw_domains_put;
		fw_domain_init(uncore, FW_DOMAIN_ID_RENDER,
1490
			       FORCEWAKE_MT, FORCEWAKE_ACK_HSW);
1491
	} else if (IS_IVYBRIDGE(i915)) {
1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502
		u32 ecobus;

		/* IVB configs may use multi-threaded forcewake */

		/* A small trick here - if the bios hasn't configured
		 * MT forcewake, and if the device is in RC6, then
		 * force_wake_mt_get will not wake the device and the
		 * ECOBUS read will return zero. Which will be
		 * (correctly) interpreted by the test below as MT
		 * forcewake being disabled.
		 */
1503
		uncore->funcs.force_wake_get =
1504
			fw_domains_get_with_thread_status;
1505
		uncore->funcs.force_wake_put = fw_domains_put;
1506

1507 1508
		/* We need to init first for ECOBUS access and then
		 * determine later if we want to reinit, in case of MT access is
1509 1510 1511
		 * not working. In this stage we don't know which flavour this
		 * ivb is, so it is better to reset also the gen6 fw registers
		 * before the ecobus check.
1512
		 */
1513

1514
		__raw_uncore_write32(uncore, FORCEWAKE, 0);
1515
		__raw_posting_read(uncore, ECOBUS);
1516

1517 1518 1519 1520
		ret = __fw_domain_init(uncore, FW_DOMAIN_ID_RENDER,
				       FORCEWAKE_MT, FORCEWAKE_MT_ACK);
		if (ret)
			goto out;
1521

1522 1523
		spin_lock_irq(&uncore->lock);
		fw_domains_get_with_thread_status(uncore, FORCEWAKE_RENDER);
1524
		ecobus = __raw_uncore_read32(uncore, ECOBUS);
1525 1526
		fw_domains_put(uncore, FORCEWAKE_RENDER);
		spin_unlock_irq(&uncore->lock);
1527

1528
		if (!(ecobus & FORCEWAKE_MT_ENABLE)) {
1529 1530
			DRM_INFO("No MT forcewake available on Ivybridge, this can result in issues\n");
			DRM_INFO("when using vblank-synced partial screen updates.\n");
1531
			fw_domain_fini(uncore, FW_DOMAIN_ID_RENDER);
1532
			fw_domain_init(uncore, FW_DOMAIN_ID_RENDER,
1533
				       FORCEWAKE, FORCEWAKE_ACK);
1534
		}
1535 1536
	} else if (IS_GEN(i915, 6)) {
		uncore->funcs.force_wake_get =
1537
			fw_domains_get_with_thread_status;
1538 1539
		uncore->funcs.force_wake_put = fw_domains_put;
		fw_domain_init(uncore, FW_DOMAIN_ID_RENDER,
1540
			       FORCEWAKE, FORCEWAKE_ACK);
1541
	}
1542

1543 1544
#undef fw_domain_init

1545
	/* All future platforms are expected to require complex power gating */
1546 1547 1548 1549 1550 1551 1552
	WARN_ON(!ret && uncore->fw_domains == 0);

out:
	if (ret)
		intel_uncore_fw_domains_fini(uncore);

	return ret;
1553 1554
}

1555
#define ASSIGN_FW_DOMAINS_TABLE(uncore, d) \
1556
{ \
1557
	(uncore)->fw_domains_table = \
1558
			(struct intel_forcewake_range *)(d); \
1559
	(uncore)->fw_domains_table_entries = ARRAY_SIZE((d)); \
1560 1561
}

1562 1563 1564
static int i915_pmic_bus_access_notifier(struct notifier_block *nb,
					 unsigned long action, void *data)
{
1565 1566
	struct intel_uncore *uncore = container_of(nb,
			struct intel_uncore, pmic_bus_access_nb);
1567 1568 1569 1570 1571 1572 1573 1574 1575 1576

	switch (action) {
	case MBI_PMIC_BUS_ACCESS_BEGIN:
		/*
		 * forcewake all now to make sure that we don't need to do a
		 * forcewake later which on systems where this notifier gets
		 * called requires the punit to access to the shared pmic i2c
		 * bus, which will be busy after this notification, leading to:
		 * "render: timed out waiting for forcewake ack request."
		 * errors.
1577 1578 1579 1580 1581
		 *
		 * The notifier is unregistered during intel_runtime_suspend(),
		 * so it's ok to access the HW here without holding a RPM
		 * wake reference -> disable wakeref asserts for the time of
		 * the access.
1582
		 */
1583 1584 1585
		disable_rpm_wakeref_asserts(uncore->rpm);
		intel_uncore_forcewake_get(uncore, FORCEWAKE_ALL);
		enable_rpm_wakeref_asserts(uncore->rpm);
1586 1587
		break;
	case MBI_PMIC_BUS_ACCESS_END:
1588
		intel_uncore_forcewake_put(uncore, FORCEWAKE_ALL);
1589 1590 1591 1592 1593 1594
		break;
	}

	return NOTIFY_OK;
}

1595 1596
static int uncore_mmio_setup(struct intel_uncore *uncore)
{
1597
	struct drm_i915_private *i915 = uncore->i915;
1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626
	struct pci_dev *pdev = i915->drm.pdev;
	int mmio_bar;
	int mmio_size;

	mmio_bar = IS_GEN(i915, 2) ? 1 : 0;
	/*
	 * Before gen4, the registers and the GTT are behind different BARs.
	 * However, from gen4 onwards, the registers and the GTT are shared
	 * in the same BAR, so we want to restrict this ioremap from
	 * clobbering the GTT which we want ioremap_wc instead. Fortunately,
	 * the register BAR remains the same size for all the earlier
	 * generations up to Ironlake.
	 */
	if (INTEL_GEN(i915) < 5)
		mmio_size = 512 * 1024;
	else
		mmio_size = 2 * 1024 * 1024;
	uncore->regs = pci_iomap(pdev, mmio_bar, mmio_size);
	if (uncore->regs == NULL) {
		DRM_ERROR("failed to map registers\n");

		return -EIO;
	}

	return 0;
}

static void uncore_mmio_cleanup(struct intel_uncore *uncore)
{
1627
	struct pci_dev *pdev = uncore->i915->drm.pdev;
1628 1629 1630 1631

	pci_iounmap(pdev, uncore->regs);
}

1632 1633
void intel_uncore_init_early(struct intel_uncore *uncore,
			     struct drm_i915_private *i915)
1634 1635
{
	spin_lock_init(&uncore->lock);
1636 1637
	uncore->i915 = i915;
	uncore->rpm = &i915->runtime_pm;
1638
	uncore->debug = &i915->mmio_debug;
1639
}
1640

1641
static void uncore_raw_init(struct intel_uncore *uncore)
1642
{
1643
	GEM_BUG_ON(intel_uncore_has_forcewake(uncore));
1644

1645 1646 1647 1648 1649 1650 1651 1652
	if (IS_GEN(uncore->i915, 5)) {
		ASSIGN_RAW_WRITE_MMIO_VFUNCS(uncore, gen5);
		ASSIGN_RAW_READ_MMIO_VFUNCS(uncore, gen5);
	} else {
		ASSIGN_RAW_WRITE_MMIO_VFUNCS(uncore, gen2);
		ASSIGN_RAW_READ_MMIO_VFUNCS(uncore, gen2);
	}
}
1653

1654
static int uncore_forcewake_init(struct intel_uncore *uncore)
1655 1656
{
	struct drm_i915_private *i915 = uncore->i915;
1657
	int ret;
1658

1659
	GEM_BUG_ON(!intel_uncore_has_forcewake(uncore));
1660

1661 1662 1663
	ret = intel_uncore_fw_domains_init(uncore);
	if (ret)
		return ret;
1664
	forcewake_early_sanitize(uncore, 0);
1665

1666
	if (IS_GEN_RANGE(i915, 6, 7)) {
1667 1668 1669 1670 1671
		ASSIGN_WRITE_MMIO_VFUNCS(uncore, gen6);

		if (IS_VALLEYVIEW(i915)) {
			ASSIGN_FW_DOMAINS_TABLE(uncore, __vlv_fw_ranges);
			ASSIGN_READ_MMIO_VFUNCS(uncore, fwtable);
1672
		} else {
1673
			ASSIGN_READ_MMIO_VFUNCS(uncore, gen6);
1674
		}
1675 1676 1677 1678 1679
	} else if (IS_GEN(i915, 8)) {
		if (IS_CHERRYVIEW(i915)) {
			ASSIGN_FW_DOMAINS_TABLE(uncore, __chv_fw_ranges);
			ASSIGN_WRITE_MMIO_VFUNCS(uncore, fwtable);
			ASSIGN_READ_MMIO_VFUNCS(uncore, fwtable);
1680
		} else {
1681 1682
			ASSIGN_WRITE_MMIO_VFUNCS(uncore, gen8);
			ASSIGN_READ_MMIO_VFUNCS(uncore, gen6);
1683
		}
1684 1685 1686 1687
	} else if (IS_GEN_RANGE(i915, 9, 10)) {
		ASSIGN_FW_DOMAINS_TABLE(uncore, __gen9_fw_ranges);
		ASSIGN_WRITE_MMIO_VFUNCS(uncore, fwtable);
		ASSIGN_READ_MMIO_VFUNCS(uncore, fwtable);
1688
	} else {
1689 1690 1691
		ASSIGN_FW_DOMAINS_TABLE(uncore, __gen11_fw_ranges);
		ASSIGN_WRITE_MMIO_VFUNCS(uncore, gen11_fwtable);
		ASSIGN_READ_MMIO_VFUNCS(uncore, gen11_fwtable);
1692
	}
1693

1694 1695
	uncore->pmic_bus_access_nb.notifier_call = i915_pmic_bus_access_notifier;
	iosf_mbi_register_pmic_bus_access_notifier(&uncore->pmic_bus_access_nb);
1696 1697

	return 0;
1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711
}

int intel_uncore_init_mmio(struct intel_uncore *uncore)
{
	struct drm_i915_private *i915 = uncore->i915;
	int ret;

	ret = uncore_mmio_setup(uncore);
	if (ret)
		return ret;

	if (INTEL_GEN(i915) > 5 && !intel_vgpu_active(i915))
		uncore->flags |= UNCORE_HAS_FORCEWAKE;

1712
	if (!intel_uncore_has_forcewake(uncore)) {
1713
		uncore_raw_init(uncore);
1714 1715 1716 1717 1718
	} else {
		ret = uncore_forcewake_init(uncore);
		if (ret)
			goto out_mmio_cleanup;
	}
1719

1720 1721 1722 1723 1724 1725
	/* make sure fw funcs are set if and only if we have fw*/
	GEM_BUG_ON(intel_uncore_has_forcewake(uncore) != !!uncore->funcs.force_wake_get);
	GEM_BUG_ON(intel_uncore_has_forcewake(uncore) != !!uncore->funcs.force_wake_put);
	GEM_BUG_ON(intel_uncore_has_forcewake(uncore) != !!uncore->funcs.read_fw_domains);
	GEM_BUG_ON(intel_uncore_has_forcewake(uncore) != !!uncore->funcs.write_fw_domains);

1726 1727 1728 1729 1730 1731 1732 1733 1734
	if (HAS_FPGA_DBG_UNCLAIMED(i915))
		uncore->flags |= UNCORE_HAS_FPGA_DBG_UNCLAIMED;

	if (IS_VALLEYVIEW(i915) || IS_CHERRYVIEW(i915))
		uncore->flags |= UNCORE_HAS_DBG_UNCLAIMED;

	if (IS_GEN_RANGE(i915, 6, 7))
		uncore->flags |= UNCORE_HAS_FIFO;

1735
	/* clear out unclaimed reg detection bit */
1736
	if (intel_uncore_unclaimed_mmio(uncore))
1737
		DRM_DEBUG("unclaimed mmio detected on uncore init, clearing\n");
1738 1739

	return 0;
1740 1741 1742 1743 1744

out_mmio_cleanup:
	uncore_mmio_cleanup(uncore);

	return ret;
1745 1746
}

1747 1748 1749 1750 1751
/*
 * We might have detected that some engines are fused off after we initialized
 * the forcewake domains. Prune them, to make sure they only reference existing
 * engines.
 */
1752
void intel_uncore_prune_mmio_domains(struct intel_uncore *uncore)
1753
{
1754
	struct drm_i915_private *i915 = uncore->i915;
1755 1756 1757
	enum forcewake_domains fw_domains = uncore->fw_domains;
	enum forcewake_domain_id domain_id;
	int i;
1758

1759 1760
	if (!intel_uncore_has_forcewake(uncore) || INTEL_GEN(i915) < 11)
		return;
1761

1762 1763
	for (i = 0; i < I915_MAX_VCS; i++) {
		domain_id = FW_DOMAIN_ID_MEDIA_VDBOX0 + i;
1764

1765 1766
		if (HAS_ENGINE(i915, _VCS(i)))
			continue;
1767

1768 1769 1770
		if (fw_domains & BIT(domain_id))
			fw_domain_fini(uncore, domain_id);
	}
1771

1772 1773
	for (i = 0; i < I915_MAX_VECS; i++) {
		domain_id = FW_DOMAIN_ID_MEDIA_VEBOX0 + i;
1774

1775 1776
		if (HAS_ENGINE(i915, _VECS(i)))
			continue;
1777

1778 1779
		if (fw_domains & BIT(domain_id))
			fw_domain_fini(uncore, domain_id);
1780 1781 1782
	}
}

1783
void intel_uncore_fini_mmio(struct intel_uncore *uncore)
1784
{
1785 1786 1787 1788 1789
	if (intel_uncore_has_forcewake(uncore)) {
		iosf_mbi_punit_acquire();
		iosf_mbi_unregister_pmic_bus_access_notifier_unlocked(
			&uncore->pmic_bus_access_nb);
		intel_uncore_forcewake_reset(uncore);
1790
		intel_uncore_fw_domains_fini(uncore);
1791 1792 1793
		iosf_mbi_punit_release();
	}

1794
	uncore_mmio_cleanup(uncore);
1795 1796
}

1797 1798 1799 1800 1801 1802 1803 1804
static const struct reg_whitelist {
	i915_reg_t offset_ldw;
	i915_reg_t offset_udw;
	u16 gen_mask;
	u8 size;
} reg_read_whitelist[] = { {
	.offset_ldw = RING_TIMESTAMP(RENDER_RING_BASE),
	.offset_udw = RING_TIMESTAMP_UDW(RENDER_RING_BASE),
1805
	.gen_mask = INTEL_GEN_MASK(4, 12),
1806 1807
	.size = 8
} };
1808 1809 1810 1811

int i915_reg_read_ioctl(struct drm_device *dev,
			void *data, struct drm_file *file)
{
1812 1813
	struct drm_i915_private *i915 = to_i915(dev);
	struct intel_uncore *uncore = &i915->uncore;
1814
	struct drm_i915_reg_read *reg = data;
1815
	struct reg_whitelist const *entry;
1816
	intel_wakeref_t wakeref;
1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829
	unsigned int flags;
	int remain;
	int ret = 0;

	entry = reg_read_whitelist;
	remain = ARRAY_SIZE(reg_read_whitelist);
	while (remain) {
		u32 entry_offset = i915_mmio_reg_offset(entry->offset_ldw);

		GEM_BUG_ON(!is_power_of_2(entry->size));
		GEM_BUG_ON(entry->size > 8);
		GEM_BUG_ON(entry_offset & (entry->size - 1));

1830
		if (INTEL_INFO(i915)->gen_mask & entry->gen_mask &&
1831
		    entry_offset == (reg->offset & -entry->size))
1832
			break;
1833 1834
		entry++;
		remain--;
1835 1836
	}

1837
	if (!remain)
1838 1839
		return -EINVAL;

1840
	flags = reg->offset & (entry->size - 1);
1841

1842
	with_intel_runtime_pm(&i915->runtime_pm, wakeref) {
1843
		if (entry->size == 8 && flags == I915_REG_READ_8B_WA)
1844 1845 1846
			reg->val = intel_uncore_read64_2x32(uncore,
							    entry->offset_ldw,
							    entry->offset_udw);
1847
		else if (entry->size == 8 && flags == 0)
1848 1849
			reg->val = intel_uncore_read64(uncore,
						       entry->offset_ldw);
1850
		else if (entry->size == 4 && flags == 0)
1851
			reg->val = intel_uncore_read(uncore, entry->offset_ldw);
1852
		else if (entry->size == 2 && flags == 0)
1853 1854
			reg->val = intel_uncore_read16(uncore,
						       entry->offset_ldw);
1855
		else if (entry->size == 1 && flags == 0)
1856 1857
			reg->val = intel_uncore_read8(uncore,
						      entry->offset_ldw);
1858 1859 1860
		else
			ret = -EINVAL;
	}
1861

1862
	return ret;
1863 1864
}

1865
/**
1866
 * __intel_wait_for_register_fw - wait until register matches expected state
1867
 * @uncore: the struct intel_uncore
1868 1869 1870
 * @reg: the register to read
 * @mask: mask to apply to register value
 * @value: expected value
1871 1872 1873
 * @fast_timeout_us: fast timeout in microsecond for atomic/tight wait
 * @slow_timeout_ms: slow timeout in millisecond
 * @out_value: optional placeholder to hold registry value
1874 1875
 *
 * This routine waits until the target register @reg contains the expected
1876 1877 1878 1879
 * @value after applying the @mask, i.e. it waits until ::
 *
 *     (I915_READ_FW(reg) & mask) == value
 *
1880
 * Otherwise, the wait will timeout after @slow_timeout_ms milliseconds.
1881
 * For atomic context @slow_timeout_ms must be zero and @fast_timeout_us
1882
 * must be not larger than 20,0000 microseconds.
1883 1884 1885 1886 1887 1888
 *
 * Note that this routine assumes the caller holds forcewake asserted, it is
 * not suitable for very long waits. See intel_wait_for_register() if you
 * wish to wait without holding forcewake for the duration (i.e. you expect
 * the wait to be slow).
 *
1889
 * Return: 0 if the register matches the desired condition, or -ETIMEDOUT.
1890
 */
1891
int __intel_wait_for_register_fw(struct intel_uncore *uncore,
1892
				 i915_reg_t reg,
1893 1894 1895 1896
				 u32 mask,
				 u32 value,
				 unsigned int fast_timeout_us,
				 unsigned int slow_timeout_ms,
1897
				 u32 *out_value)
1898
{
1899
	u32 uninitialized_var(reg_value);
1900
#define done (((reg_value = intel_uncore_read_fw(uncore, reg)) & mask) == value)
1901 1902
	int ret;

1903
	/* Catch any overuse of this function */
1904 1905
	might_sleep_if(slow_timeout_ms);
	GEM_BUG_ON(fast_timeout_us > 20000);
1906

1907 1908
	ret = -ETIMEDOUT;
	if (fast_timeout_us && fast_timeout_us <= 20000)
1909
		ret = _wait_for_atomic(done, fast_timeout_us, 0);
1910
	if (ret && slow_timeout_ms)
1911
		ret = wait_for(done, slow_timeout_ms);
1912

1913 1914
	if (out_value)
		*out_value = reg_value;
1915

1916 1917 1918 1919 1920
	return ret;
#undef done
}

/**
1921
 * __intel_wait_for_register - wait until register matches expected state
1922
 * @uncore: the struct intel_uncore
1923 1924 1925
 * @reg: the register to read
 * @mask: mask to apply to register value
 * @value: expected value
1926 1927 1928
 * @fast_timeout_us: fast timeout in microsecond for atomic/tight wait
 * @slow_timeout_ms: slow timeout in millisecond
 * @out_value: optional placeholder to hold registry value
1929 1930
 *
 * This routine waits until the target register @reg contains the expected
1931 1932 1933 1934
 * @value after applying the @mask, i.e. it waits until ::
 *
 *     (I915_READ(reg) & mask) == value
 *
1935 1936
 * Otherwise, the wait will timeout after @timeout_ms milliseconds.
 *
1937
 * Return: 0 if the register matches the desired condition, or -ETIMEDOUT.
1938
 */
1939 1940 1941 1942 1943 1944 1945 1946
int __intel_wait_for_register(struct intel_uncore *uncore,
			      i915_reg_t reg,
			      u32 mask,
			      u32 value,
			      unsigned int fast_timeout_us,
			      unsigned int slow_timeout_ms,
			      u32 *out_value)
{
1947
	unsigned fw =
1948
		intel_uncore_forcewake_for_reg(uncore, reg, FW_REG_READ);
1949
	u32 reg_value;
1950 1951
	int ret;

1952
	might_sleep_if(slow_timeout_ms);
1953

1954 1955
	spin_lock_irq(&uncore->lock);
	intel_uncore_forcewake_get__locked(uncore, fw);
1956

1957
	ret = __intel_wait_for_register_fw(uncore,
1958
					   reg, mask, value,
1959
					   fast_timeout_us, 0, &reg_value);
1960

1961 1962
	intel_uncore_forcewake_put__locked(uncore, fw);
	spin_unlock_irq(&uncore->lock);
1963

1964
	if (ret && slow_timeout_ms)
1965 1966
		ret = __wait_for(reg_value = intel_uncore_read_notrace(uncore,
								       reg),
1967 1968 1969
				 (reg_value & mask) == value,
				 slow_timeout_ms * 1000, 10, 1000);

1970 1971 1972
	/* just trace the final value */
	trace_i915_reg_rw(false, reg, reg_value, sizeof(reg_value), true);

1973 1974
	if (out_value)
		*out_value = reg_value;
1975 1976

	return ret;
1977 1978
}

1979
bool intel_uncore_unclaimed_mmio(struct intel_uncore *uncore)
1980
{
1981 1982 1983 1984 1985 1986 1987
	bool ret;

	spin_lock_irq(&uncore->debug->lock);
	ret = check_for_unclaimed_mmio(uncore);
	spin_unlock_irq(&uncore->debug->lock);

	return ret;
1988
}
1989

1990
bool
1991
intel_uncore_arm_unclaimed_mmio_detection(struct intel_uncore *uncore)
1992
{
1993 1994
	bool ret = false;

1995
	spin_lock_irq(&uncore->debug->lock);
1996

1997
	if (unlikely(uncore->debug->unclaimed_mmio_check <= 0))
1998
		goto out;
1999

2000
	if (unlikely(check_for_unclaimed_mmio(uncore))) {
2001 2002 2003 2004 2005 2006
		if (!i915_modparams.mmio_debug) {
			DRM_DEBUG("Unclaimed register detected, "
				  "enabling oneshot unclaimed register reporting. "
				  "Please use i915.mmio_debug=N for more information.\n");
			i915_modparams.mmio_debug++;
		}
2007
		uncore->debug->unclaimed_mmio_check--;
2008
		ret = true;
2009
	}
2010

2011
out:
2012
	spin_unlock_irq(&uncore->debug->lock);
2013 2014

	return ret;
2015
}
2016 2017 2018 2019

/**
 * intel_uncore_forcewake_for_reg - which forcewake domains are needed to access
 * 				    a register
2020
 * @uncore: pointer to struct intel_uncore
2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031
 * @reg: register in question
 * @op: operation bitmask of FW_REG_READ and/or FW_REG_WRITE
 *
 * Returns a set of forcewake domains required to be taken with for example
 * intel_uncore_forcewake_get for the specified register to be accessible in the
 * specified mode (read, write or read/write) with raw mmio accessors.
 *
 * NOTE: On Gen6 and Gen7 write forcewake domain (FORCEWAKE_RENDER) requires the
 * callers to do FIFO management on their own or risk losing writes.
 */
enum forcewake_domains
2032
intel_uncore_forcewake_for_reg(struct intel_uncore *uncore,
2033 2034 2035 2036 2037 2038
			       i915_reg_t reg, unsigned int op)
{
	enum forcewake_domains fw_domains = 0;

	WARN_ON(!op);

2039
	if (!intel_uncore_has_forcewake(uncore))
T
Tvrtko Ursulin 已提交
2040 2041
		return 0;

2042
	if (op & FW_REG_READ)
2043
		fw_domains = uncore->funcs.read_fw_domains(uncore, reg);
2044 2045

	if (op & FW_REG_WRITE)
2046 2047 2048
		fw_domains |= uncore->funcs.write_fw_domains(uncore, reg);

	WARN_ON(fw_domains & ~uncore->fw_domains);
2049 2050 2051

	return fw_domains;
}
2052 2053

#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
2054
#include "selftests/mock_uncore.c"
2055 2056
#include "selftests/intel_uncore.c"
#endif