/*
 * Copyright © 2016 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 */

#include "i915_drv.h"

void intel_device_info_dump(struct drm_i915_private *dev_priv)
{
	const struct intel_device_info *info = &dev_priv->info;

31
	DRM_DEBUG_DRIVER("i915 device info: gen=%i, pciid=0x%04x rev=0x%02x",
32 33
			 info->gen,
			 dev_priv->drm.pdev->device,
34 35 36 37
			 dev_priv->drm.pdev->revision);
#define PRINT_FLAG(name) \
	DRM_DEBUG_DRIVER("i915 device info: " #name ": %s", yesno(info->name))
	DEV_INFO_FOR_EACH_FLAG(PRINT_FLAG);
38 39 40 41 42
#undef PRINT_FLAG
}

static void cherryview_sseu_info_init(struct drm_i915_private *dev_priv)
{
43
	struct sseu_dev_info *sseu = &mkwrite_device_info(dev_priv)->sseu;
44 45 46 47
	u32 fuse, eu_dis;

	fuse = I915_READ(CHV_FUSE_GT);

48
	sseu->slice_mask = BIT(0);
49 50

	if (!(fuse & CHV_FGT_DISABLE_SS0)) {
51
		sseu->subslice_mask |= BIT(0);
52 53
		eu_dis = fuse & (CHV_FGT_EU_DIS_SS0_R0_MASK |
				 CHV_FGT_EU_DIS_SS0_R1_MASK);
54
		sseu->eu_total += 8 - hweight32(eu_dis);
55 56 57
	}

	if (!(fuse & CHV_FGT_DISABLE_SS1)) {
58
		sseu->subslice_mask |= BIT(1);
59 60
		eu_dis = fuse & (CHV_FGT_EU_DIS_SS1_R0_MASK |
				 CHV_FGT_EU_DIS_SS1_R1_MASK);
61
		sseu->eu_total += 8 - hweight32(eu_dis);
62 63 64 65 66 67
	}

	/*
	 * CHV expected to always have a uniform distribution of EU
	 * across subslices.
	*/
68 69
	sseu->eu_per_subslice = sseu_subslice_total(sseu) ?
				sseu->eu_total / sseu_subslice_total(sseu) :
70 71 72 73 74 75
				0;
	/*
	 * CHV supports subslice power gating on devices with more than
	 * one subslice, and supports EU power gating on devices with
	 * more than one EU pair per subslice.
	*/
76
	sseu->has_slice_pg = 0;
77
	sseu->has_subslice_pg = sseu_subslice_total(sseu) > 1;
78
	sseu->has_eu_pg = (sseu->eu_per_subslice > 2);
79 80 81 82 83
}

static void gen9_sseu_info_init(struct drm_i915_private *dev_priv)
{
	struct intel_device_info *info = mkwrite_device_info(dev_priv);
84
	struct sseu_dev_info *sseu = &info->sseu;
85 86
	int s_max = 3, ss_max = 4, eu_max = 8;
	int s, ss;
87
	u32 fuse2, eu_disable;
88 89 90
	u8 eu_mask = 0xff;

	fuse2 = I915_READ(GEN8_FUSE2);
91
	sseu->slice_mask = (fuse2 & GEN8_F2_S_ENA_MASK) >> GEN8_F2_S_ENA_SHIFT;
92 93 94 95 96

	/*
	 * The subslice disable field is global, i.e. it applies
	 * to each of the enabled slices.
	*/
97 98 99
	sseu->subslice_mask = (1 << ss_max) - 1;
	sseu->subslice_mask &= ~((fuse2 & GEN9_F2_SS_DIS_MASK) >>
				 GEN9_F2_SS_DIS_SHIFT);
100 101 102 103 104 105

	/*
	 * Iterate through enabled slices and subslices to
	 * count the total enabled EU.
	*/
	for (s = 0; s < s_max; s++) {
106
		if (!(sseu->slice_mask & BIT(s)))
107 108 109 110 111 112 113
			/* skip disabled slice */
			continue;

		eu_disable = I915_READ(GEN9_EU_DISABLE(s));
		for (ss = 0; ss < ss_max; ss++) {
			int eu_per_ss;

114
			if (!(sseu->subslice_mask & BIT(ss)))
115 116 117 118 119 120 121 122 123 124 125 126
				/* skip disabled subslice */
				continue;

			eu_per_ss = eu_max - hweight8((eu_disable >> (ss*8)) &
						      eu_mask);

			/*
			 * Record which subslice(s) has(have) 7 EUs. we
			 * can tune the hash used to spread work among
			 * subslices if they are unbalanced.
			 */
			if (eu_per_ss == 7)
127
				sseu->subslice_7eu[s] |= BIT(ss);
128

129
			sseu->eu_total += eu_per_ss;
130 131 132 133 134 135 136 137 138 139
		}
	}

	/*
	 * SKL is expected to always have a uniform distribution
	 * of EU across subslices with the exception that any one
	 * EU in any one subslice may be fused off for die
	 * recovery. BXT is expected to be perfectly uniform in EU
	 * distribution.
	*/
140
	sseu->eu_per_subslice = sseu_subslice_total(sseu) ?
141
				DIV_ROUND_UP(sseu->eu_total,
142
					     sseu_subslice_total(sseu)) : 0;
143 144 145 146 147 148 149 150
	/*
	 * SKL supports slice power gating on devices with more than
	 * one slice, and supports EU power gating on devices with
	 * more than one EU pair per subslice. BXT supports subslice
	 * power gating on devices with more than one subslice, and
	 * supports EU power gating on devices with more than one EU
	 * pair per subslice.
	*/
151
	sseu->has_slice_pg =
152
		(IS_SKYLAKE(dev_priv) || IS_KABYLAKE(dev_priv)) &&
153
		hweight8(sseu->slice_mask) > 1;
154
	sseu->has_subslice_pg =
155
		IS_BROXTON(dev_priv) && sseu_subslice_total(sseu) > 1;
156
	sseu->has_eu_pg = sseu->eu_per_subslice > 2;
157 158

	if (IS_BROXTON(dev_priv)) {
159
#define IS_SS_DISABLED(ss)	(!(sseu->subslice_mask & BIT(ss)))
160 161 162 163 164 165 166
		/*
		 * There is a HW issue in 2x6 fused down parts that requires
		 * Pooled EU to be enabled as a WA. The pool configuration
		 * changes depending upon which subslice is fused down. This
		 * doesn't affect if the device has all 3 subslices enabled.
		 */
		/* WaEnablePooledEuFor2x6:bxt */
167 168
		info->has_pooled_eu = ((hweight8(sseu->subslice_mask) == 3) ||
				       (hweight8(sseu->subslice_mask) == 2 &&
169 170
					INTEL_REVID(dev_priv) < BXT_REVID_C0));

171
		sseu->min_eu_in_pool = 0;
172
		if (info->has_pooled_eu) {
173
			if (IS_SS_DISABLED(2) || IS_SS_DISABLED(0))
174
				sseu->min_eu_in_pool = 3;
175
			else if (IS_SS_DISABLED(1))
176
				sseu->min_eu_in_pool = 6;
177
			else
178
				sseu->min_eu_in_pool = 9;
179 180 181 182 183 184 185
		}
#undef IS_SS_DISABLED
	}
}

static void broadwell_sseu_info_init(struct drm_i915_private *dev_priv)
{
186
	struct sseu_dev_info *sseu = &mkwrite_device_info(dev_priv)->sseu;
187 188
	const int s_max = 3, ss_max = 3, eu_max = 8;
	int s, ss;
189
	u32 fuse2, eu_disable[3]; /* s_max */
190 191

	fuse2 = I915_READ(GEN8_FUSE2);
192
	sseu->slice_mask = (fuse2 & GEN8_F2_S_ENA_MASK) >> GEN8_F2_S_ENA_SHIFT;
193 194 195 196 197 198 199
	/*
	 * The subslice disable field is global, i.e. it applies
	 * to each of the enabled slices.
	 */
	sseu->subslice_mask = BIT(ss_max) - 1;
	sseu->subslice_mask &= ~((fuse2 & GEN8_F2_SS_DIS_MASK) >>
				 GEN8_F2_SS_DIS_SHIFT);
200 201 202 203 204 205 206 207 208 209 210 211 212 213

	eu_disable[0] = I915_READ(GEN8_EU_DISABLE0) & GEN8_EU_DIS0_S0_MASK;
	eu_disable[1] = (I915_READ(GEN8_EU_DISABLE0) >> GEN8_EU_DIS0_S1_SHIFT) |
			((I915_READ(GEN8_EU_DISABLE1) & GEN8_EU_DIS1_S1_MASK) <<
			 (32 - GEN8_EU_DIS0_S1_SHIFT));
	eu_disable[2] = (I915_READ(GEN8_EU_DISABLE1) >> GEN8_EU_DIS1_S2_SHIFT) |
			((I915_READ(GEN8_EU_DISABLE2) & GEN8_EU_DIS2_S2_MASK) <<
			 (32 - GEN8_EU_DIS1_S2_SHIFT));

	/*
	 * Iterate through enabled slices and subslices to
	 * count the total enabled EU.
	 */
	for (s = 0; s < s_max; s++) {
214
		if (!(sseu->slice_mask & BIT(s)))
215 216 217 218 219 220
			/* skip disabled slice */
			continue;

		for (ss = 0; ss < ss_max; ss++) {
			u32 n_disabled;

221
			if (!(sseu->subslice_mask & BIT(ss)))
222 223 224 225 226 227 228 229 230
				/* skip disabled subslice */
				continue;

			n_disabled = hweight8(eu_disable[s] >> (ss * eu_max));

			/*
			 * Record which subslices have 7 EUs.
			 */
			if (eu_max - n_disabled == 7)
231
				sseu->subslice_7eu[s] |= 1 << ss;
232

233
			sseu->eu_total += eu_max - n_disabled;
234 235 236 237 238 239 240 241
		}
	}

	/*
	 * BDW is expected to always have a uniform distribution of EU across
	 * subslices with the exception that any one EU in any one subslice may
	 * be fused off for die recovery.
	 */
242 243 244
	sseu->eu_per_subslice = sseu_subslice_total(sseu) ?
				DIV_ROUND_UP(sseu->eu_total,
					     sseu_subslice_total(sseu)) : 0;
245 246 247 248 249

	/*
	 * BDW supports slice power gating on devices with more than
	 * one slice.
	 */
250
	sseu->has_slice_pg = hweight8(sseu->slice_mask) > 1;
251 252
	sseu->has_subslice_pg = 0;
	sseu->has_eu_pg = 0;
253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280
}

/*
 * Determine various intel_device_info fields at runtime.
 *
 * Use it when either:
 *   - it's judged too laborious to fill n static structures with the limit
 *     when a simple if statement does the job,
 *   - run-time checks (eg read fuse/strap registers) are needed.
 *
 * This function needs to be called:
 *   - after the MMIO has been setup as we are reading registers,
 *   - after the PCH has been detected,
 *   - before the first usage of the fields it can tweak.
 */
void intel_device_info_runtime_init(struct drm_i915_private *dev_priv)
{
	struct intel_device_info *info = mkwrite_device_info(dev_priv);
	enum pipe pipe;

	/*
	 * Skylake and Broxton currently don't expose the topmost plane as its
	 * use is exclusive with the legacy cursor and we only want to expose
	 * one of those, not both. Until we can safely expose the topmost plane
	 * as a DRM_PLANE_TYPE_CURSOR with all the features exposed/supported,
	 * we don't expose the topmost plane at all to prevent ABI breakage
	 * down the line.
	 */
281 282 283 284
	if (IS_GEMINILAKE(dev_priv))
		for_each_pipe(dev_priv, pipe)
			info->num_sprites[pipe] = 3;
	else if (IS_BROXTON(dev_priv)) {
285 286 287
		info->num_sprites[PIPE_A] = 2;
		info->num_sprites[PIPE_B] = 2;
		info->num_sprites[PIPE_C] = 1;
288
	} else if (IS_VALLEYVIEW(dev_priv) || IS_CHERRYVIEW(dev_priv)) {
289 290
		for_each_pipe(dev_priv, pipe)
			info->num_sprites[pipe] = 2;
291
	} else if (INTEL_GEN(dev_priv) >= 5) {
292 293
		for_each_pipe(dev_priv, pipe)
			info->num_sprites[pipe] = 1;
294
	}
295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370

	if (i915.disable_display) {
		DRM_INFO("Display disabled (module parameter)\n");
		info->num_pipes = 0;
	} else if (info->num_pipes > 0 &&
		   (IS_GEN7(dev_priv) || IS_GEN8(dev_priv)) &&
		   HAS_PCH_SPLIT(dev_priv)) {
		u32 fuse_strap = I915_READ(FUSE_STRAP);
		u32 sfuse_strap = I915_READ(SFUSE_STRAP);

		/*
		 * SFUSE_STRAP is supposed to have a bit signalling the display
		 * is fused off. Unfortunately it seems that, at least in
		 * certain cases, fused off display means that PCH display
		 * reads don't land anywhere. In that case, we read 0s.
		 *
		 * On CPT/PPT, we can detect this case as SFUSE_STRAP_FUSE_LOCK
		 * should be set when taking over after the firmware.
		 */
		if (fuse_strap & ILK_INTERNAL_DISPLAY_DISABLE ||
		    sfuse_strap & SFUSE_STRAP_DISPLAY_DISABLED ||
		    (dev_priv->pch_type == PCH_CPT &&
		     !(sfuse_strap & SFUSE_STRAP_FUSE_LOCK))) {
			DRM_INFO("Display fused off, disabling\n");
			info->num_pipes = 0;
		} else if (fuse_strap & IVB_PIPE_C_DISABLE) {
			DRM_INFO("PipeC fused off\n");
			info->num_pipes -= 1;
		}
	} else if (info->num_pipes > 0 && IS_GEN9(dev_priv)) {
		u32 dfsm = I915_READ(SKL_DFSM);
		u8 disabled_mask = 0;
		bool invalid;
		int num_bits;

		if (dfsm & SKL_DFSM_PIPE_A_DISABLE)
			disabled_mask |= BIT(PIPE_A);
		if (dfsm & SKL_DFSM_PIPE_B_DISABLE)
			disabled_mask |= BIT(PIPE_B);
		if (dfsm & SKL_DFSM_PIPE_C_DISABLE)
			disabled_mask |= BIT(PIPE_C);

		num_bits = hweight8(disabled_mask);

		switch (disabled_mask) {
		case BIT(PIPE_A):
		case BIT(PIPE_B):
		case BIT(PIPE_A) | BIT(PIPE_B):
		case BIT(PIPE_A) | BIT(PIPE_C):
			invalid = true;
			break;
		default:
			invalid = false;
		}

		if (num_bits > info->num_pipes || invalid)
			DRM_ERROR("invalid pipe fuse configuration: 0x%x\n",
				  disabled_mask);
		else
			info->num_pipes -= num_bits;
	}

	/* Initialize slice/subslice/EU info */
	if (IS_CHERRYVIEW(dev_priv))
		cherryview_sseu_info_init(dev_priv);
	else if (IS_BROADWELL(dev_priv))
		broadwell_sseu_info_init(dev_priv);
	else if (INTEL_INFO(dev_priv)->gen >= 9)
		gen9_sseu_info_init(dev_priv);

	info->has_snoop = !info->has_llc;

	/* Snooping is broken on BXT A stepping. */
	if (IS_BXT_REVID(dev_priv, 0, BXT_REVID_A1))
		info->has_snoop = false;

371
	DRM_DEBUG_DRIVER("slice mask: %04x\n", info->sseu.slice_mask);
372
	DRM_DEBUG_DRIVER("slice total: %u\n", hweight8(info->sseu.slice_mask));
373 374
	DRM_DEBUG_DRIVER("subslice total: %u\n",
			 sseu_subslice_total(&info->sseu));
375
	DRM_DEBUG_DRIVER("subslice mask %04x\n", info->sseu.subslice_mask);
376
	DRM_DEBUG_DRIVER("subslice per slice: %u\n",
377
			 hweight8(info->sseu.subslice_mask));
378 379
	DRM_DEBUG_DRIVER("EU total: %u\n", info->sseu.eu_total);
	DRM_DEBUG_DRIVER("EU per subslice: %u\n", info->sseu.eu_per_subslice);
380
	DRM_DEBUG_DRIVER("has slice power gating: %s\n",
381
			 info->sseu.has_slice_pg ? "y" : "n");
382
	DRM_DEBUG_DRIVER("has subslice power gating: %s\n",
383
			 info->sseu.has_subslice_pg ? "y" : "n");
384
	DRM_DEBUG_DRIVER("has EU power gating: %s\n",
385
			 info->sseu.has_eu_pg ? "y" : "n");
386
}