adreno_gpu.c 13.1 KB
Newer Older
R
Rob Clark 已提交
1 2 3 4
/*
 * Copyright (C) 2013 Red Hat
 * Author: Rob Clark <robdclark@gmail.com>
 *
5 6
 * Copyright (c) 2014 The Linux Foundation. All rights reserved.
 *
R
Rob Clark 已提交
7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 as published by
 * the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#include "adreno_gpu.h"
#include "msm_gem.h"
22
#include "msm_mmu.h"
R
Rob Clark 已提交
23 24

#define RB_SIZE    SZ_32K
25
#define RB_BLKSIZE 32
R
Rob Clark 已提交
26 27 28 29 30 31 32 33 34 35

int adreno_get_param(struct msm_gpu *gpu, uint32_t param, uint64_t *value)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);

	switch (param) {
	case MSM_PARAM_GPU_ID:
		*value = adreno_gpu->info->revn;
		return 0;
	case MSM_PARAM_GMEM_SIZE:
R
Rob Clark 已提交
36
		*value = adreno_gpu->gmem;
R
Rob Clark 已提交
37
		return 0;
J
Jordan Crouse 已提交
38 39 40
	case MSM_PARAM_GMEM_BASE:
		*value = 0x100000;
		return 0;
R
Rob Clark 已提交
41 42 43 44 45 46
	case MSM_PARAM_CHIP_ID:
		*value = adreno_gpu->rev.patchid |
				(adreno_gpu->rev.minor << 8) |
				(adreno_gpu->rev.major << 16) |
				(adreno_gpu->rev.core << 24);
		return 0;
47 48 49
	case MSM_PARAM_MAX_FREQ:
		*value = adreno_gpu->base.fast_rate;
		return 0;
R
Rob Clark 已提交
50
	case MSM_PARAM_TIMESTAMP:
51 52 53 54 55 56 57 58 59
		if (adreno_gpu->funcs->get_timestamp) {
			int ret;

			pm_runtime_get_sync(&gpu->pdev->dev);
			ret = adreno_gpu->funcs->get_timestamp(gpu, value);
			pm_runtime_put_autosuspend(&gpu->pdev->dev);

			return ret;
		}
R
Rob Clark 已提交
60
		return -EINVAL;
R
Rob Clark 已提交
61 62 63 64 65 66
	default:
		DBG("%s: invalid param: %u", gpu->name, param);
		return -EINVAL;
	}
}

67 68
const struct firmware *
adreno_request_fw(struct adreno_gpu *adreno_gpu, const char *fwname)
69 70
{
	struct drm_device *drm = adreno_gpu->base.dev;
71
	const struct firmware *fw = NULL;
72
	char newname[strlen("qcom/") + strlen(fwname) + 1];
73 74
	int ret;

75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133
	sprintf(newname, "qcom/%s", fwname);

	/*
	 * Try first to load from qcom/$fwfile using a direct load (to avoid
	 * a potential timeout waiting for usermode helper)
	 */
	if ((adreno_gpu->fwloc == FW_LOCATION_UNKNOWN) ||
	    (adreno_gpu->fwloc == FW_LOCATION_NEW)) {

		ret = request_firmware_direct(&fw, newname, drm->dev);
		if (!ret) {
			dev_info(drm->dev, "loaded %s from new location\n",
				newname);
			adreno_gpu->fwloc = FW_LOCATION_NEW;
			return fw;
		} else if (adreno_gpu->fwloc != FW_LOCATION_UNKNOWN) {
			dev_err(drm->dev, "failed to load %s: %d\n",
				newname, ret);
			return ERR_PTR(ret);
		}
	}

	/*
	 * Then try the legacy location without qcom/ prefix
	 */
	if ((adreno_gpu->fwloc == FW_LOCATION_UNKNOWN) ||
	    (adreno_gpu->fwloc == FW_LOCATION_LEGACY)) {

		ret = request_firmware_direct(&fw, fwname, drm->dev);
		if (!ret) {
			dev_info(drm->dev, "loaded %s from legacy location\n",
				newname);
			adreno_gpu->fwloc = FW_LOCATION_LEGACY;
			return fw;
		} else if (adreno_gpu->fwloc != FW_LOCATION_UNKNOWN) {
			dev_err(drm->dev, "failed to load %s: %d\n",
				fwname, ret);
			return ERR_PTR(ret);
		}
	}

	/*
	 * Finally fall back to request_firmware() for cases where the
	 * usermode helper is needed (I think mainly android)
	 */
	if ((adreno_gpu->fwloc == FW_LOCATION_UNKNOWN) ||
	    (adreno_gpu->fwloc == FW_LOCATION_HELPER)) {

		ret = request_firmware(&fw, newname, drm->dev);
		if (!ret) {
			dev_info(drm->dev, "loaded %s with helper\n",
				newname);
			adreno_gpu->fwloc = FW_LOCATION_HELPER;
			return fw;
		} else if (adreno_gpu->fwloc != FW_LOCATION_UNKNOWN) {
			dev_err(drm->dev, "failed to load %s: %d\n",
				newname, ret);
			return ERR_PTR(ret);
		}
134 135
	}

136 137
	dev_err(drm->dev, "failed to load %s\n", fwname);
	return ERR_PTR(-ENOENT);
138 139 140 141 142 143
}

static int adreno_load_fw(struct adreno_gpu *adreno_gpu)
{
	const struct firmware *fw;

144 145 146
	if (adreno_gpu->pm4)
		return 0;

147 148 149 150
	fw = adreno_request_fw(adreno_gpu, adreno_gpu->info->pm4fw);
	if (IS_ERR(fw))
		return PTR_ERR(fw);
	adreno_gpu->pm4 = fw;
151

152 153
	fw = adreno_request_fw(adreno_gpu, adreno_gpu->info->pfpfw);
	if (IS_ERR(fw)) {
154 155
		release_firmware(adreno_gpu->pm4);
		adreno_gpu->pm4 = NULL;
156
		return PTR_ERR(fw);
157
	}
158
	adreno_gpu->pfp = fw;
159 160 161 162

	return 0;
}

R
Rob Clark 已提交
163 164 165
int adreno_hw_init(struct msm_gpu *gpu)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
R
Rob Clark 已提交
166
	int ret;
R
Rob Clark 已提交
167 168 169

	DBG("%s", gpu->name);

170 171 172 173
	ret = adreno_load_fw(adreno_gpu);
	if (ret)
		return ret;

174
	ret = msm_gem_get_iova(gpu->rb->bo, gpu->aspace, &gpu->rb_iova);
R
Rob Clark 已提交
175 176 177 178 179 180
	if (ret) {
		gpu->rb_iova = 0;
		dev_err(gpu->dev->dev, "could not map ringbuffer: %d\n", ret);
		return ret;
	}

181 182 183 184
	/* reset ringbuffer: */
	gpu->rb->cur = gpu->rb->start;

	/* reset completed fence seqno: */
J
Jordan Crouse 已提交
185 186
	gpu->memptrs->fence = gpu->fctx->completed_fence;
	gpu->memptrs->rptr  = 0;
187

R
Rob Clark 已提交
188
	/* Setup REG_CP_RB_CNTL: */
189
	adreno_gpu_write(adreno_gpu, REG_ADRENO_CP_RB_CNTL,
R
Rob Clark 已提交
190 191
			/* size is log2(quad-words): */
			AXXX_CP_RB_CNTL_BUFSZ(ilog2(gpu->rb->size / 8)) |
192 193
			AXXX_CP_RB_CNTL_BLKSZ(ilog2(RB_BLKSIZE / 8)) |
			(adreno_is_a430(adreno_gpu) ? AXXX_CP_RB_CNTL_NO_UPDATE : 0));
R
Rob Clark 已提交
194 195

	/* Setup ringbuffer address: */
J
Jordan Crouse 已提交
196 197
	adreno_gpu_write64(adreno_gpu, REG_ADRENO_CP_RB_BASE,
		REG_ADRENO_CP_RB_BASE_HI, gpu->rb_iova);
R
Rob Clark 已提交
198

J
Jordan Crouse 已提交
199 200
	if (!adreno_is_a430(adreno_gpu)) {
		adreno_gpu_write64(adreno_gpu, REG_ADRENO_CP_RB_RPTR_ADDR,
J
Jordan Crouse 已提交
201
			REG_ADRENO_CP_RB_RPTR_ADDR_HI, rbmemptr(gpu, rptr));
J
Jordan Crouse 已提交
202
	}
R
Rob Clark 已提交
203 204 205 206 207 208 209 210 211

	return 0;
}

static uint32_t get_wptr(struct msm_ringbuffer *ring)
{
	return ring->cur - ring->start;
}

212 213 214
/* Use this helper to read rptr, since a430 doesn't update rptr in memory */
static uint32_t get_rptr(struct adreno_gpu *adreno_gpu)
{
J
Jordan Crouse 已提交
215 216
	struct msm_gpu *gpu = &adreno_gpu->base;

217
	if (adreno_is_a430(adreno_gpu))
J
Jordan Crouse 已提交
218
		return gpu->memptrs->rptr = adreno_gpu_read(
219 220
			adreno_gpu, REG_ADRENO_CP_RB_RPTR);
	else
J
Jordan Crouse 已提交
221
		return gpu->memptrs->rptr;
R
Rob Clark 已提交
222 223
}

224 225 226 227 228
void adreno_recover(struct msm_gpu *gpu)
{
	struct drm_device *dev = gpu->dev;
	int ret;

R
Rob Clark 已提交
229 230 231
	// XXX pm-runtime??  we *need* the device to be off after this
	// so maybe continuing to call ->pm_suspend/resume() is better?

232 233
	gpu->funcs->pm_suspend(gpu);
	gpu->funcs->pm_resume(gpu);
234

R
Rob Clark 已提交
235
	ret = msm_gpu_hw_init(gpu);
236 237 238 239 240 241
	if (ret) {
		dev_err(dev->dev, "gpu hw init failed: %d\n", ret);
		/* hmm, oh well? */
	}
}

242
void adreno_submit(struct msm_gpu *gpu, struct msm_gem_submit *submit,
R
Rob Clark 已提交
243 244 245 246 247
		struct msm_file_private *ctx)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
	struct msm_drm_private *priv = gpu->dev->dev_private;
	struct msm_ringbuffer *ring = gpu->rb;
248
	unsigned i;
R
Rob Clark 已提交
249 250 251 252 253 254 255 256 257 258 259

	for (i = 0; i < submit->nr_cmds; i++) {
		switch (submit->cmd[i].type) {
		case MSM_SUBMIT_CMD_IB_TARGET_BUF:
			/* ignore IB-targets */
			break;
		case MSM_SUBMIT_CMD_CTX_RESTORE_BUF:
			/* ignore if there has not been a ctx switch: */
			if (priv->lastctx == ctx)
				break;
		case MSM_SUBMIT_CMD_BUF:
260 261
			OUT_PKT3(ring, adreno_is_a430(adreno_gpu) ?
				CP_INDIRECT_BUFFER_PFE : CP_INDIRECT_BUFFER_PFD, 2);
R
Rob Clark 已提交
262 263
			OUT_RING(ring, submit->cmd[i].iova);
			OUT_RING(ring, submit->cmd[i].size);
264
			OUT_PKT2(ring);
R
Rob Clark 已提交
265 266 267 268 269
			break;
		}
	}

	OUT_PKT0(ring, REG_AXXX_CP_SCRATCH_REG2, 1);
R
Rob Clark 已提交
270
	OUT_RING(ring, submit->fence->seqno);
R
Rob Clark 已提交
271

272
	if (adreno_is_a3xx(adreno_gpu) || adreno_is_a4xx(adreno_gpu)) {
R
Rob Clark 已提交
273 274 275 276 277 278 279 280 281 282 283 284 285
		/* Flush HLSQ lazy updates to make sure there is nothing
		 * pending for indirect loads after the timestamp has
		 * passed:
		 */
		OUT_PKT3(ring, CP_EVENT_WRITE, 1);
		OUT_RING(ring, HLSQ_FLUSH);

		OUT_PKT3(ring, CP_WAIT_FOR_IDLE, 1);
		OUT_RING(ring, 0x00000000);
	}

	OUT_PKT3(ring, CP_EVENT_WRITE, 3);
	OUT_RING(ring, CACHE_FLUSH_TS);
J
Jordan Crouse 已提交
286
	OUT_RING(ring, rbmemptr(gpu, fence));
R
Rob Clark 已提交
287
	OUT_RING(ring, submit->fence->seqno);
R
Rob Clark 已提交
288 289 290 291 292

	/* we could maybe be clever and only CP_COND_EXEC the interrupt: */
	OUT_PKT3(ring, CP_INTERRUPT, 1);
	OUT_RING(ring, 0x80000000);

293 294 295 296 297 298 299 300 301 302 303
	/* Workaround for missing irq issue on 8x16/a306.  Unsure if the
	 * root cause is a platform issue or some a306 quirk, but this
	 * keeps things humming along:
	 */
	if (adreno_is_a306(adreno_gpu)) {
		OUT_PKT3(ring, CP_WAIT_FOR_IDLE, 1);
		OUT_RING(ring, 0x00000000);
		OUT_PKT3(ring, CP_INTERRUPT, 1);
		OUT_RING(ring, 0x80000000);
	}

R
Rob Clark 已提交
304 305 306 307 308 309 310 311 312 313 314 315 316 317
#if 0
	if (adreno_is_a3xx(adreno_gpu)) {
		/* Dummy set-constant to trigger context rollover */
		OUT_PKT3(ring, CP_SET_CONSTANT, 2);
		OUT_RING(ring, CP_REG(REG_A3XX_HLSQ_CL_KERNEL_GROUP_X_REG));
		OUT_RING(ring, 0x00000000);
	}
#endif

	gpu->funcs->flush(gpu);
}

void adreno_flush(struct msm_gpu *gpu)
{
318
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
319 320 321 322 323 324 325 326
	uint32_t wptr;

	/*
	 * Mask wptr value that we calculate to fit in the HW range. This is
	 * to account for the possibility that the last command fit exactly into
	 * the ringbuffer and rb->next hasn't wrapped to zero yet
	 */
	wptr = get_wptr(gpu->rb) & ((gpu->rb->size / 4) - 1);
R
Rob Clark 已提交
327 328 329 330

	/* ensure writes to ringbuffer have hit system memory: */
	mb();

331
	adreno_gpu_write(adreno_gpu, REG_ADRENO_CP_RB_WPTR, wptr);
R
Rob Clark 已提交
332 333
}

334
bool adreno_idle(struct msm_gpu *gpu)
R
Rob Clark 已提交
335 336
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
R
Rob Clark 已提交
337
	uint32_t wptr = get_wptr(gpu->rb);
R
Rob Clark 已提交
338

R
Rob Clark 已提交
339
	/* wait for CP to drain ringbuffer: */
340 341
	if (!spin_until(get_rptr(adreno_gpu) == wptr))
		return true;
R
Rob Clark 已提交
342 343

	/* TODO maybe we need to reset GPU here to recover from hang? */
344 345
	DRM_ERROR("%s: timeout waiting to drain ringbuffer!\n", gpu->name);
	return false;
R
Rob Clark 已提交
346 347 348 349 350 351
}

#ifdef CONFIG_DEBUG_FS
void adreno_show(struct msm_gpu *gpu, struct seq_file *m)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
352
	int i;
R
Rob Clark 已提交
353 354 355 356 357 358

	seq_printf(m, "revision: %d (%d.%d.%d.%d)\n",
			adreno_gpu->info->revn, adreno_gpu->rev.core,
			adreno_gpu->rev.major, adreno_gpu->rev.minor,
			adreno_gpu->rev.patchid);

J
Jordan Crouse 已提交
359
	seq_printf(m, "fence:    %d/%d\n", gpu->memptrs->fence,
R
Rob Clark 已提交
360
			gpu->fctx->last_fence);
361
	seq_printf(m, "rptr:     %d\n", get_rptr(adreno_gpu));
R
Rob Clark 已提交
362
	seq_printf(m, "rb wptr:  %d\n", get_wptr(gpu->rb));
363 364 365 366 367 368 369 370 371 372 373 374 375

	/* dump these out in a form that can be parsed by demsm: */
	seq_printf(m, "IO:region %s 00000000 00020000\n", gpu->name);
	for (i = 0; adreno_gpu->registers[i] != ~0; i += 2) {
		uint32_t start = adreno_gpu->registers[i];
		uint32_t end   = adreno_gpu->registers[i+1];
		uint32_t addr;

		for (addr = start; addr <= end; addr++) {
			uint32_t val = gpu_read(gpu, addr);
			seq_printf(m, "IO:R %08x %08x\n", addr<<2, val);
		}
	}
R
Rob Clark 已提交
376 377 378
}
#endif

379 380 381 382 383 384 385
/* Dump common gpu status and scratch registers on any hang, to make
 * the hangcheck logs more useful.  The scratch registers seem always
 * safe to read when GPU has hung (unlike some other regs, depending
 * on how the GPU hung), and they are useful to match up to cmdstream
 * dumps when debugging hangs:
 */
void adreno_dump_info(struct msm_gpu *gpu)
R
Rob Clark 已提交
386 387 388 389 390 391 392 393
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);

	printk("revision: %d (%d.%d.%d.%d)\n",
			adreno_gpu->info->revn, adreno_gpu->rev.core,
			adreno_gpu->rev.major, adreno_gpu->rev.minor,
			adreno_gpu->rev.patchid);

J
Jordan Crouse 已提交
394
	printk("fence:    %d/%d\n", gpu->memptrs->fence,
R
Rob Clark 已提交
395
			gpu->fctx->last_fence);
396
	printk("rptr:     %d\n", get_rptr(adreno_gpu));
R
Rob Clark 已提交
397
	printk("rb wptr:  %d\n", get_wptr(gpu->rb));
398 399 400 401 402 403 404 405
}

/* would be nice to not have to duplicate the _show() stuff with printk(): */
void adreno_dump(struct msm_gpu *gpu)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
	int i;

406 407 408 409 410 411 412 413 414 415 416 417
	/* dump these out in a form that can be parsed by demsm: */
	printk("IO:region %s 00000000 00020000\n", gpu->name);
	for (i = 0; adreno_gpu->registers[i] != ~0; i += 2) {
		uint32_t start = adreno_gpu->registers[i];
		uint32_t end   = adreno_gpu->registers[i+1];
		uint32_t addr;

		for (addr = start; addr <= end; addr++) {
			uint32_t val = gpu_read(gpu, addr);
			printk("IO:R %08x %08x\n", addr<<2, val);
		}
	}
R
Rob Clark 已提交
418 419
}

R
Rob Clark 已提交
420
static uint32_t ring_freewords(struct msm_gpu *gpu)
R
Rob Clark 已提交
421 422
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
R
Rob Clark 已提交
423 424
	uint32_t size = gpu->rb->size / 4;
	uint32_t wptr = get_wptr(gpu->rb);
425
	uint32_t rptr = get_rptr(adreno_gpu);
R
Rob Clark 已提交
426 427 428 429 430 431 432
	return (rptr + (size - 1) - wptr) % size;
}

void adreno_wait_ring(struct msm_gpu *gpu, uint32_t ndwords)
{
	if (spin_until(ring_freewords(gpu) >= ndwords))
		DRM_ERROR("%s: timeout waiting for ringbuffer space\n", gpu->name);
R
Rob Clark 已提交
433 434 435
}

int adreno_gpu_init(struct drm_device *drm, struct platform_device *pdev,
436
		struct adreno_gpu *adreno_gpu, const struct adreno_gpu_funcs *funcs)
R
Rob Clark 已提交
437
{
438
	struct adreno_platform_config *config = pdev->dev.platform_data;
439
	struct msm_gpu_config adreno_gpu_config  = { 0 };
440
	struct msm_gpu *gpu = &adreno_gpu->base;
R
Rob Clark 已提交
441

442 443 444 445 446 447 448 449
	adreno_gpu->funcs = funcs;
	adreno_gpu->info = adreno_info(config->rev);
	adreno_gpu->gmem = adreno_gpu->info->gmem;
	adreno_gpu->revn = adreno_gpu->info->revn;
	adreno_gpu->rev = config->rev;

	gpu->fast_rate = config->fast_rate;
	gpu->bus_freq  = config->bus_freq;
450
#ifdef DOWNSTREAM_CONFIG_MSM_BUS_SCALING
451 452 453
	gpu->bus_scale_table = config->bus_scale_table;
#endif

454 455
	DBG("fast_rate=%u, slow_rate=27000000, bus_freq=%u",
			gpu->fast_rate, gpu->bus_freq);
R
Rob Clark 已提交
456

457 458 459 460 461 462 463 464
	adreno_gpu_config.ioname = "kgsl_3d0_reg_memory";
	adreno_gpu_config.irqname = "kgsl_3d0_irq";

	adreno_gpu_config.va_start = SZ_16M;
	adreno_gpu_config.va_end = 0xffffffff;

	adreno_gpu_config.ringsz = RB_SIZE;

465 466 467 468
	pm_runtime_set_autosuspend_delay(&pdev->dev, DRM_MSM_INACTIVE_PERIOD);
	pm_runtime_use_autosuspend(&pdev->dev);
	pm_runtime_enable(&pdev->dev);

J
Jordan Crouse 已提交
469
	return msm_gpu_init(drm, pdev, &adreno_gpu->base, &funcs->base,
470
			adreno_gpu->info->name, &adreno_gpu_config);
R
Rob Clark 已提交
471 472
}

473
void adreno_gpu_cleanup(struct adreno_gpu *adreno_gpu)
R
Rob Clark 已提交
474
{
475 476
	release_firmware(adreno_gpu->pm4);
	release_firmware(adreno_gpu->pfp);
477

J
Jordan Crouse 已提交
478
	msm_gpu_cleanup(&adreno_gpu->base);
R
Rob Clark 已提交
479
}