/*
 * Copyright (C) 2013 Red Hat
 * Author: Rob Clark <robdclark@gmail.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 as published by
 * the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef __MSM_GPU_H__
#define __MSM_GPU_H__

#include <linux/clk.h>
#include <linux/regulator/consumer.h>

#include "msm_drv.h"
#include "msm_fence.h"
#include "msm_ringbuffer.h"

struct msm_gem_submit;
struct msm_gpu_perfcntr;
/*
 * Configuration passed to msm_gpu_init() through its 'config' argument.
 * How each field is consumed is decided by msm_gpu_init(), which is not
 * defined in this header; the per-field notes below are inferred from the
 * field names only and should be confirmed against that function.
 */
struct msm_gpu_config {
	const char *ioname;	/* presumably the name of the register (MMIO) resource - confirm */
	const char *irqname;	/* presumably the name of the interrupt resource - confirm */
	uint64_t va_start;	/* presumably the start of the GPU virtual address range - confirm */
	uint64_t va_end;	/* presumably the end of the GPU virtual address range - confirm */
	unsigned int ringsz;	/* presumably the ringbuffer size; units not visible here - confirm */
};

/* So far, with hardware that I've seen to date, we can have:
 *  + zero, one, or two z180 2d cores
 *  + a3xx or a2xx 3d core, which share a common CP (the firmware
 *    for the CP seems to implement some different PM4 packet types
 *    but the basics of cmdstream submission are the same)
 *
 * Which means that the eventual complete "class" hierarchy, once
 * support for all past and present hw is in place, becomes:
 *  + msm_gpu
 *    + adreno_gpu
 *      + a3xx_gpu
 *      + a2xx_gpu
 *    + z180_gpu
 */
struct msm_gpu_funcs {
	int (*get_param)(struct msm_gpu *gpu, uint32_t param, uint64_t *value);
	int (*hw_init)(struct msm_gpu *gpu);
	int (*pm_suspend)(struct msm_gpu *gpu);
	int (*pm_resume)(struct msm_gpu *gpu);
58
	void (*submit)(struct msm_gpu *gpu, struct msm_gem_submit *submit,
R
Rob Clark 已提交
59 60 61
			struct msm_file_private *ctx);
	void (*flush)(struct msm_gpu *gpu);
	irqreturn_t (*irq)(struct msm_gpu *irq);
62
	void (*recover)(struct msm_gpu *gpu);
R
Rob Clark 已提交
63 64 65 66 67 68 69
	void (*destroy)(struct msm_gpu *gpu);
#ifdef CONFIG_DEBUG_FS
	/* show GPU status in debugfs: */
	void (*show)(struct msm_gpu *gpu, struct seq_file *m);
#endif
};

/*
 * rbmemptr() - address of 'member' inside the memptrs block.
 *
 * Evaluates to gpu->memptrs_iova plus the offset of 'member' within
 * struct msm_rbmemptrs.  'gpu' must point to an object that has a
 * memptrs_iova field (struct msm_gpu does).
 */
#define rbmemptr(gpu, member)  \
	((gpu)->memptrs_iova + offsetof(struct msm_rbmemptrs, member))

/*
 * Layout of the memptrs block.  Both fields are volatile-qualified, so
 * every access from C is a real memory access.
 * NOTE(review): presumably written by the GPU and read by the CPU - confirm.
 */
struct msm_rbmemptrs {
	volatile uint32_t rptr;		/* presumably the ring read pointer - confirm */
	volatile uint32_t fence;	/* compared with fctx->last_fence in msm_gpu_active() */
};

struct msm_gpu {
	const char *name;
	struct drm_device *dev;
R
Rob Clark 已提交
81
	struct platform_device *pdev;
R
Rob Clark 已提交
82 83
	const struct msm_gpu_funcs *funcs;

R
Rob Clark 已提交
84 85 86 87 88 89 90 91 92 93 94 95
	/* performance counters (hw & sw): */
	spinlock_t perf_lock;
	bool perfcntr_active;
	struct {
		bool active;
		ktime_t time;
	} last_sample;
	uint32_t totaltime, activetime;    /* sw counters */
	uint32_t last_cntrs[5];            /* hw counters */
	const struct msm_gpu_perfcntr *perfcntrs;
	uint32_t num_perfcntrs;

R
Rob Clark 已提交
96
	/* ringbuffer: */
R
Rob Clark 已提交
97
	struct msm_ringbuffer *rb;
R
Rob Clark 已提交
98
	uint64_t rb_iova;
R
Rob Clark 已提交
99 100 101 102

	/* list of GEM active objects: */
	struct list_head active_list;

R
Rob Clark 已提交
103 104
	/* fencing: */
	struct msm_fence_context *fctx;
105

R
Rob Clark 已提交
106 107
	/* does gpu need hw_init? */
	bool needs_hw_init;
108

R
Rob Clark 已提交
109 110 111 112 113 114
	/* worker for handling active-list retiring: */
	struct work_struct retire_work;

	void __iomem *mmio;
	int irq;

115
	struct msm_gem_address_space *aspace;
R
Rob Clark 已提交
116 117 118

	/* Power Control: */
	struct regulator *gpu_reg, *gpu_cx;
119 120 121
	struct clk **grp_clks;
	int nr_clocks;
	struct clk *ebi1_clk, *core_clk, *rbbmtimer_clk;
122
	uint32_t fast_rate, bus_freq;
R
Rob Clark 已提交
123

124
#ifdef DOWNSTREAM_CONFIG_MSM_BUS_SCALING
R
Rob Clark 已提交
125
	struct msm_bus_scale_pdata *bus_scale_table;
R
Rob Clark 已提交
126
	uint32_t bsc;
R
Rob Clark 已提交
127
#endif
128

129 130 131
	/* Hang and Inactivity Detection:
	 */
#define DRM_MSM_INACTIVE_PERIOD   66 /* in ms (roughly four frames) */
R
Rob Clark 已提交
132

133 134 135 136 137
#define DRM_MSM_HANGCHECK_PERIOD 500 /* in ms */
#define DRM_MSM_HANGCHECK_JIFFIES msecs_to_jiffies(DRM_MSM_HANGCHECK_PERIOD)
	struct timer_list hangcheck_timer;
	uint32_t hangcheck_fence;
	struct work_struct recover_work;
138 139

	struct list_head submit_list;
J
Jordan Crouse 已提交
140 141 142 143 144 145

	struct msm_rbmemptrs *memptrs;
	struct drm_gem_object *memptrs_bo;
	uint64_t memptrs_iova;


R
Rob Clark 已提交
146 147
};

static inline bool msm_gpu_active(struct msm_gpu *gpu)
{
J
Jordan Crouse 已提交
150
	return gpu->fctx->last_fence > gpu->memptrs->fence;
151 152
}

/* Perf-Counters:
 * Describes one hardware performance counter.  The select_reg and
 * select_val fields exist only for the benefit of the child class that
 * actually enables the counter; the msm_gpu base class handles sampling
 * and displaying the counters.
 */

struct msm_gpu_perfcntr {
	uint32_t select_reg;	/* used by the child class when enabling the counter */
	uint32_t sample_reg;	/* presumably the register the counter value is read from - confirm */
	uint32_t select_val;	/* used by the child class when enabling the counter */
	const char *name;	/* counter name */
};

/*
 * A reference-counted submit queue.  References are dropped with
 * msm_submitqueue_put(), which passes 'ref' to kref_put() with
 * msm_submitqueue_destroy as the release callback.
 */
struct msm_gpu_submitqueue {
	int id;			/* queue identifier */
	u32 flags;
	u32 prio;		/* presumably the queue priority - confirm */
	int faults;		/* presumably a count of faults attributed to this queue - confirm */
	struct list_head node;	/* list linkage; the owning list is not visible in this header */
	struct kref ref;	/* reference count, see msm_submitqueue_put() */
};

/*
 * gpu_write() - write a 32-bit value to a GPU register.
 * @gpu:  GPU whose register window (gpu->mmio) is written
 * @reg:  register index in dwords; shifted left by two to get the byte
 *        offset from gpu->mmio
 * @data: value to write
 */
static inline void gpu_write(struct msm_gpu *gpu, u32 reg, u32 data)
{
	void __iomem *addr = gpu->mmio + (reg << 2);

	msm_writel(data, addr);
}

/*
 * gpu_read() - read a 32-bit GPU register.
 * @gpu: GPU whose register window (gpu->mmio) is read
 * @reg: register index in dwords; shifted left by two to get the byte
 *       offset from gpu->mmio
 *
 * Returns the value obtained from msm_readl() at that address.
 */
static inline u32 gpu_read(struct msm_gpu *gpu, u32 reg)
{
	void __iomem *addr = gpu->mmio + (reg << 2);

	return msm_readl(addr);
}

/*
 * gpu_rmw() - read-modify-write a GPU register.
 * @gpu:  GPU to operate on
 * @reg:  register index, as taken by gpu_read()/gpu_write()
 * @mask: bits to clear from the value read back
 * @or:   bits OR-ed into the result before it is written
 *
 * Note that @or is applied as given; it is not restricted to @mask.
 */
static inline void gpu_rmw(struct msm_gpu *gpu, u32 reg, u32 mask, u32 or)
{
	const uint32_t kept = gpu_read(gpu, reg) & ~mask;

	gpu_write(gpu, reg, kept | or);
}

/*
 * gpu_read64() - read a 64-bit quantity split across two 32-bit registers.
 * @gpu: GPU to read from
 * @lo:  dword index of the register holding bits 31:0
 * @hi:  dword index of the register holding bits 63:32
 *
 * Returns the two halves combined into one u64.
 */
static inline u64 gpu_read64(struct msm_gpu *gpu, u32 lo, u32 hi)
{
	u64 low, high;

	/*
	 * A single readq is deliberately not used: many LO registers are not
	 * quad-word aligned, and the hardware designers tend to place
	 * registers wherever they fit (especially in spins), so the odds of
	 * getting burned grow the longer a GPU family lives.  Validity
	 * checks could cover that, but a readq() is not worth the trouble.
	 */

	/*
	 * Order matters: for some lo/hi pairs (perfcounters, for example)
	 * the hi value is latched when lo is read, so lo must be read first.
	 */
	low = (u64) msm_readl(gpu->mmio + (lo << 2));
	high = (u64) msm_readl(gpu->mmio + (hi << 2));

	return low | (high << 32);
}

/*
 * gpu_write64() - write a 64-bit value to a lo/hi pair of 32-bit registers.
 * @gpu: GPU to write to
 * @lo:  dword index of the register receiving bits 31:0
 * @hi:  dword index of the register receiving bits 63:32
 * @val: value to write
 *
 * The low half is written first, then the high half.  Two 32-bit writes are
 * used instead of a writeq for the same reasons gpu_read64() avoids readq.
 */
static inline void gpu_write64(struct msm_gpu *gpu, u32 lo, u32 hi, u64 val)
{
	void __iomem *lo_addr = gpu->mmio + (lo << 2);
	void __iomem *hi_addr = gpu->mmio + (hi << 2);

	msm_writel(lower_32_bits(val), lo_addr);
	msm_writel(upper_32_bits(val), hi_addr);
}

int msm_gpu_pm_suspend(struct msm_gpu *gpu);
int msm_gpu_pm_resume(struct msm_gpu *gpu);

R
Rob Clark 已提交
227 228
int msm_gpu_hw_init(struct msm_gpu *gpu);

R
Rob Clark 已提交
229 230 231 232 233
void msm_gpu_perfcntr_start(struct msm_gpu *gpu);
void msm_gpu_perfcntr_stop(struct msm_gpu *gpu);
int msm_gpu_perfcntr_sample(struct msm_gpu *gpu, uint32_t *activetime,
		uint32_t *totaltime, uint32_t ncntrs, uint32_t *cntrs);

R
Rob Clark 已提交
234
void msm_gpu_retire(struct msm_gpu *gpu);
235
void msm_gpu_submit(struct msm_gpu *gpu, struct msm_gem_submit *submit,
R
Rob Clark 已提交
236 237 238 239
		struct msm_file_private *ctx);

int msm_gpu_init(struct drm_device *drm, struct platform_device *pdev,
		struct msm_gpu *gpu, const struct msm_gpu_funcs *funcs,
240 241
		const char *name, struct msm_gpu_config *config);

R
Rob Clark 已提交
242 243
void msm_gpu_cleanup(struct msm_gpu *gpu);

244
struct msm_gpu *adreno_load_gpu(struct drm_device *dev);
245 246
void __init adreno_register(void);
void __exit adreno_unregister(void);
/*
 * msm_submitqueue_put() - drop a reference on a submit queue.
 * @queue: queue to release; NULL is accepted and ignored
 *
 * Hands the queue's kref to kref_put() with msm_submitqueue_destroy as the
 * release callback.
 */
static inline void msm_submitqueue_put(struct msm_gpu_submitqueue *queue)
{
	if (!queue)
		return;

	kref_put(&queue->ref, msm_submitqueue_destroy);
}

#endif /* __MSM_GPU_H__ */