radeon_cp.c 47.2 KB
Newer Older
1 2
/* radeon_cp.c -- CP support for Radeon -*- linux-c -*- */
/*
L
Linus Torvalds 已提交
3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34
 * Copyright 2000 Precision Insight, Inc., Cedar Park, Texas.
 * Copyright 2000 VA Linux Systems, Inc., Fremont, California.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 *
 * Authors:
 *    Kevin E. Martin <martin@valinux.com>
 *    Gareth Hughes <gareth@valinux.com>
 */

#include "drmP.h"
#include "drm.h"
#include "radeon_drm.h"
#include "radeon_drv.h"
D
Dave Airlie 已提交
35
#include "r300_reg.h"
L
Linus Torvalds 已提交
36

37 38
#include "radeon_microcode.h"

L
Linus Torvalds 已提交
39 40
#define RADEON_FIFO_DEBUG	0

41
static int radeon_do_cleanup_cp(struct drm_device * dev);
L
Linus Torvalds 已提交
42

D
Dave Airlie 已提交
43 44 45 46 47 48 49 50 51
static u32 RADEON_READ_MCIND(drm_radeon_private_t *dev_priv, int addr)
{
	u32 ret;
	RADEON_WRITE(R520_MC_IND_INDEX, 0x7f0000 | (addr & 0xff));
	ret = RADEON_READ(R520_MC_IND_DATA);
	RADEON_WRITE(R520_MC_IND_INDEX, 0);
	return ret;
}

52 53 54 55 56 57
static u32 RS690_READ_MCIND(drm_radeon_private_t *dev_priv, int addr)
{
	RADEON_WRITE(RS690_MC_INDEX, (addr & RS690_MC_INDEX_MASK));
	return RADEON_READ(RS690_MC_DATA);
}

D
Dave Airlie 已提交
58 59 60 61 62
u32 radeon_read_fb_location(drm_radeon_private_t *dev_priv)
{

	if ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV515)
		return RADEON_READ_MCIND(dev_priv, RV515_MC_FB_LOCATION);
63 64
	else if ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS690)
		return RS690_READ_MCIND(dev_priv, RS690_MC_FB_LOCATION);
D
Dave Airlie 已提交
65 66 67 68 69 70 71 72 73 74
	else if ((dev_priv->flags & RADEON_FAMILY_MASK) > CHIP_RV515)
		return RADEON_READ_MCIND(dev_priv, R520_MC_FB_LOCATION);
	else
		return RADEON_READ(RADEON_MC_FB_LOCATION);
}

static void radeon_write_fb_location(drm_radeon_private_t *dev_priv, u32 fb_loc)
{
	if ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV515)
		RADEON_WRITE_MCIND(RV515_MC_FB_LOCATION, fb_loc);
75 76
	else if ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS690)
		RS690_WRITE_MCIND(RS690_MC_FB_LOCATION, fb_loc);
D
Dave Airlie 已提交
77 78 79 80 81 82 83 84 85 86
	else if ((dev_priv->flags & RADEON_FAMILY_MASK) > CHIP_RV515)
		RADEON_WRITE_MCIND(R520_MC_FB_LOCATION, fb_loc);
	else
		RADEON_WRITE(RADEON_MC_FB_LOCATION, fb_loc);
}

static void radeon_write_agp_location(drm_radeon_private_t *dev_priv, u32 agp_loc)
{
	if ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV515)
		RADEON_WRITE_MCIND(RV515_MC_AGP_LOCATION, agp_loc);
87 88
	else if ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS690)
		RS690_WRITE_MCIND(RS690_MC_AGP_LOCATION, agp_loc);
D
Dave Airlie 已提交
89 90 91 92 93 94
	else if ((dev_priv->flags & RADEON_FAMILY_MASK) > CHIP_RV515)
		RADEON_WRITE_MCIND(R520_MC_AGP_LOCATION, agp_loc);
	else
		RADEON_WRITE(RADEON_MC_AGP_LOCATION, agp_loc);
}

95
static int RADEON_READ_PLL(struct drm_device * dev, int addr)
L
Linus Torvalds 已提交
96 97 98 99 100 101 102
{
	drm_radeon_private_t *dev_priv = dev->dev_private;

	RADEON_WRITE8(RADEON_CLOCK_CNTL_INDEX, addr & 0x1f);
	return RADEON_READ(RADEON_CLOCK_CNTL_DATA);
}

D
Dave Airlie 已提交
103
static u32 RADEON_READ_PCIE(drm_radeon_private_t *dev_priv, int addr)
104 105 106 107 108
{
	RADEON_WRITE8(RADEON_PCIE_INDEX, addr & 0xff);
	return RADEON_READ(RADEON_PCIE_DATA);
}

109 110 111 112 113 114 115 116 117
static u32 RADEON_READ_IGPGART(drm_radeon_private_t *dev_priv, int addr)
{
	u32 ret;
	RADEON_WRITE(RADEON_IGPGART_INDEX, addr & 0x7f);
	ret = RADEON_READ(RADEON_IGPGART_DATA);
	RADEON_WRITE(RADEON_IGPGART_INDEX, 0x7f);
	return ret;
}

L
Linus Torvalds 已提交
118
#if RADEON_FIFO_DEBUG
D
Dave Airlie 已提交
119
static void radeon_status(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
120
{
121
	printk("%s:\n", __func__);
D
Dave Airlie 已提交
122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137
	printk("RBBM_STATUS = 0x%08x\n",
	       (unsigned int)RADEON_READ(RADEON_RBBM_STATUS));
	printk("CP_RB_RTPR = 0x%08x\n",
	       (unsigned int)RADEON_READ(RADEON_CP_RB_RPTR));
	printk("CP_RB_WTPR = 0x%08x\n",
	       (unsigned int)RADEON_READ(RADEON_CP_RB_WPTR));
	printk("AIC_CNTL = 0x%08x\n",
	       (unsigned int)RADEON_READ(RADEON_AIC_CNTL));
	printk("AIC_STAT = 0x%08x\n",
	       (unsigned int)RADEON_READ(RADEON_AIC_STAT));
	printk("AIC_PT_BASE = 0x%08x\n",
	       (unsigned int)RADEON_READ(RADEON_AIC_PT_BASE));
	printk("TLB_ADDR = 0x%08x\n",
	       (unsigned int)RADEON_READ(RADEON_AIC_TLB_ADDR));
	printk("TLB_DATA = 0x%08x\n",
	       (unsigned int)RADEON_READ(RADEON_AIC_TLB_DATA));
L
Linus Torvalds 已提交
138 139 140 141 142 143 144
}
#endif

/* ================================================================
 * Engine, FIFO control
 */

D
Dave Airlie 已提交
145
static int radeon_do_pixcache_flush(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
146 147 148 149 150 151
{
	u32 tmp;
	int i;

	dev_priv->stats.boxes |= RADEON_BOX_WAIT_IDLE;

152 153 154
	tmp = RADEON_READ(RADEON_RB3D_DSTCACHE_CTLSTAT);
	tmp |= RADEON_RB3D_DC_FLUSH_ALL;
	RADEON_WRITE(RADEON_RB3D_DSTCACHE_CTLSTAT, tmp);
L
Linus Torvalds 已提交
155

D
Dave Airlie 已提交
156
	for (i = 0; i < dev_priv->usec_timeout; i++) {
157 158
		if (!(RADEON_READ(RADEON_RB3D_DSTCACHE_CTLSTAT)
		      & RADEON_RB3D_DC_BUSY)) {
L
Linus Torvalds 已提交
159 160
			return 0;
		}
D
Dave Airlie 已提交
161
		DRM_UDELAY(1);
L
Linus Torvalds 已提交
162 163 164
	}

#if RADEON_FIFO_DEBUG
D
Dave Airlie 已提交
165 166
	DRM_ERROR("failed!\n");
	radeon_status(dev_priv);
L
Linus Torvalds 已提交
167
#endif
E
Eric Anholt 已提交
168
	return -EBUSY;
L
Linus Torvalds 已提交
169 170
}

D
Dave Airlie 已提交
171
static int radeon_do_wait_for_fifo(drm_radeon_private_t * dev_priv, int entries)
L
Linus Torvalds 已提交
172 173 174 175 176
{
	int i;

	dev_priv->stats.boxes |= RADEON_BOX_WAIT_IDLE;

D
Dave Airlie 已提交
177 178 179 180 181 182
	for (i = 0; i < dev_priv->usec_timeout; i++) {
		int slots = (RADEON_READ(RADEON_RBBM_STATUS)
			     & RADEON_RBBM_FIFOCNT_MASK);
		if (slots >= entries)
			return 0;
		DRM_UDELAY(1);
L
Linus Torvalds 已提交
183 184 185
	}

#if RADEON_FIFO_DEBUG
D
Dave Airlie 已提交
186 187
	DRM_ERROR("failed!\n");
	radeon_status(dev_priv);
L
Linus Torvalds 已提交
188
#endif
E
Eric Anholt 已提交
189
	return -EBUSY;
L
Linus Torvalds 已提交
190 191
}

D
Dave Airlie 已提交
192
static int radeon_do_wait_for_idle(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
193 194 195 196 197
{
	int i, ret;

	dev_priv->stats.boxes |= RADEON_BOX_WAIT_IDLE;

D
Dave Airlie 已提交
198 199 200
	ret = radeon_do_wait_for_fifo(dev_priv, 64);
	if (ret)
		return ret;
L
Linus Torvalds 已提交
201

D
Dave Airlie 已提交
202 203 204 205
	for (i = 0; i < dev_priv->usec_timeout; i++) {
		if (!(RADEON_READ(RADEON_RBBM_STATUS)
		      & RADEON_RBBM_ACTIVE)) {
			radeon_do_pixcache_flush(dev_priv);
L
Linus Torvalds 已提交
206 207
			return 0;
		}
D
Dave Airlie 已提交
208
		DRM_UDELAY(1);
L
Linus Torvalds 已提交
209 210 211
	}

#if RADEON_FIFO_DEBUG
D
Dave Airlie 已提交
212 213
	DRM_ERROR("failed!\n");
	radeon_status(dev_priv);
L
Linus Torvalds 已提交
214
#endif
E
Eric Anholt 已提交
215
	return -EBUSY;
L
Linus Torvalds 已提交
216 217 218 219 220 221 222
}

/* ================================================================
 * CP control, initialization
 */

/* Load the microcode for the CP */
D
Dave Airlie 已提交
223
static void radeon_cp_load_microcode(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
224 225
{
	int i;
D
Dave Airlie 已提交
226
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
227

D
Dave Airlie 已提交
228
	radeon_do_wait_for_idle(dev_priv);
L
Linus Torvalds 已提交
229

D
Dave Airlie 已提交
230
	RADEON_WRITE(RADEON_CP_ME_RAM_ADDR, 0);
231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246
	if (((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_R100) ||
	    ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV100) ||
	    ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV200) ||
	    ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS100) ||
	    ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS200)) {
		DRM_INFO("Loading R100 Microcode\n");
		for (i = 0; i < 256; i++) {
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAH,
				     R100_cp_microcode[i][1]);
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAL,
				     R100_cp_microcode[i][0]);
		}
	} else if (((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_R200) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV250) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV280) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS300)) {
L
Linus Torvalds 已提交
247
		DRM_INFO("Loading R200 Microcode\n");
D
Dave Airlie 已提交
248 249 250 251 252
		for (i = 0; i < 256; i++) {
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAH,
				     R200_cp_microcode[i][1]);
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAL,
				     R200_cp_microcode[i][0]);
L
Linus Torvalds 已提交
253
		}
254 255 256 257 258
	} else if (((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_R300) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_R350) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV350) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV380) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS400)) {
L
Linus Torvalds 已提交
259
		DRM_INFO("Loading R300 Microcode\n");
D
Dave Airlie 已提交
260 261 262 263 264
		for (i = 0; i < 256; i++) {
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAH,
				     R300_cp_microcode[i][1]);
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAL,
				     R300_cp_microcode[i][0]);
L
Linus Torvalds 已提交
265
		}
266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289
	} else if (((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_R420) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV410)) {
		DRM_INFO("Loading R400 Microcode\n");
		for (i = 0; i < 256; i++) {
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAH,
				     R420_cp_microcode[i][1]);
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAL,
				     R420_cp_microcode[i][0]);
		}
	} else if ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS690) {
		DRM_INFO("Loading RS690 Microcode\n");
		for (i = 0; i < 256; i++) {
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAH,
				     RS690_cp_microcode[i][1]);
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAL,
				     RS690_cp_microcode[i][0]);
		}
	} else if (((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV515) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_R520) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV530) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_R580) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV560) ||
		   ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RV570)) {
		DRM_INFO("Loading R500 Microcode\n");
D
Dave Airlie 已提交
290 291
		for (i = 0; i < 256; i++) {
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAH,
292
				     R520_cp_microcode[i][1]);
D
Dave Airlie 已提交
293
			RADEON_WRITE(RADEON_CP_ME_RAM_DATAL,
294
				     R520_cp_microcode[i][0]);
L
Linus Torvalds 已提交
295 296 297 298 299 300 301 302
		}
	}
}

/* Flush any pending commands to the CP.  This should only be used just
 * prior to a wait for idle, as it informs the engine that the command
 * stream is ending.
 */
D
Dave Airlie 已提交
303
static void radeon_do_cp_flush(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
304
{
D
Dave Airlie 已提交
305
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
306 307 308
#if 0
	u32 tmp;

D
Dave Airlie 已提交
309 310
	tmp = RADEON_READ(RADEON_CP_RB_WPTR) | (1 << 31);
	RADEON_WRITE(RADEON_CP_RB_WPTR, tmp);
L
Linus Torvalds 已提交
311 312 313 314 315
#endif
}

/* Wait for the CP to go idle.
 */
D
Dave Airlie 已提交
316
int radeon_do_cp_idle(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
317 318
{
	RING_LOCALS;
D
Dave Airlie 已提交
319
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
320

D
Dave Airlie 已提交
321
	BEGIN_RING(6);
L
Linus Torvalds 已提交
322 323 324 325 326 327 328 329

	RADEON_PURGE_CACHE();
	RADEON_PURGE_ZCACHE();
	RADEON_WAIT_UNTIL_IDLE();

	ADVANCE_RING();
	COMMIT_RING();

D
Dave Airlie 已提交
330
	return radeon_do_wait_for_idle(dev_priv);
L
Linus Torvalds 已提交
331 332 333 334
}

/* Start the Command Processor.
 */
D
Dave Airlie 已提交
335
static void radeon_do_cp_start(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
336 337
{
	RING_LOCALS;
D
Dave Airlie 已提交
338
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
339

D
Dave Airlie 已提交
340
	radeon_do_wait_for_idle(dev_priv);
L
Linus Torvalds 已提交
341

D
Dave Airlie 已提交
342
	RADEON_WRITE(RADEON_CP_CSQ_CNTL, dev_priv->cp_mode);
L
Linus Torvalds 已提交
343 344 345

	dev_priv->cp_running = 1;

D
Dave Airlie 已提交
346
	BEGIN_RING(6);
L
Linus Torvalds 已提交
347 348 349 350 351 352 353 354 355 356 357 358 359

	RADEON_PURGE_CACHE();
	RADEON_PURGE_ZCACHE();
	RADEON_WAIT_UNTIL_IDLE();

	ADVANCE_RING();
	COMMIT_RING();
}

/* Reset the Command Processor.  This will not flush any pending
 * commands, so you must wait for the CP command stream to complete
 * before calling this routine.
 */
D
Dave Airlie 已提交
360
static void radeon_do_cp_reset(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
361 362
{
	u32 cur_read_ptr;
D
Dave Airlie 已提交
363
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
364

D
Dave Airlie 已提交
365 366 367
	cur_read_ptr = RADEON_READ(RADEON_CP_RB_RPTR);
	RADEON_WRITE(RADEON_CP_RB_WPTR, cur_read_ptr);
	SET_RING_HEAD(dev_priv, cur_read_ptr);
L
Linus Torvalds 已提交
368 369 370 371 372 373 374
	dev_priv->ring.tail = cur_read_ptr;
}

/* Stop the Command Processor.  This will not flush any pending
 * commands, so you must flush the command stream and wait for the CP
 * to go idle before calling this routine.
 */
D
Dave Airlie 已提交
375
static void radeon_do_cp_stop(drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
376
{
D
Dave Airlie 已提交
377
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
378

D
Dave Airlie 已提交
379
	RADEON_WRITE(RADEON_CP_CSQ_CNTL, RADEON_CSQ_PRIDIS_INDDIS);
L
Linus Torvalds 已提交
380 381 382 383 384 385

	dev_priv->cp_running = 0;
}

/* Reset the engine.  This will stop the CP if it is running.
 */
386
static int radeon_do_engine_reset(struct drm_device * dev)
L
Linus Torvalds 已提交
387 388 389
{
	drm_radeon_private_t *dev_priv = dev->dev_private;
	u32 clock_cntl_index, mclk_cntl, rbbm_soft_reset;
D
Dave Airlie 已提交
390
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
391

D
Dave Airlie 已提交
392 393
	radeon_do_pixcache_flush(dev_priv);

D
Dave Airlie 已提交
394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430
	if ((dev_priv->flags & RADEON_FAMILY_MASK) < CHIP_RV515) {
		clock_cntl_index = RADEON_READ(RADEON_CLOCK_CNTL_INDEX);
		mclk_cntl = RADEON_READ_PLL(dev, RADEON_MCLK_CNTL);

		RADEON_WRITE_PLL(RADEON_MCLK_CNTL, (mclk_cntl |
						    RADEON_FORCEON_MCLKA |
						    RADEON_FORCEON_MCLKB |
						    RADEON_FORCEON_YCLKA |
						    RADEON_FORCEON_YCLKB |
						    RADEON_FORCEON_MC |
						    RADEON_FORCEON_AIC));

		rbbm_soft_reset = RADEON_READ(RADEON_RBBM_SOFT_RESET);

		RADEON_WRITE(RADEON_RBBM_SOFT_RESET, (rbbm_soft_reset |
						      RADEON_SOFT_RESET_CP |
						      RADEON_SOFT_RESET_HI |
						      RADEON_SOFT_RESET_SE |
						      RADEON_SOFT_RESET_RE |
						      RADEON_SOFT_RESET_PP |
						      RADEON_SOFT_RESET_E2 |
						      RADEON_SOFT_RESET_RB));
		RADEON_READ(RADEON_RBBM_SOFT_RESET);
		RADEON_WRITE(RADEON_RBBM_SOFT_RESET, (rbbm_soft_reset &
						      ~(RADEON_SOFT_RESET_CP |
							RADEON_SOFT_RESET_HI |
							RADEON_SOFT_RESET_SE |
							RADEON_SOFT_RESET_RE |
							RADEON_SOFT_RESET_PP |
							RADEON_SOFT_RESET_E2 |
							RADEON_SOFT_RESET_RB)));
		RADEON_READ(RADEON_RBBM_SOFT_RESET);

		RADEON_WRITE_PLL(RADEON_MCLK_CNTL, mclk_cntl);
		RADEON_WRITE(RADEON_CLOCK_CNTL_INDEX, clock_cntl_index);
		RADEON_WRITE(RADEON_RBBM_SOFT_RESET, rbbm_soft_reset);
	}
L
Linus Torvalds 已提交
431 432

	/* Reset the CP ring */
D
Dave Airlie 已提交
433
	radeon_do_cp_reset(dev_priv);
L
Linus Torvalds 已提交
434 435 436 437 438

	/* The CP is no longer running after an engine reset */
	dev_priv->cp_running = 0;

	/* Reset any pending vertex, indirect buffers */
D
Dave Airlie 已提交
439
	radeon_freelist_reset(dev);
L
Linus Torvalds 已提交
440 441 442 443

	return 0;
}

444
static void radeon_cp_init_ring_buffer(struct drm_device * dev,
D
Dave Airlie 已提交
445
				       drm_radeon_private_t * dev_priv)
L
Linus Torvalds 已提交
446 447 448
{
	u32 ring_start, cur_read_ptr;
	u32 tmp;
D
Dave Airlie 已提交
449

450 451 452 453 454 455
	/* Initialize the memory controller. With new memory map, the fb location
	 * is not changed, it should have been properly initialized already. Part
	 * of the problem is that the code below is bogus, assuming the GART is
	 * always appended to the fb which is not necessarily the case
	 */
	if (!dev_priv->new_memmap)
D
Dave Airlie 已提交
456
		radeon_write_fb_location(dev_priv,
457 458
			     ((dev_priv->gart_vm_start - 1) & 0xffff0000)
			     | (dev_priv->fb_location >> 16));
L
Linus Torvalds 已提交
459 460

#if __OS_HAS_AGP
461
	if (dev_priv->flags & RADEON_IS_AGP) {
462
		RADEON_WRITE(RADEON_AGP_BASE, (unsigned int)dev->agp->base);
D
Dave Airlie 已提交
463
		radeon_write_agp_location(dev_priv,
D
Dave Airlie 已提交
464 465 466
			     (((dev_priv->gart_vm_start - 1 +
				dev_priv->gart_size) & 0xffff0000) |
			      (dev_priv->gart_vm_start >> 16)));
L
Linus Torvalds 已提交
467 468 469 470

		ring_start = (dev_priv->cp_ring->offset
			      - dev->agp->base
			      + dev_priv->gart_vm_start);
471
	} else
L
Linus Torvalds 已提交
472 473
#endif
		ring_start = (dev_priv->cp_ring->offset
474
			      - (unsigned long)dev->sg->virtual
L
Linus Torvalds 已提交
475 476
			      + dev_priv->gart_vm_start);

D
Dave Airlie 已提交
477
	RADEON_WRITE(RADEON_CP_RB_BASE, ring_start);
L
Linus Torvalds 已提交
478 479

	/* Set the write pointer delay */
D
Dave Airlie 已提交
480
	RADEON_WRITE(RADEON_CP_RB_WPTR_DELAY, 0);
L
Linus Torvalds 已提交
481 482

	/* Initialize the ring buffer's read and write pointers */
D
Dave Airlie 已提交
483 484 485
	cur_read_ptr = RADEON_READ(RADEON_CP_RB_RPTR);
	RADEON_WRITE(RADEON_CP_RB_WPTR, cur_read_ptr);
	SET_RING_HEAD(dev_priv, cur_read_ptr);
L
Linus Torvalds 已提交
486 487 488
	dev_priv->ring.tail = cur_read_ptr;

#if __OS_HAS_AGP
489
	if (dev_priv->flags & RADEON_IS_AGP) {
D
Dave Airlie 已提交
490 491 492
		RADEON_WRITE(RADEON_CP_RB_RPTR_ADDR,
			     dev_priv->ring_rptr->offset
			     - dev->agp->base + dev_priv->gart_vm_start);
L
Linus Torvalds 已提交
493 494 495
	} else
#endif
	{
D
Dave Airlie 已提交
496
		struct drm_sg_mem *entry = dev->sg;
L
Linus Torvalds 已提交
497 498
		unsigned long tmp_ofs, page_ofs;

499 500
		tmp_ofs = dev_priv->ring_rptr->offset -
				(unsigned long)dev->sg->virtual;
L
Linus Torvalds 已提交
501 502
		page_ofs = tmp_ofs >> PAGE_SHIFT;

D
Dave Airlie 已提交
503 504 505 506
		RADEON_WRITE(RADEON_CP_RB_RPTR_ADDR, entry->busaddr[page_ofs]);
		DRM_DEBUG("ring rptr: offset=0x%08lx handle=0x%08lx\n",
			  (unsigned long)entry->busaddr[page_ofs],
			  entry->handle + tmp_ofs);
L
Linus Torvalds 已提交
507 508
	}

509 510 511
	/* Set ring buffer size */
#ifdef __BIG_ENDIAN
	RADEON_WRITE(RADEON_CP_RB_CNTL,
512 513 514 515
		     RADEON_BUF_SWAP_32BIT |
		     (dev_priv->ring.fetch_size_l2ow << 18) |
		     (dev_priv->ring.rptr_update_l2qw << 8) |
		     dev_priv->ring.size_l2qw);
516
#else
517 518 519 520
	RADEON_WRITE(RADEON_CP_RB_CNTL,
		     (dev_priv->ring.fetch_size_l2ow << 18) |
		     (dev_priv->ring.rptr_update_l2qw << 8) |
		     dev_priv->ring.size_l2qw);
521 522 523 524 525
#endif

	/* Start with assuming that writeback doesn't work */
	dev_priv->writeback_works = 0;

L
Linus Torvalds 已提交
526 527 528 529 530 531 532
	/* Initialize the scratch register pointer.  This will cause
	 * the scratch register values to be written out to memory
	 * whenever they are updated.
	 *
	 * We simply put this behind the ring read pointer, this works
	 * with PCI GART as well as (whatever kind of) AGP GART
	 */
D
Dave Airlie 已提交
533 534
	RADEON_WRITE(RADEON_SCRATCH_ADDR, RADEON_READ(RADEON_CP_RB_RPTR_ADDR)
		     + RADEON_SCRATCH_REG_OFFSET);
L
Linus Torvalds 已提交
535 536 537 538 539

	dev_priv->scratch = ((__volatile__ u32 *)
			     dev_priv->ring_rptr->handle +
			     (RADEON_SCRATCH_REG_OFFSET / sizeof(u32)));

D
Dave Airlie 已提交
540
	RADEON_WRITE(RADEON_SCRATCH_UMSK, 0x7);
L
Linus Torvalds 已提交
541

542 543 544
	/* Turn on bus mastering */
	tmp = RADEON_READ(RADEON_BUS_CNTL) & ~RADEON_BUS_MASTER_DIS;
	RADEON_WRITE(RADEON_BUS_CNTL, tmp);
L
Linus Torvalds 已提交
545 546

	dev_priv->sarea_priv->last_frame = dev_priv->scratch[0] = 0;
D
Dave Airlie 已提交
547
	RADEON_WRITE(RADEON_LAST_FRAME_REG, dev_priv->sarea_priv->last_frame);
L
Linus Torvalds 已提交
548 549

	dev_priv->sarea_priv->last_dispatch = dev_priv->scratch[1] = 0;
D
Dave Airlie 已提交
550 551
	RADEON_WRITE(RADEON_LAST_DISPATCH_REG,
		     dev_priv->sarea_priv->last_dispatch);
L
Linus Torvalds 已提交
552 553

	dev_priv->sarea_priv->last_clear = dev_priv->scratch[2] = 0;
D
Dave Airlie 已提交
554
	RADEON_WRITE(RADEON_LAST_CLEAR_REG, dev_priv->sarea_priv->last_clear);
L
Linus Torvalds 已提交
555

D
Dave Airlie 已提交
556
	radeon_do_wait_for_idle(dev_priv);
L
Linus Torvalds 已提交
557 558

	/* Sync everything up */
D
Dave Airlie 已提交
559 560 561 562 563
	RADEON_WRITE(RADEON_ISYNC_CNTL,
		     (RADEON_ISYNC_ANY2D_IDLE3D |
		      RADEON_ISYNC_ANY3D_IDLE2D |
		      RADEON_ISYNC_WAIT_IDLEGUI |
		      RADEON_ISYNC_CPSCRATCH_IDLEGUI));
564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594

}

static void radeon_test_writeback(drm_radeon_private_t * dev_priv)
{
	u32 tmp;

	/* Writeback doesn't seem to work everywhere, test it here and possibly
	 * enable it if it appears to work
	 */
	DRM_WRITE32(dev_priv->ring_rptr, RADEON_SCRATCHOFF(1), 0);
	RADEON_WRITE(RADEON_SCRATCH_REG1, 0xdeadbeef);

	for (tmp = 0; tmp < dev_priv->usec_timeout; tmp++) {
		if (DRM_READ32(dev_priv->ring_rptr, RADEON_SCRATCHOFF(1)) ==
		    0xdeadbeef)
			break;
		DRM_UDELAY(1);
	}

	if (tmp < dev_priv->usec_timeout) {
		dev_priv->writeback_works = 1;
		DRM_INFO("writeback test succeeded in %d usecs\n", tmp);
	} else {
		dev_priv->writeback_works = 0;
		DRM_INFO("writeback test failed\n");
	}
	if (radeon_no_wb == 1) {
		dev_priv->writeback_works = 0;
		DRM_INFO("writeback forced off\n");
	}
595 596 597 598 599 600 601

	if (!dev_priv->writeback_works) {
		/* Disable writeback to avoid unnecessary bus master transfer */
		RADEON_WRITE(RADEON_CP_RB_CNTL, RADEON_READ(RADEON_CP_RB_CNTL) |
			     RADEON_RB_NO_UPDATE);
		RADEON_WRITE(RADEON_SCRATCH_UMSK, 0);
	}
L
Linus Torvalds 已提交
602 603
}

604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626
/* Enable or disable IGP GART on the chip */
static void radeon_set_igpgart(drm_radeon_private_t * dev_priv, int on)
{
	u32 temp, tmp;

	tmp = RADEON_READ(RADEON_AIC_CNTL);
	if (on) {
		DRM_DEBUG("programming igpgart %08X %08lX %08X\n",
			 dev_priv->gart_vm_start,
			 (long)dev_priv->gart_info.bus_addr,
			 dev_priv->gart_size);

		RADEON_WRITE_IGPGART(RADEON_IGPGART_UNK_18, 0x1000);
		RADEON_WRITE_IGPGART(RADEON_IGPGART_ENABLE, 0x1);
		RADEON_WRITE_IGPGART(RADEON_IGPGART_CTRL, 0x42040800);
		RADEON_WRITE_IGPGART(RADEON_IGPGART_BASE_ADDR,
				     dev_priv->gart_info.bus_addr);

		temp = RADEON_READ_IGPGART(dev_priv, RADEON_IGPGART_UNK_39);
		RADEON_WRITE_IGPGART(RADEON_IGPGART_UNK_39, temp);

		RADEON_WRITE(RADEON_AGP_BASE, (unsigned int)dev_priv->gart_vm_start);
		dev_priv->gart_size = 32*1024*1024;
D
Dave Airlie 已提交
627
		radeon_write_agp_location(dev_priv,
628 629 630 631 632 633 634 635 636 637 638 639 640 641
			     (((dev_priv->gart_vm_start - 1 +
			       dev_priv->gart_size) & 0xffff0000) |
			     (dev_priv->gart_vm_start >> 16)));

		temp = RADEON_READ_IGPGART(dev_priv, RADEON_IGPGART_ENABLE);
		RADEON_WRITE_IGPGART(RADEON_IGPGART_ENABLE, temp);

		RADEON_READ_IGPGART(dev_priv, RADEON_IGPGART_FLUSH);
		RADEON_WRITE_IGPGART(RADEON_IGPGART_FLUSH, 0x1);
		RADEON_READ_IGPGART(dev_priv, RADEON_IGPGART_FLUSH);
		RADEON_WRITE_IGPGART(RADEON_IGPGART_FLUSH, 0x0);
       }
}

642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661
/* Enable or disable RS690 GART on the chip */
static void radeon_set_rs690gart(drm_radeon_private_t *dev_priv, int on)
{
	u32 temp;

	if (on) {
		DRM_DEBUG("programming rs690 gart %08X %08lX %08X\n",
			  dev_priv->gart_vm_start,
			  (long)dev_priv->gart_info.bus_addr,
			  dev_priv->gart_size);

		temp = RS690_READ_MCIND(dev_priv, RS690_MC_MISC_CNTL);
		RS690_WRITE_MCIND(RS690_MC_MISC_CNTL, 0x5000);

		RS690_WRITE_MCIND(RS690_MC_AGP_SIZE,
				  RS690_MC_GART_EN | RS690_MC_AGP_SIZE_32MB);

		temp = RS690_READ_MCIND(dev_priv, RS690_MC_GART_FEATURE_ID);
		RS690_WRITE_MCIND(RS690_MC_GART_FEATURE_ID, 0x42040800);

662 663 664
		temp = dev_priv->gart_info.bus_addr & 0xfffff000;
		temp |= (upper_32_bits(dev_priv->gart_info.bus_addr) & 0xff) << 4;
		RS690_WRITE_MCIND(RS690_MC_GART_BASE, temp);
665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706

		temp = RS690_READ_MCIND(dev_priv, RS690_MC_AGP_MODE_CONTROL);
		RS690_WRITE_MCIND(RS690_MC_AGP_MODE_CONTROL, 0x01400000);

		RS690_WRITE_MCIND(RS690_MC_AGP_BASE,
				  (unsigned int)dev_priv->gart_vm_start);

		dev_priv->gart_size = 32*1024*1024;
		temp = (((dev_priv->gart_vm_start - 1 + dev_priv->gart_size) &
			 0xffff0000) | (dev_priv->gart_vm_start >> 16));

		RS690_WRITE_MCIND(RS690_MC_AGP_LOCATION, temp);

		temp = RS690_READ_MCIND(dev_priv, RS690_MC_AGP_SIZE);
		RS690_WRITE_MCIND(RS690_MC_AGP_SIZE,
				  RS690_MC_GART_EN | RS690_MC_AGP_SIZE_32MB);

		do {
			temp = RS690_READ_MCIND(dev_priv, RS690_MC_GART_CACHE_CNTL);
			if ((temp & RS690_MC_GART_CLEAR_STATUS) ==
			    RS690_MC_GART_CLEAR_DONE)
				break;
			DRM_UDELAY(1);
		} while (1);

		RS690_WRITE_MCIND(RS690_MC_GART_CACHE_CNTL,
				  RS690_MC_GART_CC_CLEAR);
		do {
			temp = RS690_READ_MCIND(dev_priv, RS690_MC_GART_CACHE_CNTL);
			if ((temp & RS690_MC_GART_CLEAR_STATUS) ==
				   RS690_MC_GART_CLEAR_DONE)
				break;
			DRM_UDELAY(1);
		} while (1);

		RS690_WRITE_MCIND(RS690_MC_GART_CACHE_CNTL,
				  RS690_MC_GART_CC_NO_CHANGE);
	} else {
		RS690_WRITE_MCIND(RS690_MC_AGP_SIZE, RS690_MC_GART_DIS);
	}
}

707 708 709 710 711 712
static void radeon_set_pciegart(drm_radeon_private_t * dev_priv, int on)
{
	u32 tmp = RADEON_READ_PCIE(dev_priv, RADEON_PCIE_TX_GART_CNTL);
	if (on) {

		DRM_DEBUG("programming pcie %08X %08lX %08X\n",
D
Dave Airlie 已提交
713 714
			  dev_priv->gart_vm_start,
			  (long)dev_priv->gart_info.bus_addr,
715
			  dev_priv->gart_size);
D
Dave Airlie 已提交
716 717 718 719 720 721 722 723 724 725
		RADEON_WRITE_PCIE(RADEON_PCIE_TX_DISCARD_RD_ADDR_LO,
				  dev_priv->gart_vm_start);
		RADEON_WRITE_PCIE(RADEON_PCIE_TX_GART_BASE,
				  dev_priv->gart_info.bus_addr);
		RADEON_WRITE_PCIE(RADEON_PCIE_TX_GART_START_LO,
				  dev_priv->gart_vm_start);
		RADEON_WRITE_PCIE(RADEON_PCIE_TX_GART_END_LO,
				  dev_priv->gart_vm_start +
				  dev_priv->gart_size - 1);

D
Dave Airlie 已提交
726
		radeon_write_agp_location(dev_priv, 0xffffffc0); /* ?? */
D
Dave Airlie 已提交
727 728 729

		RADEON_WRITE_PCIE(RADEON_PCIE_TX_GART_CNTL,
				  RADEON_PCIE_TX_GART_EN);
730
	} else {
D
Dave Airlie 已提交
731 732
		RADEON_WRITE_PCIE(RADEON_PCIE_TX_GART_CNTL,
				  tmp & ~RADEON_PCIE_TX_GART_EN);
733
	}
L
Linus Torvalds 已提交
734 735 736
}

/* Enable or disable PCI GART on the chip */
D
Dave Airlie 已提交
737
static void radeon_set_pcigart(drm_radeon_private_t * dev_priv, int on)
L
Linus Torvalds 已提交
738
{
739
	u32 tmp;
L
Linus Torvalds 已提交
740

741 742 743 744 745
	if ((dev_priv->flags & RADEON_FAMILY_MASK) == CHIP_RS690) {
		radeon_set_rs690gart(dev_priv, on);
		return;
	}

746 747 748 749 750
	if (dev_priv->flags & RADEON_IS_IGPGART) {
		radeon_set_igpgart(dev_priv, on);
		return;
	}

751
	if (dev_priv->flags & RADEON_IS_PCIE) {
752 753 754
		radeon_set_pciegart(dev_priv, on);
		return;
	}
L
Linus Torvalds 已提交
755

D
Dave Airlie 已提交
756
	tmp = RADEON_READ(RADEON_AIC_CNTL);
757

D
Dave Airlie 已提交
758 759 760
	if (on) {
		RADEON_WRITE(RADEON_AIC_CNTL,
			     tmp | RADEON_PCIGART_TRANSLATE_EN);
L
Linus Torvalds 已提交
761 762 763

		/* set PCI GART page-table base address
		 */
764
		RADEON_WRITE(RADEON_AIC_PT_BASE, dev_priv->gart_info.bus_addr);
L
Linus Torvalds 已提交
765 766 767

		/* set address range for PCI address translate
		 */
D
Dave Airlie 已提交
768 769 770
		RADEON_WRITE(RADEON_AIC_LO_ADDR, dev_priv->gart_vm_start);
		RADEON_WRITE(RADEON_AIC_HI_ADDR, dev_priv->gart_vm_start
			     + dev_priv->gart_size - 1);
L
Linus Torvalds 已提交
771 772 773

		/* Turn off AGP aperture -- is this required for PCI GART?
		 */
D
Dave Airlie 已提交
774
		radeon_write_agp_location(dev_priv, 0xffffffc0);
D
Dave Airlie 已提交
775
		RADEON_WRITE(RADEON_AGP_COMMAND, 0);	/* clear AGP_COMMAND */
L
Linus Torvalds 已提交
776
	} else {
D
Dave Airlie 已提交
777 778
		RADEON_WRITE(RADEON_AIC_CNTL,
			     tmp & ~RADEON_PCIGART_TRANSLATE_EN);
L
Linus Torvalds 已提交
779 780 781
	}
}

782
static int radeon_do_init_cp(struct drm_device * dev, drm_radeon_init_t * init)
L
Linus Torvalds 已提交
783
{
784 785
	drm_radeon_private_t *dev_priv = dev->dev_private;

D
Dave Airlie 已提交
786
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
787

D
Dave Airlie 已提交
788
	/* if we require new memory map but we don't have it fail */
789
	if ((dev_priv->flags & RADEON_NEW_MEMMAP) && !dev_priv->new_memmap) {
790
		DRM_ERROR("Cannot initialise DRM on this card\nThis card requires a new X.org DDX for 3D\n");
D
Dave Airlie 已提交
791
		radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
792
		return -EINVAL;
D
Dave Airlie 已提交
793 794
	}

795
	if (init->is_pci && (dev_priv->flags & RADEON_IS_AGP)) {
796
		DRM_DEBUG("Forcing AGP card to PCI mode\n");
797 798
		dev_priv->flags &= ~RADEON_IS_AGP;
	} else if (!(dev_priv->flags & (RADEON_IS_AGP | RADEON_IS_PCI | RADEON_IS_PCIE))
799 800
		   && !init->is_pci) {
		DRM_DEBUG("Restoring AGP flag\n");
801
		dev_priv->flags |= RADEON_IS_AGP;
802
	}
L
Linus Torvalds 已提交
803

804
	if ((!(dev_priv->flags & RADEON_IS_AGP)) && !dev->sg) {
D
Dave Airlie 已提交
805
		DRM_ERROR("PCI GART memory not allocated!\n");
L
Linus Torvalds 已提交
806
		radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
807
		return -EINVAL;
L
Linus Torvalds 已提交
808 809 810
	}

	dev_priv->usec_timeout = init->usec_timeout;
D
Dave Airlie 已提交
811 812 813
	if (dev_priv->usec_timeout < 1 ||
	    dev_priv->usec_timeout > RADEON_MAX_USEC_TIMEOUT) {
		DRM_DEBUG("TIMEOUT problem!\n");
L
Linus Torvalds 已提交
814
		radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
815
		return -EINVAL;
L
Linus Torvalds 已提交
816 817
	}

818 819 820 821
	/* Enable vblank on CRTC1 for older X servers
	 */
	dev_priv->vblank_crtc = DRM_RADEON_VBLANK_CRTC1;

822
	switch(init->func) {
L
Linus Torvalds 已提交
823
	case RADEON_INIT_R200_CP:
D
Dave Airlie 已提交
824
		dev_priv->microcode_version = UCODE_R200;
L
Linus Torvalds 已提交
825 826
		break;
	case RADEON_INIT_R300_CP:
D
Dave Airlie 已提交
827
		dev_priv->microcode_version = UCODE_R300;
L
Linus Torvalds 已提交
828 829
		break;
	default:
D
Dave Airlie 已提交
830
		dev_priv->microcode_version = UCODE_R100;
L
Linus Torvalds 已提交
831
	}
D
Dave Airlie 已提交
832

L
Linus Torvalds 已提交
833 834 835 836 837 838 839
	dev_priv->do_boxes = 0;
	dev_priv->cp_mode = init->cp_mode;

	/* We don't support anything other than bus-mastering ring mode,
	 * but the ring can be in either AGP or PCI space for the ring
	 * read pointer.
	 */
D
Dave Airlie 已提交
840 841 842
	if ((init->cp_mode != RADEON_CSQ_PRIBM_INDDIS) &&
	    (init->cp_mode != RADEON_CSQ_PRIBM_INDBM)) {
		DRM_DEBUG("BAD cp_mode (%x)!\n", init->cp_mode);
L
Linus Torvalds 已提交
843
		radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
844
		return -EINVAL;
L
Linus Torvalds 已提交
845 846
	}

D
Dave Airlie 已提交
847
	switch (init->fb_bpp) {
L
Linus Torvalds 已提交
848 849 850 851 852 853 854 855
	case 16:
		dev_priv->color_fmt = RADEON_COLOR_FORMAT_RGB565;
		break;
	case 32:
	default:
		dev_priv->color_fmt = RADEON_COLOR_FORMAT_ARGB8888;
		break;
	}
D
Dave Airlie 已提交
856 857 858 859
	dev_priv->front_offset = init->front_offset;
	dev_priv->front_pitch = init->front_pitch;
	dev_priv->back_offset = init->back_offset;
	dev_priv->back_pitch = init->back_pitch;
L
Linus Torvalds 已提交
860

D
Dave Airlie 已提交
861
	switch (init->depth_bpp) {
L
Linus Torvalds 已提交
862 863 864 865 866 867 868 869
	case 16:
		dev_priv->depth_fmt = RADEON_DEPTH_FORMAT_16BIT_INT_Z;
		break;
	case 32:
	default:
		dev_priv->depth_fmt = RADEON_DEPTH_FORMAT_24BIT_INT_Z;
		break;
	}
D
Dave Airlie 已提交
870 871
	dev_priv->depth_offset = init->depth_offset;
	dev_priv->depth_pitch = init->depth_pitch;
L
Linus Torvalds 已提交
872 873 874 875 876 877 878 879

	/* Hardware state for depth clears.  Remove this if/when we no
	 * longer clear the depth buffer with a 3D rectangle.  Hard-code
	 * all values to prevent unwanted 3D state from slipping through
	 * and screwing with the clear operation.
	 */
	dev_priv->depth_clear.rb3d_cntl = (RADEON_PLANE_MASK_ENABLE |
					   (dev_priv->color_fmt << 10) |
D
Dave Airlie 已提交
880 881
					   (dev_priv->microcode_version ==
					    UCODE_R100 ? RADEON_ZBLOCK16 : 0));
L
Linus Torvalds 已提交
882

D
Dave Airlie 已提交
883 884 885 886 887 888 889
	dev_priv->depth_clear.rb3d_zstencilcntl =
	    (dev_priv->depth_fmt |
	     RADEON_Z_TEST_ALWAYS |
	     RADEON_STENCIL_TEST_ALWAYS |
	     RADEON_STENCIL_S_FAIL_REPLACE |
	     RADEON_STENCIL_ZPASS_REPLACE |
	     RADEON_STENCIL_ZFAIL_REPLACE | RADEON_Z_WRITE_ENABLE);
L
Linus Torvalds 已提交
890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907

	dev_priv->depth_clear.se_cntl = (RADEON_FFACE_CULL_CW |
					 RADEON_BFACE_SOLID |
					 RADEON_FFACE_SOLID |
					 RADEON_FLAT_SHADE_VTX_LAST |
					 RADEON_DIFFUSE_SHADE_FLAT |
					 RADEON_ALPHA_SHADE_FLAT |
					 RADEON_SPECULAR_SHADE_FLAT |
					 RADEON_FOG_SHADE_FLAT |
					 RADEON_VTX_PIX_CENTER_OGL |
					 RADEON_ROUND_MODE_TRUNC |
					 RADEON_ROUND_PREC_8TH_PIX);


	dev_priv->ring_offset = init->ring_offset;
	dev_priv->ring_rptr_offset = init->ring_rptr_offset;
	dev_priv->buffers_offset = init->buffers_offset;
	dev_priv->gart_textures_offset = init->gart_textures_offset;
D
Dave Airlie 已提交
908

909
	dev_priv->sarea = drm_getsarea(dev);
D
Dave Airlie 已提交
910
	if (!dev_priv->sarea) {
L
Linus Torvalds 已提交
911 912
		DRM_ERROR("could not find sarea!\n");
		radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
913
		return -EINVAL;
L
Linus Torvalds 已提交
914 915 916
	}

	dev_priv->cp_ring = drm_core_findmap(dev, init->ring_offset);
D
Dave Airlie 已提交
917
	if (!dev_priv->cp_ring) {
L
Linus Torvalds 已提交
918 919
		DRM_ERROR("could not find cp ring region!\n");
		radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
920
		return -EINVAL;
L
Linus Torvalds 已提交
921 922
	}
	dev_priv->ring_rptr = drm_core_findmap(dev, init->ring_rptr_offset);
D
Dave Airlie 已提交
923
	if (!dev_priv->ring_rptr) {
L
Linus Torvalds 已提交
924 925
		DRM_ERROR("could not find ring read pointer!\n");
		radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
926
		return -EINVAL;
L
Linus Torvalds 已提交
927
	}
928
	dev->agp_buffer_token = init->buffers_offset;
L
Linus Torvalds 已提交
929
	dev->agp_buffer_map = drm_core_findmap(dev, init->buffers_offset);
D
Dave Airlie 已提交
930
	if (!dev->agp_buffer_map) {
L
Linus Torvalds 已提交
931 932
		DRM_ERROR("could not find dma buffer region!\n");
		radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
933
		return -EINVAL;
L
Linus Torvalds 已提交
934 935
	}

D
Dave Airlie 已提交
936 937 938 939
	if (init->gart_textures_offset) {
		dev_priv->gart_textures =
		    drm_core_findmap(dev, init->gart_textures_offset);
		if (!dev_priv->gart_textures) {
L
Linus Torvalds 已提交
940 941
			DRM_ERROR("could not find GART texture region!\n");
			radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
942
			return -EINVAL;
L
Linus Torvalds 已提交
943 944 945 946
		}
	}

	dev_priv->sarea_priv =
D
Dave Airlie 已提交
947 948
	    (drm_radeon_sarea_t *) ((u8 *) dev_priv->sarea->handle +
				    init->sarea_priv_offset);
L
Linus Torvalds 已提交
949 950

#if __OS_HAS_AGP
951
	if (dev_priv->flags & RADEON_IS_AGP) {
D
Dave Airlie 已提交
952 953 954 955 956 957
		drm_core_ioremap(dev_priv->cp_ring, dev);
		drm_core_ioremap(dev_priv->ring_rptr, dev);
		drm_core_ioremap(dev->agp_buffer_map, dev);
		if (!dev_priv->cp_ring->handle ||
		    !dev_priv->ring_rptr->handle ||
		    !dev->agp_buffer_map->handle) {
L
Linus Torvalds 已提交
958 959
			DRM_ERROR("could not find ioremap agp regions!\n");
			radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
960
			return -EINVAL;
L
Linus Torvalds 已提交
961 962 963 964
		}
	} else
#endif
	{
D
Dave Airlie 已提交
965
		dev_priv->cp_ring->handle = (void *)dev_priv->cp_ring->offset;
L
Linus Torvalds 已提交
966
		dev_priv->ring_rptr->handle =
D
Dave Airlie 已提交
967 968 969 970 971 972 973 974 975 976
		    (void *)dev_priv->ring_rptr->offset;
		dev->agp_buffer_map->handle =
		    (void *)dev->agp_buffer_map->offset;

		DRM_DEBUG("dev_priv->cp_ring->handle %p\n",
			  dev_priv->cp_ring->handle);
		DRM_DEBUG("dev_priv->ring_rptr->handle %p\n",
			  dev_priv->ring_rptr->handle);
		DRM_DEBUG("dev->agp_buffer_map->handle %p\n",
			  dev->agp_buffer_map->handle);
L
Linus Torvalds 已提交
977 978
	}

D
Dave Airlie 已提交
979
	dev_priv->fb_location = (radeon_read_fb_location(dev_priv) & 0xffff) << 16;
D
Dave Airlie 已提交
980
	dev_priv->fb_size =
D
Dave Airlie 已提交
981
		((radeon_read_fb_location(dev_priv) & 0xffff0000u) + 0x10000)
982
		- dev_priv->fb_location;
L
Linus Torvalds 已提交
983

D
Dave Airlie 已提交
984 985 986
	dev_priv->front_pitch_offset = (((dev_priv->front_pitch / 64) << 22) |
					((dev_priv->front_offset
					  + dev_priv->fb_location) >> 10));
L
Linus Torvalds 已提交
987

D
Dave Airlie 已提交
988 989 990
	dev_priv->back_pitch_offset = (((dev_priv->back_pitch / 64) << 22) |
				       ((dev_priv->back_offset
					 + dev_priv->fb_location) >> 10));
L
Linus Torvalds 已提交
991

D
Dave Airlie 已提交
992 993 994
	dev_priv->depth_pitch_offset = (((dev_priv->depth_pitch / 64) << 22) |
					((dev_priv->depth_offset
					  + dev_priv->fb_location) >> 10));
L
Linus Torvalds 已提交
995 996

	dev_priv->gart_size = init->gart_size;
997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008

	/* New let's set the memory map ... */
	if (dev_priv->new_memmap) {
		u32 base = 0;

		DRM_INFO("Setting GART location based on new memory map\n");

		/* If using AGP, try to locate the AGP aperture at the same
		 * location in the card and on the bus, though we have to
		 * align it down.
		 */
#if __OS_HAS_AGP
1009
		if (dev_priv->flags & RADEON_IS_AGP) {
1010 1011
			base = dev->agp->base;
			/* Check if valid */
1012 1013
			if ((base + dev_priv->gart_size - 1) >= dev_priv->fb_location &&
			    base < (dev_priv->fb_location + dev_priv->fb_size - 1)) {
1014 1015 1016 1017 1018 1019 1020 1021 1022
				DRM_INFO("Can't use AGP base @0x%08lx, won't fit\n",
					 dev->agp->base);
				base = 0;
			}
		}
#endif
		/* If not or if AGP is at 0 (Macs), try to put it elsewhere */
		if (base == 0) {
			base = dev_priv->fb_location + dev_priv->fb_size;
1023 1024
			if (base < dev_priv->fb_location ||
			    ((base + dev_priv->gart_size) & 0xfffffffful) < base)
1025 1026
				base = dev_priv->fb_location
					- dev_priv->gart_size;
D
Dave Airlie 已提交
1027
		}
1028 1029 1030 1031 1032 1033 1034 1035 1036
		dev_priv->gart_vm_start = base & 0xffc00000u;
		if (dev_priv->gart_vm_start != base)
			DRM_INFO("GART aligned down from 0x%08x to 0x%08x\n",
				 base, dev_priv->gart_vm_start);
	} else {
		DRM_INFO("Setting GART location based on old memory map\n");
		dev_priv->gart_vm_start = dev_priv->fb_location +
			RADEON_READ(RADEON_CONFIG_APER_SIZE);
	}
L
Linus Torvalds 已提交
1037 1038

#if __OS_HAS_AGP
1039
	if (dev_priv->flags & RADEON_IS_AGP)
L
Linus Torvalds 已提交
1040
		dev_priv->gart_buffers_offset = (dev->agp_buffer_map->offset
D
Dave Airlie 已提交
1041 1042
						 - dev->agp->base
						 + dev_priv->gart_vm_start);
L
Linus Torvalds 已提交
1043 1044 1045
	else
#endif
		dev_priv->gart_buffers_offset = (dev->agp_buffer_map->offset
1046 1047
					- (unsigned long)dev->sg->virtual
					+ dev_priv->gart_vm_start);
L
Linus Torvalds 已提交
1048

D
Dave Airlie 已提交
1049 1050 1051 1052
	DRM_DEBUG("dev_priv->gart_size %d\n", dev_priv->gart_size);
	DRM_DEBUG("dev_priv->gart_vm_start 0x%x\n", dev_priv->gart_vm_start);
	DRM_DEBUG("dev_priv->gart_buffers_offset 0x%lx\n",
		  dev_priv->gart_buffers_offset);
L
Linus Torvalds 已提交
1053

D
Dave Airlie 已提交
1054 1055
	dev_priv->ring.start = (u32 *) dev_priv->cp_ring->handle;
	dev_priv->ring.end = ((u32 *) dev_priv->cp_ring->handle
L
Linus Torvalds 已提交
1056 1057
			      + init->ring_size / sizeof(u32));
	dev_priv->ring.size = init->ring_size;
D
Dave Airlie 已提交
1058
	dev_priv->ring.size_l2qw = drm_order(init->ring_size / 8);
L
Linus Torvalds 已提交
1059

1060 1061 1062 1063 1064
	dev_priv->ring.rptr_update = /* init->rptr_update */ 4096;
	dev_priv->ring.rptr_update_l2qw = drm_order( /* init->rptr_update */ 4096 / 8);

	dev_priv->ring.fetch_size = /* init->fetch_size */ 32;
	dev_priv->ring.fetch_size_l2ow = drm_order( /* init->fetch_size */ 32 / 16);
D
Dave Airlie 已提交
1065
	dev_priv->ring.tail_mask = (dev_priv->ring.size / sizeof(u32)) - 1;
L
Linus Torvalds 已提交
1066 1067 1068 1069

	dev_priv->ring.high_mark = RADEON_RING_HIGH_MARK;

#if __OS_HAS_AGP
1070
	if (dev_priv->flags & RADEON_IS_AGP) {
L
Linus Torvalds 已提交
1071
		/* Turn off PCI GART */
D
Dave Airlie 已提交
1072
		radeon_set_pcigart(dev_priv, 0);
L
Linus Torvalds 已提交
1073 1074 1075
	} else
#endif
	{
1076
		dev_priv->gart_info.table_mask = DMA_BIT_MASK(32);
1077
		/* if we have an offset set from userspace */
1078
		if (dev_priv->pcigart_offset_set) {
D
Dave Airlie 已提交
1079 1080
			dev_priv->gart_info.bus_addr =
			    dev_priv->pcigart_offset + dev_priv->fb_location;
1081
			dev_priv->gart_info.mapping.offset =
1082
			    dev_priv->pcigart_offset + dev_priv->fb_aper_offset;
1083
			dev_priv->gart_info.mapping.size =
1084
			    dev_priv->gart_info.table_size;
1085 1086

			drm_core_ioremap(&dev_priv->gart_info.mapping, dev);
D
Dave Airlie 已提交
1087
			dev_priv->gart_info.addr =
1088
			    dev_priv->gart_info.mapping.handle;
D
Dave Airlie 已提交
1089

1090 1091 1092 1093
			if (dev_priv->flags & RADEON_IS_PCIE)
				dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_PCIE;
			else
				dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_PCI;
D
Dave Airlie 已提交
1094 1095 1096
			dev_priv->gart_info.gart_table_location =
			    DRM_ATI_GART_FB;

1097
			DRM_DEBUG("Setting phys_pci_gart to %p %08lX\n",
D
Dave Airlie 已提交
1098 1099 1100
				  dev_priv->gart_info.addr,
				  dev_priv->pcigart_offset);
		} else {
1101 1102 1103 1104
			if (dev_priv->flags & RADEON_IS_IGPGART)
				dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_IGP;
			else
				dev_priv->gart_info.gart_reg_if = DRM_ATI_GART_PCI;
D
Dave Airlie 已提交
1105 1106
			dev_priv->gart_info.gart_table_location =
			    DRM_ATI_GART_MAIN;
1107 1108
			dev_priv->gart_info.addr = NULL;
			dev_priv->gart_info.bus_addr = 0;
1109
			if (dev_priv->flags & RADEON_IS_PCIE) {
D
Dave Airlie 已提交
1110 1111
				DRM_ERROR
				    ("Cannot use PCI Express without GART in FB memory\n");
1112
				radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
1113
				return -EINVAL;
1114 1115 1116 1117
			}
		}

		if (!drm_ati_pcigart_init(dev, &dev_priv->gart_info)) {
D
Dave Airlie 已提交
1118
			DRM_ERROR("failed to init PCI GART!\n");
L
Linus Torvalds 已提交
1119
			radeon_do_cleanup_cp(dev);
E
Eric Anholt 已提交
1120
			return -ENOMEM;
L
Linus Torvalds 已提交
1121 1122 1123
		}

		/* Turn on PCI GART */
D
Dave Airlie 已提交
1124
		radeon_set_pcigart(dev_priv, 1);
L
Linus Torvalds 已提交
1125 1126
	}

D
Dave Airlie 已提交
1127 1128
	radeon_cp_load_microcode(dev_priv);
	radeon_cp_init_ring_buffer(dev, dev_priv);
L
Linus Torvalds 已提交
1129 1130 1131

	dev_priv->last_buf = 0;

D
Dave Airlie 已提交
1132
	radeon_do_engine_reset(dev);
1133
	radeon_test_writeback(dev_priv);
L
Linus Torvalds 已提交
1134 1135 1136 1137

	return 0;
}

1138
static int radeon_do_cleanup_cp(struct drm_device * dev)
L
Linus Torvalds 已提交
1139 1140
{
	drm_radeon_private_t *dev_priv = dev->dev_private;
D
Dave Airlie 已提交
1141
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
1142 1143 1144 1145 1146

	/* Make sure interrupts are disabled here because the uninstall ioctl
	 * may not have been called from userspace and after dev_private
	 * is freed, it's too late.
	 */
D
Dave Airlie 已提交
1147 1148
	if (dev->irq_enabled)
		drm_irq_uninstall(dev);
L
Linus Torvalds 已提交
1149 1150

#if __OS_HAS_AGP
1151
	if (dev_priv->flags & RADEON_IS_AGP) {
1152
		if (dev_priv->cp_ring != NULL) {
D
Dave Airlie 已提交
1153
			drm_core_ioremapfree(dev_priv->cp_ring, dev);
1154 1155 1156
			dev_priv->cp_ring = NULL;
		}
		if (dev_priv->ring_rptr != NULL) {
D
Dave Airlie 已提交
1157
			drm_core_ioremapfree(dev_priv->ring_rptr, dev);
1158 1159
			dev_priv->ring_rptr = NULL;
		}
D
Dave Airlie 已提交
1160 1161
		if (dev->agp_buffer_map != NULL) {
			drm_core_ioremapfree(dev->agp_buffer_map, dev);
L
Linus Torvalds 已提交
1162 1163 1164 1165 1166
			dev->agp_buffer_map = NULL;
		}
	} else
#endif
	{
1167 1168 1169 1170

		if (dev_priv->gart_info.bus_addr) {
			/* Turn off PCI GART */
			radeon_set_pcigart(dev_priv, 0);
1171 1172
			if (!drm_ati_pcigart_cleanup(dev, &dev_priv->gart_info))
				DRM_ERROR("failed to cleanup PCI GART!\n");
1173
		}
D
Dave Airlie 已提交
1174

1175 1176
		if (dev_priv->gart_info.gart_table_location == DRM_ATI_GART_FB)
		{
1177
			drm_core_ioremapfree(&dev_priv->gart_info.mapping, dev);
1178
			dev_priv->gart_info.addr = 0;
1179
		}
L
Linus Torvalds 已提交
1180 1181 1182 1183 1184 1185 1186
	}
	/* only clear to the start of flags */
	memset(dev_priv, 0, offsetof(drm_radeon_private_t, flags));

	return 0;
}

D
Dave Airlie 已提交
1187 1188
/* This code will reinit the Radeon CP hardware after a resume from disc.
 * AFAIK, it would be very difficult to pickle the state at suspend time, so
L
Linus Torvalds 已提交
1189 1190 1191 1192 1193
 * here we make sure that all Radeon hardware initialisation is re-done without
 * affecting running applications.
 *
 * Charl P. Botha <http://cpbotha.net>
 */
1194
static int radeon_do_resume_cp(struct drm_device * dev)
L
Linus Torvalds 已提交
1195 1196 1197
{
	drm_radeon_private_t *dev_priv = dev->dev_private;

D
Dave Airlie 已提交
1198 1199
	if (!dev_priv) {
		DRM_ERROR("Called with no initialization\n");
E
Eric Anholt 已提交
1200
		return -EINVAL;
L
Linus Torvalds 已提交
1201 1202 1203 1204 1205
	}

	DRM_DEBUG("Starting radeon_do_resume_cp()\n");

#if __OS_HAS_AGP
1206
	if (dev_priv->flags & RADEON_IS_AGP) {
L
Linus Torvalds 已提交
1207
		/* Turn off PCI GART */
D
Dave Airlie 已提交
1208
		radeon_set_pcigart(dev_priv, 0);
L
Linus Torvalds 已提交
1209 1210 1211 1212
	} else
#endif
	{
		/* Turn on PCI GART */
D
Dave Airlie 已提交
1213
		radeon_set_pcigart(dev_priv, 1);
L
Linus Torvalds 已提交
1214 1215
	}

D
Dave Airlie 已提交
1216 1217
	radeon_cp_load_microcode(dev_priv);
	radeon_cp_init_ring_buffer(dev, dev_priv);
L
Linus Torvalds 已提交
1218

D
Dave Airlie 已提交
1219
	radeon_do_engine_reset(dev);
L
Linus Torvalds 已提交
1220 1221 1222 1223 1224 1225

	DRM_DEBUG("radeon_do_resume_cp() complete\n");

	return 0;
}

1226
int radeon_cp_init(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1227
{
1228
	drm_radeon_init_t *init = data;
L
Linus Torvalds 已提交
1229

1230
	LOCK_TEST_WITH_RETURN(dev, file_priv);
L
Linus Torvalds 已提交
1231

1232
	if (init->func == RADEON_INIT_R300_CP)
D
Dave Airlie 已提交
1233
		r300_init_reg_flags(dev);
D
Dave Airlie 已提交
1234

1235
	switch (init->func) {
L
Linus Torvalds 已提交
1236 1237 1238
	case RADEON_INIT_CP:
	case RADEON_INIT_R200_CP:
	case RADEON_INIT_R300_CP:
1239
		return radeon_do_init_cp(dev, init);
L
Linus Torvalds 已提交
1240
	case RADEON_CLEANUP_CP:
D
Dave Airlie 已提交
1241
		return radeon_do_cleanup_cp(dev);
L
Linus Torvalds 已提交
1242 1243
	}

E
Eric Anholt 已提交
1244
	return -EINVAL;
L
Linus Torvalds 已提交
1245 1246
}

1247
int radeon_cp_start(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1248 1249
{
	drm_radeon_private_t *dev_priv = dev->dev_private;
D
Dave Airlie 已提交
1250
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
1251

1252
	LOCK_TEST_WITH_RETURN(dev, file_priv);
L
Linus Torvalds 已提交
1253

D
Dave Airlie 已提交
1254
	if (dev_priv->cp_running) {
1255
		DRM_DEBUG("while CP running\n");
L
Linus Torvalds 已提交
1256 1257
		return 0;
	}
D
Dave Airlie 已提交
1258
	if (dev_priv->cp_mode == RADEON_CSQ_PRIDIS_INDDIS) {
1259 1260
		DRM_DEBUG("called with bogus CP mode (%d)\n",
			  dev_priv->cp_mode);
L
Linus Torvalds 已提交
1261 1262 1263
		return 0;
	}

D
Dave Airlie 已提交
1264
	radeon_do_cp_start(dev_priv);
L
Linus Torvalds 已提交
1265 1266 1267 1268 1269 1270 1271

	return 0;
}

/* Stop the CP.  The engine must have been idled before calling this
 * routine.
 */
1272
int radeon_cp_stop(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1273 1274
{
	drm_radeon_private_t *dev_priv = dev->dev_private;
1275
	drm_radeon_cp_stop_t *stop = data;
L
Linus Torvalds 已提交
1276
	int ret;
D
Dave Airlie 已提交
1277
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
1278

1279
	LOCK_TEST_WITH_RETURN(dev, file_priv);
L
Linus Torvalds 已提交
1280 1281 1282 1283 1284 1285 1286

	if (!dev_priv->cp_running)
		return 0;

	/* Flush any pending CP commands.  This ensures any outstanding
	 * commands are exectuted by the engine before we turn it off.
	 */
1287
	if (stop->flush) {
D
Dave Airlie 已提交
1288
		radeon_do_cp_flush(dev_priv);
L
Linus Torvalds 已提交
1289 1290 1291 1292 1293
	}

	/* If we fail to make the engine go idle, we return an error
	 * code so that the DRM ioctl wrapper can try again.
	 */
1294
	if (stop->idle) {
D
Dave Airlie 已提交
1295 1296 1297
		ret = radeon_do_cp_idle(dev_priv);
		if (ret)
			return ret;
L
Linus Torvalds 已提交
1298 1299 1300 1301 1302 1303
	}

	/* Finally, we can turn off the CP.  If the engine isn't idle,
	 * we will get some dropped triangles as they won't be fully
	 * rendered before the CP is shut down.
	 */
D
Dave Airlie 已提交
1304
	radeon_do_cp_stop(dev_priv);
L
Linus Torvalds 已提交
1305 1306

	/* Reset the engine */
D
Dave Airlie 已提交
1307
	radeon_do_engine_reset(dev);
L
Linus Torvalds 已提交
1308 1309 1310 1311

	return 0;
}

1312
void radeon_do_release(struct drm_device * dev)
L
Linus Torvalds 已提交
1313 1314 1315 1316 1317 1318 1319
{
	drm_radeon_private_t *dev_priv = dev->dev_private;
	int i, ret;

	if (dev_priv) {
		if (dev_priv->cp_running) {
			/* Stop the cp */
D
Dave Airlie 已提交
1320
			while ((ret = radeon_do_cp_idle(dev_priv)) != 0) {
L
Linus Torvalds 已提交
1321 1322 1323 1324 1325 1326 1327
				DRM_DEBUG("radeon_do_cp_idle %d\n", ret);
#ifdef __linux__
				schedule();
#else
				tsleep(&ret, PZERO, "rdnrel", 1);
#endif
			}
D
Dave Airlie 已提交
1328 1329
			radeon_do_cp_stop(dev_priv);
			radeon_do_engine_reset(dev);
L
Linus Torvalds 已提交
1330 1331 1332 1333
		}

		/* Disable *all* interrupts */
		if (dev_priv->mmio)	/* remove this after permanent addmaps */
D
Dave Airlie 已提交
1334
			RADEON_WRITE(RADEON_GEN_INT_CNTL, 0);
L
Linus Torvalds 已提交
1335

D
Dave Airlie 已提交
1336
		if (dev_priv->mmio) {	/* remove all surfaces */
L
Linus Torvalds 已提交
1337
			for (i = 0; i < RADEON_MAX_SURFACES; i++) {
D
Dave Airlie 已提交
1338 1339 1340 1341 1342
				RADEON_WRITE(RADEON_SURFACE0_INFO + 16 * i, 0);
				RADEON_WRITE(RADEON_SURFACE0_LOWER_BOUND +
					     16 * i, 0);
				RADEON_WRITE(RADEON_SURFACE0_UPPER_BOUND +
					     16 * i, 0);
L
Linus Torvalds 已提交
1343 1344 1345 1346
			}
		}

		/* Free memory heap structures */
D
Dave Airlie 已提交
1347 1348
		radeon_mem_takedown(&(dev_priv->gart_heap));
		radeon_mem_takedown(&(dev_priv->fb_heap));
L
Linus Torvalds 已提交
1349 1350

		/* deallocate kernel resources */
D
Dave Airlie 已提交
1351
		radeon_do_cleanup_cp(dev);
L
Linus Torvalds 已提交
1352 1353 1354 1355 1356
	}
}

/* Just reset the CP ring.  Called as part of an X Server engine reset.
 */
1357
int radeon_cp_reset(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1358 1359
{
	drm_radeon_private_t *dev_priv = dev->dev_private;
D
Dave Airlie 已提交
1360
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
1361

1362
	LOCK_TEST_WITH_RETURN(dev, file_priv);
L
Linus Torvalds 已提交
1363

D
Dave Airlie 已提交
1364
	if (!dev_priv) {
1365
		DRM_DEBUG("called before init done\n");
E
Eric Anholt 已提交
1366
		return -EINVAL;
L
Linus Torvalds 已提交
1367 1368
	}

D
Dave Airlie 已提交
1369
	radeon_do_cp_reset(dev_priv);
L
Linus Torvalds 已提交
1370 1371 1372 1373 1374 1375 1376

	/* The CP is no longer running after an engine reset */
	dev_priv->cp_running = 0;

	return 0;
}

1377
int radeon_cp_idle(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1378 1379
{
	drm_radeon_private_t *dev_priv = dev->dev_private;
D
Dave Airlie 已提交
1380
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
1381

1382
	LOCK_TEST_WITH_RETURN(dev, file_priv);
L
Linus Torvalds 已提交
1383

D
Dave Airlie 已提交
1384
	return radeon_do_cp_idle(dev_priv);
L
Linus Torvalds 已提交
1385 1386 1387 1388
}

/* Added by Charl P. Botha to call radeon_do_resume_cp().
 */
1389
int radeon_cp_resume(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1390 1391 1392 1393 1394
{

	return radeon_do_resume_cp(dev);
}

1395
int radeon_engine_reset(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1396
{
D
Dave Airlie 已提交
1397
	DRM_DEBUG("\n");
L
Linus Torvalds 已提交
1398

1399
	LOCK_TEST_WITH_RETURN(dev, file_priv);
L
Linus Torvalds 已提交
1400

D
Dave Airlie 已提交
1401
	return radeon_do_engine_reset(dev);
L
Linus Torvalds 已提交
1402 1403 1404 1405 1406 1407 1408 1409
}

/* ================================================================
 * Fullscreen mode
 */

/* KW: Deprecated to say the least:
 */
1410
int radeon_fullscreen(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422
{
	return 0;
}

/* ================================================================
 * Freelist management
 */

/* Original comment: FIXME: ROTATE_BUFS is a hack to cycle through
 *   bufs until freelist code is used.  Note this hides a problem with
 *   the scratch register * (used to keep track of last buffer
 *   completed) being written to before * the last buffer has actually
D
Dave Airlie 已提交
1423
 *   completed rendering.
L
Linus Torvalds 已提交
1424 1425 1426 1427 1428 1429
 *
 * KW:  It's also a good way to find free buffers quickly.
 *
 * KW: Ideally this loop wouldn't exist, and freelist_get wouldn't
 * sleep.  However, bugs in older versions of radeon_accel.c mean that
 * we essentially have to do this, else old clients will break.
D
Dave Airlie 已提交
1430
 *
L
Linus Torvalds 已提交
1431 1432
 * However, it does leave open a potential deadlock where all the
 * buffers are held by other clients, which can't release them because
D
Dave Airlie 已提交
1433
 * they can't get the lock.
L
Linus Torvalds 已提交
1434 1435
 */

D
Dave Airlie 已提交
1436
struct drm_buf *radeon_freelist_get(struct drm_device * dev)
L
Linus Torvalds 已提交
1437
{
1438
	struct drm_device_dma *dma = dev->dma;
L
Linus Torvalds 已提交
1439 1440
	drm_radeon_private_t *dev_priv = dev->dev_private;
	drm_radeon_buf_priv_t *buf_priv;
D
Dave Airlie 已提交
1441
	struct drm_buf *buf;
L
Linus Torvalds 已提交
1442 1443 1444
	int i, t;
	int start;

D
Dave Airlie 已提交
1445
	if (++dev_priv->last_buf >= dma->buf_count)
L
Linus Torvalds 已提交
1446 1447 1448 1449
		dev_priv->last_buf = 0;

	start = dev_priv->last_buf;

D
Dave Airlie 已提交
1450 1451 1452 1453
	for (t = 0; t < dev_priv->usec_timeout; t++) {
		u32 done_age = GET_SCRATCH(1);
		DRM_DEBUG("done_age = %d\n", done_age);
		for (i = start; i < dma->buf_count; i++) {
L
Linus Torvalds 已提交
1454 1455
			buf = dma->buflist[i];
			buf_priv = buf->dev_private;
1456 1457 1458
			if (buf->file_priv == NULL || (buf->pending &&
						       buf_priv->age <=
						       done_age)) {
L
Linus Torvalds 已提交
1459 1460 1461 1462 1463 1464 1465 1466
				dev_priv->stats.requested_bufs++;
				buf->pending = 0;
				return buf;
			}
			start = 0;
		}

		if (t) {
D
Dave Airlie 已提交
1467
			DRM_UDELAY(1);
L
Linus Torvalds 已提交
1468 1469 1470 1471
			dev_priv->stats.freelist_loops++;
		}
	}

D
Dave Airlie 已提交
1472
	DRM_DEBUG("returning NULL!\n");
L
Linus Torvalds 已提交
1473 1474
	return NULL;
}
D
Dave Airlie 已提交
1475

L
Linus Torvalds 已提交
1476
#if 0
D
Dave Airlie 已提交
1477
struct drm_buf *radeon_freelist_get(struct drm_device * dev)
L
Linus Torvalds 已提交
1478
{
1479
	struct drm_device_dma *dma = dev->dma;
L
Linus Torvalds 已提交
1480 1481
	drm_radeon_private_t *dev_priv = dev->dev_private;
	drm_radeon_buf_priv_t *buf_priv;
D
Dave Airlie 已提交
1482
	struct drm_buf *buf;
L
Linus Torvalds 已提交
1483 1484 1485 1486
	int i, t;
	int start;
	u32 done_age = DRM_READ32(dev_priv->ring_rptr, RADEON_SCRATCHOFF(1));

D
Dave Airlie 已提交
1487
	if (++dev_priv->last_buf >= dma->buf_count)
L
Linus Torvalds 已提交
1488 1489 1490 1491
		dev_priv->last_buf = 0;

	start = dev_priv->last_buf;
	dev_priv->stats.freelist_loops++;
D
Dave Airlie 已提交
1492 1493 1494

	for (t = 0; t < 2; t++) {
		for (i = start; i < dma->buf_count; i++) {
L
Linus Torvalds 已提交
1495 1496
			buf = dma->buflist[i];
			buf_priv = buf->dev_private;
1497 1498 1499
			if (buf->file_priv == 0 || (buf->pending &&
						    buf_priv->age <=
						    done_age)) {
L
Linus Torvalds 已提交
1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511
				dev_priv->stats.requested_bufs++;
				buf->pending = 0;
				return buf;
			}
		}
		start = 0;
	}

	return NULL;
}
#endif

1512
void radeon_freelist_reset(struct drm_device * dev)
L
Linus Torvalds 已提交
1513
{
1514
	struct drm_device_dma *dma = dev->dma;
L
Linus Torvalds 已提交
1515 1516 1517 1518
	drm_radeon_private_t *dev_priv = dev->dev_private;
	int i;

	dev_priv->last_buf = 0;
D
Dave Airlie 已提交
1519
	for (i = 0; i < dma->buf_count; i++) {
D
Dave Airlie 已提交
1520
		struct drm_buf *buf = dma->buflist[i];
L
Linus Torvalds 已提交
1521 1522 1523 1524 1525 1526 1527 1528 1529
		drm_radeon_buf_priv_t *buf_priv = buf->dev_private;
		buf_priv->age = 0;
	}
}

/* ================================================================
 * CP command submission
 */

D
Dave Airlie 已提交
1530
int radeon_wait_ring(drm_radeon_private_t * dev_priv, int n)
L
Linus Torvalds 已提交
1531 1532 1533
{
	drm_radeon_ring_buffer_t *ring = &dev_priv->ring;
	int i;
D
Dave Airlie 已提交
1534
	u32 last_head = GET_RING_HEAD(dev_priv);
L
Linus Torvalds 已提交
1535

D
Dave Airlie 已提交
1536 1537
	for (i = 0; i < dev_priv->usec_timeout; i++) {
		u32 head = GET_RING_HEAD(dev_priv);
L
Linus Torvalds 已提交
1538 1539

		ring->space = (head - ring->tail) * sizeof(u32);
D
Dave Airlie 已提交
1540
		if (ring->space <= 0)
L
Linus Torvalds 已提交
1541
			ring->space += ring->size;
D
Dave Airlie 已提交
1542
		if (ring->space > n)
L
Linus Torvalds 已提交
1543
			return 0;
D
Dave Airlie 已提交
1544

L
Linus Torvalds 已提交
1545 1546 1547 1548 1549 1550
		dev_priv->stats.boxes |= RADEON_BOX_WAIT_IDLE;

		if (head != last_head)
			i = 0;
		last_head = head;

D
Dave Airlie 已提交
1551
		DRM_UDELAY(1);
L
Linus Torvalds 已提交
1552 1553 1554 1555
	}

	/* FIXME: This return value is ignored in the BEGIN_RING macro! */
#if RADEON_FIFO_DEBUG
D
Dave Airlie 已提交
1556 1557
	radeon_status(dev_priv);
	DRM_ERROR("failed!\n");
L
Linus Torvalds 已提交
1558
#endif
E
Eric Anholt 已提交
1559
	return -EBUSY;
L
Linus Torvalds 已提交
1560 1561
}

1562 1563
static int radeon_cp_get_buffers(struct drm_device *dev,
				 struct drm_file *file_priv,
1564
				 struct drm_dma * d)
L
Linus Torvalds 已提交
1565 1566
{
	int i;
D
Dave Airlie 已提交
1567
	struct drm_buf *buf;
L
Linus Torvalds 已提交
1568

D
Dave Airlie 已提交
1569 1570 1571
	for (i = d->granted_count; i < d->request_count; i++) {
		buf = radeon_freelist_get(dev);
		if (!buf)
E
Eric Anholt 已提交
1572
			return -EBUSY;	/* NOTE: broken client */
L
Linus Torvalds 已提交
1573

1574
		buf->file_priv = file_priv;
L
Linus Torvalds 已提交
1575

D
Dave Airlie 已提交
1576 1577
		if (DRM_COPY_TO_USER(&d->request_indices[i], &buf->idx,
				     sizeof(buf->idx)))
E
Eric Anholt 已提交
1578
			return -EFAULT;
D
Dave Airlie 已提交
1579 1580
		if (DRM_COPY_TO_USER(&d->request_sizes[i], &buf->total,
				     sizeof(buf->total)))
E
Eric Anholt 已提交
1581
			return -EFAULT;
L
Linus Torvalds 已提交
1582 1583 1584 1585 1586 1587

		d->granted_count++;
	}
	return 0;
}

1588
int radeon_cp_buffers(struct drm_device *dev, void *data, struct drm_file *file_priv)
L
Linus Torvalds 已提交
1589
{
1590
	struct drm_device_dma *dma = dev->dma;
L
Linus Torvalds 已提交
1591
	int ret = 0;
1592
	struct drm_dma *d = data;
L
Linus Torvalds 已提交
1593

1594
	LOCK_TEST_WITH_RETURN(dev, file_priv);
L
Linus Torvalds 已提交
1595 1596 1597

	/* Please don't send us buffers.
	 */
1598
	if (d->send_count != 0) {
D
Dave Airlie 已提交
1599
		DRM_ERROR("Process %d trying to send %d buffers via drmDMA\n",
1600
			  DRM_CURRENTPID, d->send_count);
E
Eric Anholt 已提交
1601
		return -EINVAL;
L
Linus Torvalds 已提交
1602 1603 1604 1605
	}

	/* We'll send you buffers.
	 */
1606
	if (d->request_count < 0 || d->request_count > dma->buf_count) {
D
Dave Airlie 已提交
1607
		DRM_ERROR("Process %d trying to get %d buffers (of %d max)\n",
1608
			  DRM_CURRENTPID, d->request_count, dma->buf_count);
E
Eric Anholt 已提交
1609
		return -EINVAL;
L
Linus Torvalds 已提交
1610 1611
	}

1612
	d->granted_count = 0;
L
Linus Torvalds 已提交
1613

1614 1615
	if (d->request_count) {
		ret = radeon_cp_get_buffers(dev, file_priv, d);
L
Linus Torvalds 已提交
1616 1617 1618 1619 1620
	}

	return ret;
}

1621
int radeon_driver_load(struct drm_device *dev, unsigned long flags)
L
Linus Torvalds 已提交
1622 1623 1624 1625 1626 1627
{
	drm_radeon_private_t *dev_priv;
	int ret = 0;

	dev_priv = drm_alloc(sizeof(drm_radeon_private_t), DRM_MEM_DRIVER);
	if (dev_priv == NULL)
E
Eric Anholt 已提交
1628
		return -ENOMEM;
L
Linus Torvalds 已提交
1629 1630 1631 1632 1633

	memset(dev_priv, 0, sizeof(drm_radeon_private_t));
	dev->dev_private = (void *)dev_priv;
	dev_priv->flags = flags;

1634
	switch (flags & RADEON_FAMILY_MASK) {
L
Linus Torvalds 已提交
1635 1636 1637 1638
	case CHIP_R100:
	case CHIP_RV200:
	case CHIP_R200:
	case CHIP_R300:
1639
	case CHIP_R350:
D
Dave Airlie 已提交
1640
	case CHIP_R420:
1641
	case CHIP_RV410:
D
Dave Airlie 已提交
1642 1643 1644 1645
	case CHIP_RV515:
	case CHIP_R520:
	case CHIP_RV570:
	case CHIP_R580:
1646
		dev_priv->flags |= RADEON_HAS_HIERZ;
L
Linus Torvalds 已提交
1647 1648
		break;
	default:
D
Dave Airlie 已提交
1649
		/* all other chips have no hierarchical z buffer */
L
Linus Torvalds 已提交
1650 1651
		break;
	}
D
Dave Airlie 已提交
1652 1653

	if (drm_device_is_agp(dev))
1654
		dev_priv->flags |= RADEON_IS_AGP;
1655
	else if (drm_device_is_pcie(dev))
1656
		dev_priv->flags |= RADEON_IS_PCIE;
1657
	else
1658
		dev_priv->flags |= RADEON_IS_PCI;
1659

D
Dave Airlie 已提交
1660
	DRM_DEBUG("%s card detected\n",
1661
		  ((dev_priv->flags & RADEON_IS_AGP) ? "AGP" : (((dev_priv->flags & RADEON_IS_PCIE) ? "PCIE" : "PCI"))));
L
Linus Torvalds 已提交
1662 1663 1664
	return ret;
}

1665 1666 1667 1668
/* Create mappings for registers and framebuffer so userland doesn't necessarily
 * have to find them.
 */
int radeon_driver_firstopen(struct drm_device *dev)
D
Dave Airlie 已提交
1669 1670 1671 1672 1673
{
	int ret;
	drm_local_map_t *map;
	drm_radeon_private_t *dev_priv = dev->dev_private;

1674 1675
	dev_priv->gart_info.table_size = RADEON_PCIGART_TABLE_SIZE;

D
Dave Airlie 已提交
1676 1677 1678 1679 1680 1681
	ret = drm_addmap(dev, drm_get_resource_start(dev, 2),
			 drm_get_resource_len(dev, 2), _DRM_REGISTERS,
			 _DRM_READ_ONLY, &dev_priv->mmio);
	if (ret != 0)
		return ret;

1682 1683
	dev_priv->fb_aper_offset = drm_get_resource_start(dev, 0);
	ret = drm_addmap(dev, dev_priv->fb_aper_offset,
D
Dave Airlie 已提交
1684 1685 1686 1687 1688 1689 1690 1691
			 drm_get_resource_len(dev, 0), _DRM_FRAME_BUFFER,
			 _DRM_WRITE_COMBINING, &map);
	if (ret != 0)
		return ret;

	return 0;
}

1692
int radeon_driver_unload(struct drm_device *dev)
L
Linus Torvalds 已提交
1693 1694 1695 1696 1697 1698 1699 1700 1701
{
	drm_radeon_private_t *dev_priv = dev->dev_private;

	DRM_DEBUG("\n");
	drm_free(dev_priv, sizeof(*dev_priv), DRM_MEM_DRIVER);

	dev->dev_private = NULL;
	return 0;
}