amd.c 8.9 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5
#include <linux/init.h>
#include <linux/bitops.h>
#include <linux/mm.h>
#include <asm/io.h>
#include <asm/processor.h>
6
#include <asm/apic.h>
7
#include <asm/mach_apic.h>
L
Linus Torvalds 已提交
8 9 10 11 12 13 14 15 16 17 18 19 20 21 22

#include "cpu.h"

/*
 *	B step AMD K6 before B 9730xxxx have hardware bugs that can cause
 *	misexecution of code under Linux. Owners of such processors should
 *	contact AMD for precise details and a CPU swap.
 *
 *	See	http://www.multimania.com/poulot/k6bug.html
 *		http://www.amd.com/K6/k6docs/revgd.html
 *
 *	The following test is erm.. interesting. AMD neglected to up
 *	the chip setting when fixing the bug but they also tweaked some
 *	performance at the same time..
 */
23

L
Linus Torvalds 已提交
24 25 26
extern void vide(void);
__asm__(".align 4\nvide: ret");

27
#ifdef CONFIG_X86_LOCAL_APIC
28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
#define ENABLE_C1E_MASK         0x18000000
#define CPUID_PROCESSOR_SIGNATURE       1
#define CPUID_XFAM              0x0ff00000
#define CPUID_XFAM_K8           0x00000000
#define CPUID_XFAM_10H          0x00100000
#define CPUID_XFAM_11H          0x00200000
#define CPUID_XMOD              0x000f0000
#define CPUID_XMOD_REV_F        0x00040000

/* AMD systems with C1E don't have a working lAPIC timer. Check for that. */
static __cpuinit int amd_apic_timer_broken(void)
{
	u32 lo, hi;
	u32 eax = cpuid_eax(CPUID_PROCESSOR_SIGNATURE);
	switch (eax & CPUID_XFAM) {
	case CPUID_XFAM_K8:
		if ((eax & CPUID_XMOD) < CPUID_XMOD_REV_F)
			break;
	case CPUID_XFAM_10H:
	case CPUID_XFAM_11H:
		rdmsr(MSR_K8_ENABLE_C1E, lo, hi);
49 50 51 52
		if (lo & ENABLE_C1E_MASK) {
			if (smp_processor_id() != boot_cpu_physical_apicid)
				printk(KERN_INFO "AMD C1E detected late. "
				       "	Force timer broadcast.\n");
53
			return 1;
54 55 56 57
		}
		break;
	default:
		/* err on the side of caution */
58
		return 1;
59
	}
60 61
	return 0;
}
62
#endif
63

64 65
int force_mwait __cpuinitdata;

66
static void __cpuinit early_init_amd(struct cpuinfo_x86 *c)
67 68 69 70 71 72 73 74
{
	if (cpuid_eax(0x80000000) >= 0x80000007) {
		c->x86_power = cpuid_edx(0x80000007);
		if (c->x86_power & (1<<8))
			set_bit(X86_FEATURE_CONSTANT_TSC, c->x86_capability);
	}
}

75
static void __cpuinit init_amd(struct cpuinfo_x86 *c)
L
Linus Torvalds 已提交
76 77 78 79 80
{
	u32 l, h;
	int mbytes = num_physpages >> (20-PAGE_SHIFT);
	int r;

81
#ifdef CONFIG_SMP
82
	unsigned long long value;
83

84 85
	/*
	 * Disable TLB flush filter by setting HWCR.FFDIS on K8
86 87 88 89 90 91 92 93 94 95 96 97
	 * bit 6 of msr C001_0015
	 *
	 * Errata 63 for SH-B3 steppings
	 * Errata 122 for all steppings (F+ have it disabled by default)
	 */
	if (c->x86 == 15) {
		rdmsrl(MSR_K7_HWCR, value);
		value |= 1 << 6;
		wrmsrl(MSR_K7_HWCR, value);
	}
#endif

98 99
	early_init_amd(c);

L
Linus Torvalds 已提交
100 101 102 103 104 105
	/*
	 *	FIXME: We should handle the K5 here. Set up the write
	 *	range and also turn on MSR 83 bits 4 and 31 (write alloc,
	 *	no bus pipeline)
	 */

106 107 108 109
	/*
	 * Bit 31 in normal CPUID used for nonstandard 3DNow ID;
	 * DNow is IDd by bit 31 in extended CPUID (1*32+31) anyway
	 */
L
Linus Torvalds 已提交
110
	clear_bit(0*32+31, c->x86_capability);
111

L
Linus Torvalds 已提交
112 113
	r = get_model_name(c);

114 115
	switch (c->x86) {
	case 4:
L
Linus Torvalds 已提交
116 117 118 119 120 121 122 123 124
		/*
		 * General Systems BIOSen alias the cpu frequency registers
		 * of the Elan at 0x000df000. Unfortuantly, one of the Linux
		 * drivers subsequently pokes it, and changes the CPU speed.
		 * Workaround : Remove the unneeded alias.
		 */
#define CBAR		(0xfffc) /* Configuration Base Address  (32-bit) */
#define CBAR_ENB	(0x80000000)
#define CBAR_KEY	(0X000000CB)
125
			if (c->x86_model == 9 || c->x86_model == 10) {
L
Linus Torvalds 已提交
126 127 128 129
				if (inl (CBAR) & CBAR_ENB)
					outl (0 | CBAR_KEY, CBAR);
			}
			break;
130 131
	case 5:
			if (c->x86_model < 6) {
L
Linus Torvalds 已提交
132
				/* Based on AMD doc 20734R - June 2000 */
133
				if (c->x86_model == 0) {
L
Linus Torvalds 已提交
134 135 136 137 138
					clear_bit(X86_FEATURE_APIC, c->x86_capability);
					set_bit(X86_FEATURE_PGE, c->x86_capability);
				}
				break;
			}
139 140

			if (c->x86_model == 6 && c->x86_mask == 1) {
L
Linus Torvalds 已提交
141 142 143 144
				const int K6_BUG_LOOP = 1000000;
				int n;
				void (*f_vide)(void);
				unsigned long d, d2;
145

L
Linus Torvalds 已提交
146
				printk(KERN_INFO "AMD K6 stepping B detected - ");
147

L
Linus Torvalds 已提交
148
				/*
149
				 * It looks like AMD fixed the 2.6.2 bug and improved indirect
L
Linus Torvalds 已提交
150 151 152 153 154 155
				 * calls at the same time.
				 */

				n = K6_BUG_LOOP;
				f_vide = vide;
				rdtscl(d);
156
				while (n--)
L
Linus Torvalds 已提交
157 158 159
					f_vide();
				rdtscl(d2);
				d = d2-d;
D
Dave Jones 已提交
160

161
				if (d > 20*K6_BUG_LOOP)
L
Linus Torvalds 已提交
162
					printk("system stability may be impaired when more than 32 MB are used.\n");
163
				else
L
Linus Torvalds 已提交
164 165 166 167 168 169
					printk("probably OK (after B9730xxxx).\n");
				printk(KERN_INFO "Please see http://membres.lycos.fr/poulot/k6bug.html\n");
			}

			/* K6 with old style WHCR */
			if (c->x86_model < 8 ||
170
			   (c->x86_model == 8 && c->x86_mask < 8)) {
L
Linus Torvalds 已提交
171
				/* We can only write allocate on the low 508Mb */
172 173
				if (mbytes > 508)
					mbytes = 508;
L
Linus Torvalds 已提交
174 175

				rdmsr(MSR_K6_WHCR, l, h);
176
				if ((l&0x0000FFFF) == 0) {
L
Linus Torvalds 已提交
177
					unsigned long flags;
178
					l = (1<<0)|((mbytes/4)<<1);
L
Linus Torvalds 已提交
179 180 181 182 183 184 185 186 187 188
					local_irq_save(flags);
					wbinvd();
					wrmsr(MSR_K6_WHCR, l, h);
					local_irq_restore(flags);
					printk(KERN_INFO "Enabling old style K6 write allocation for %d Mb\n",
						mbytes);
				}
				break;
			}

189
			if ((c->x86_model == 8 && c->x86_mask > 7) ||
L
Linus Torvalds 已提交
190 191 192
			     c->x86_model == 9 || c->x86_model == 13) {
				/* The more serious chips .. */

193 194
				if (mbytes > 4092)
					mbytes = 4092;
L
Linus Torvalds 已提交
195 196

				rdmsr(MSR_K6_WHCR, l, h);
197
				if ((l&0xFFFF0000) == 0) {
L
Linus Torvalds 已提交
198
					unsigned long flags;
199
					l = ((mbytes>>2)<<22)|(1<<16);
L
Linus Torvalds 已提交
200 201 202 203 204 205 206 207 208 209 210 211 212 213 214
					local_irq_save(flags);
					wbinvd();
					wrmsr(MSR_K6_WHCR, l, h);
					local_irq_restore(flags);
					printk(KERN_INFO "Enabling new style K6 write allocation for %d Mb\n",
						mbytes);
				}

				/*  Set MTRR capability flag if appropriate */
				if (c->x86_model == 13 || c->x86_model == 9 ||
				   (c->x86_model == 8 && c->x86_mask >= 8))
					set_bit(X86_FEATURE_K6_MTRR, c->x86_capability);
				break;
			}

215 216 217 218 219 220
			if (c->x86_model == 10) {
				/* AMD Geode LX is model 10 */
				/* placeholder for any needed mods */
				break;
			}
			break;
221 222 223 224 225
	case 6: /* An Athlon/Duron */

			/*
			 * Bit 15 of Athlon specific MSR 15, needs to be 0
			 * to enable SSE on Palomino/Morgan/Barton CPU's.
L
Linus Torvalds 已提交
226 227 228 229 230 231 232 233 234 235 236 237
			 * If the BIOS didn't enable it already, enable it here.
			 */
			if (c->x86_model >= 6 && c->x86_model <= 10) {
				if (!cpu_has(c, X86_FEATURE_XMM)) {
					printk(KERN_INFO "Enabling disabled K7/SSE Support.\n");
					rdmsr(MSR_K7_HWCR, l, h);
					l &= ~0x00008000;
					wrmsr(MSR_K7_HWCR, l, h);
					set_bit(X86_FEATURE_XMM, c->x86_capability);
				}
			}

238 239
			/*
			 * It's been determined by AMD that Athlons since model 8 stepping 1
L
Linus Torvalds 已提交
240 241 242
			 * are more robust with CLK_CTL set to 200xxxxx instead of 600xxxxx
			 * As per AMD technical note 27212 0.2
			 */
243
			if ((c->x86_model == 8 && c->x86_mask >= 1) || (c->x86_model > 8)) {
L
Linus Torvalds 已提交
244 245 246 247 248 249 250 251 252 253 254 255
				rdmsr(MSR_K7_CLK_CTL, l, h);
				if ((l & 0xfff00000) != 0x20000000) {
					printk ("CPU: CLK_CTL MSR was %x. Reprogramming to %x\n", l,
						((l & 0x000fffff)|0x20000000));
					wrmsr(MSR_K7_CLK_CTL, (l & 0x000fffff)|0x20000000, h);
				}
			}
			break;
	}

	switch (c->x86) {
	case 15:
A
Andi Kleen 已提交
256 257 258
	/* Use K8 tuning for Fam10h and Fam11h */
	case 0x10:
	case 0x11:
L
Linus Torvalds 已提交
259 260 261
		set_bit(X86_FEATURE_K8, c->x86_capability);
		break;
	case 6:
262
		set_bit(X86_FEATURE_K7, c->x86_capability);
L
Linus Torvalds 已提交
263 264
		break;
	}
265 266
	if (c->x86 >= 6)
		set_bit(X86_FEATURE_FXSAVE_LEAK, c->x86_capability);
L
Linus Torvalds 已提交
267 268

	display_cacheinfo(c);
269

270
	if (cpuid_eax(0x80000000) >= 0x80000008)
271
		c->x86_max_cores = (cpuid_ecx(0x80000008) & 0xff) + 1;
272

273
#ifdef CONFIG_X86_HT
274
	/*
275
	 * On a AMD multi core setup the lower bits of the APIC id
S
Simon Arlott 已提交
276
	 * distinguish the cores.
277
	 */
278
	if (c->x86_max_cores > 1) {
279
		int cpu = smp_processor_id();
280 281 282 283 284 285
		unsigned bits = (cpuid_ecx(0x80000008) >> 12) & 0xf;

		if (bits == 0) {
			while ((1 << bits) < c->x86_max_cores)
				bits++;
		}
286 287
		c->cpu_core_id = c->phys_proc_id & ((1<<bits)-1);
		c->phys_proc_id >>= bits;
288
		printk(KERN_INFO "CPU %d(%d) -> Core %d\n",
289
		       cpu, c->x86_max_cores, c->cpu_core_id);
290
	}
L
Linus Torvalds 已提交
291
#endif
292

293 294 295 296 297 298
	if (cpuid_eax(0x80000000) >= 0x80000006) {
		if ((c->x86 == 0x10) && (cpuid_edx(0x80000006) & 0xf000))
			num_cache_leaves = 4;
		else
			num_cache_leaves = 3;
	}
299

300
#ifdef CONFIG_X86_LOCAL_APIC
301
	if (amd_apic_timer_broken())
302 303
		local_apic_timer_disabled = 1;
#endif
304

A
Andi Kleen 已提交
305 306 307
	/* K6s reports MCEs but don't actually have all the MSRs */
	if (c->x86 < 6)
		clear_bit(X86_FEATURE_MCE, c->x86_capability);
308

309
	if (cpu_has_xmm2)
310
		set_bit(X86_FEATURE_MFENCE_RDTSC, c->x86_capability);
L
Linus Torvalds 已提交
311 312
}

313
static unsigned int __cpuinit amd_size_cache(struct cpuinfo_x86 *c, unsigned int size)
L
Linus Torvalds 已提交
314 315 316 317 318 319
{
	/* AMD errata T13 (order #21922) */
	if ((c->x86 == 6)) {
		if (c->x86_model == 3 && c->x86_mask == 0)	/* Duron Rev A0 */
			size = 64;
		if (c->x86_model == 4 &&
320
		    (c->x86_mask == 0 || c->x86_mask == 1))	/* Tbird rev A1/A2 */
L
Linus Torvalds 已提交
321 322 323 324 325
			size = 256;
	}
	return size;
}

326
static struct cpu_dev amd_cpu_dev __cpuinitdata = {
L
Linus Torvalds 已提交
327
	.c_vendor	= "AMD",
328
	.c_ident	= { "AuthenticAMD" },
L
Linus Torvalds 已提交
329 330 331 332 333
	.c_models = {
		{ .vendor = X86_VENDOR_AMD, .family = 4, .model_names =
		  {
			  [3] = "486 DX/2",
			  [7] = "486 DX/2-WB",
334 335
			  [8] = "486 DX/4",
			  [9] = "486 DX/4-WB",
L
Linus Torvalds 已提交
336
			  [14] = "Am5x86-WT",
337
			  [15] = "Am5x86-WB"
L
Linus Torvalds 已提交
338 339 340
		  }
		},
	},
341
	.c_early_init   = early_init_amd,
L
Linus Torvalds 已提交
342 343 344 345 346 347 348 349 350
	.c_init		= init_amd,
	.c_size_cache	= amd_size_cache,
};

int __init amd_init_cpu(void)
{
	cpu_devs[X86_VENDOR_AMD] = &amd_cpu_dev;
	return 0;
}
351 352

cpu_vendor_dev_register(X86_VENDOR_AMD, &amd_cpu_dev);