Merge remote-tracking branch 'origin/x86/boot' into x86/mm2
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / arch / x86 / kernel / cpu / centaur.c
CommitLineData
48f4c485 1#include <linux/bitops.h>
1da177e4
LT
2#include <linux/kernel.h>
3#include <linux/init.h>
edc05e6d 4
1da177e4 5#include <asm/processor.h>
1da177e4 6#include <asm/e820.h>
52f4a91a 7#include <asm/mtrr.h>
48f4c485 8#include <asm/msr.h>
edc05e6d 9
1da177e4
LT
10#include "cpu.h"
11
12#ifdef CONFIG_X86_OOSTORE
13
b4af3f7c 14static u32 __cpuinit power2(u32 x)
1da177e4 15{
29a9994b 16 u32 s = 1;
edc05e6d
IM
17
18 while (s <= x)
29a9994b 19 s <<= 1;
edc05e6d 20
29a9994b 21 return s >>= 1;
1da177e4
LT
22}
23
24
25/*
edc05e6d 26 * Set up an actual MCR
1da177e4 27 */
b4af3f7c 28static void __cpuinit centaur_mcr_insert(int reg, u32 base, u32 size, int key)
1da177e4
LT
29{
30 u32 lo, hi;
29a9994b 31
1da177e4
LT
32 hi = base & ~0xFFF;
33 lo = ~(size-1); /* Size is a power of 2 so this makes a mask */
34 lo &= ~0xFFF; /* Remove the ctrl value bits */
35 lo |= key; /* Attribute we wish to set */
36 wrmsr(reg+MSR_IDT_MCR0, lo, hi);
37 mtrr_centaur_report_mcr(reg, lo, hi); /* Tell the mtrr driver */
38}
39
40/*
edc05e6d 41 * Figure what we can cover with MCR's
1da177e4 42 *
edc05e6d 43 * Shortcut: We know you can't put 4Gig of RAM on a winchip
1da177e4 44 */
edc05e6d 45static u32 __cpuinit ramtop(void)
1da177e4 46{
1da177e4 47 u32 clip = 0xFFFFFFFFUL;
edc05e6d
IM
48 u32 top = 0;
49 int i;
29a9994b 50
1da177e4
LT
51 for (i = 0; i < e820.nr_map; i++) {
52 unsigned long start, end;
53
54 if (e820.map[i].addr > 0xFFFFFFFFUL)
55 continue;
56 /*
edc05e6d
IM
57 * Don't MCR over reserved space. Ignore the ISA hole
58 * we frob around that catastrophe already
1da177e4 59 */
edc05e6d
IM
60 if (e820.map[i].type == E820_RESERVED) {
61 if (e820.map[i].addr >= 0x100000UL &&
62 e820.map[i].addr < clip)
1da177e4
LT
63 clip = e820.map[i].addr;
64 continue;
65 }
66 start = e820.map[i].addr;
67 end = e820.map[i].addr + e820.map[i].size;
68 if (start >= end)
69 continue;
70 if (end > top)
71 top = end;
72 }
edc05e6d
IM
73 /*
74 * Everything below 'top' should be RAM except for the ISA hole.
75 * Because of the limited MCR's we want to map NV/ACPI into our
76 * MCR range for gunk in RAM
77 *
78 * Clip might cause us to MCR insufficient RAM but that is an
79 * acceptable failure mode and should only bite obscure boxes with
80 * a VESA hole at 15Mb
81 *
82 * The second case Clip sometimes kicks in is when the EBDA is marked
83 * as reserved. Again we fail safe with reasonable results
84 */
85 if (top > clip)
29a9994b
PC
86 top = clip;
87
1da177e4
LT
88 return top;
89}
90
91/*
edc05e6d 92 * Compute a set of MCR's to give maximum coverage
1da177e4 93 */
b4af3f7c 94static int __cpuinit centaur_mcr_compute(int nr, int key)
1da177e4
LT
95{
96 u32 mem = ramtop();
97 u32 root = power2(mem);
98 u32 base = root;
99 u32 top = root;
100 u32 floor = 0;
101 int ct = 0;
29a9994b 102
edc05e6d 103 while (ct < nr) {
1da177e4 104 u32 fspace = 0;
edc05e6d
IM
105 u32 high;
106 u32 low;
1da177e4
LT
107
108 /*
edc05e6d 109 * Find the largest block we will fill going upwards
1da177e4 110 */
edc05e6d 111 high = power2(mem-top);
1da177e4
LT
112
113 /*
edc05e6d 114 * Find the largest block we will fill going downwards
1da177e4 115 */
edc05e6d 116 low = base/2;
1da177e4
LT
117
118 /*
edc05e6d
IM
119 * Don't fill below 1Mb going downwards as there
120 * is an ISA hole in the way.
29a9994b 121 */
29a9994b 122 if (base <= 1024*1024)
1da177e4 123 low = 0;
29a9994b 124
1da177e4 125 /*
edc05e6d
IM
126 * See how much space we could cover by filling below
127 * the ISA hole
1da177e4 128 */
29a9994b
PC
129
130 if (floor == 0)
1da177e4 131 fspace = 512*1024;
29a9994b 132 else if (floor == 512*1024)
1da177e4
LT
133 fspace = 128*1024;
134
135 /* And forget ROM space */
29a9994b 136
1da177e4 137 /*
edc05e6d 138 * Now install the largest coverage we get
1da177e4 139 */
edc05e6d 140 if (fspace > high && fspace > low) {
1da177e4
LT
141 centaur_mcr_insert(ct, floor, fspace, key);
142 floor += fspace;
edc05e6d 143 } else if (high > low) {
1da177e4
LT
144 centaur_mcr_insert(ct, top, high, key);
145 top += high;
edc05e6d 146 } else if (low > 0) {
1da177e4
LT
147 base -= low;
148 centaur_mcr_insert(ct, base, low, key);
edc05e6d
IM
149 } else
150 break;
1da177e4
LT
151 ct++;
152 }
153 /*
edc05e6d
IM
154 * We loaded ct values. We now need to set the mask. The caller
155 * must do this bit.
1da177e4 156 */
1da177e4
LT
157 return ct;
158}
159
b4af3f7c 160static void __cpuinit centaur_create_optimal_mcr(void)
1da177e4 161{
edc05e6d 162 int used;
1da177e4 163 int i;
edc05e6d 164
1da177e4 165 /*
edc05e6d
IM
166 * Allocate up to 6 mcrs to mark as much of ram as possible
167 * as write combining and weak write ordered.
1da177e4 168 *
edc05e6d
IM
169 * To experiment with: Linux never uses stack operations for
170 * mmio spaces so we could globally enable stack operation wc
1da177e4 171 *
edc05e6d
IM
172 * Load the registers with type 31 - full write combining, all
173 * writes weakly ordered.
1da177e4 174 */
edc05e6d 175 used = centaur_mcr_compute(6, 31);
1da177e4
LT
176
177 /*
edc05e6d 178 * Wipe unused MCRs
1da177e4 179 */
29a9994b 180 for (i = used; i < 8; i++)
1da177e4
LT
181 wrmsr(MSR_IDT_MCR0+i, 0, 0);
182}
183
b4af3f7c 184static void __cpuinit winchip2_create_optimal_mcr(void)
1da177e4
LT
185{
186 u32 lo, hi;
edc05e6d 187 int used;
1da177e4
LT
188 int i;
189
190 /*
edc05e6d
IM
191 * Allocate up to 6 mcrs to mark as much of ram as possible
192 * as write combining, weak store ordered.
1da177e4 193 *
edc05e6d
IM
194 * Load the registers with type 25
195 * 8 - weak write ordering
196 * 16 - weak read ordering
197 * 1 - write combining
1da177e4 198 */
edc05e6d 199 used = centaur_mcr_compute(6, 25);
29a9994b 200
1da177e4 201 /*
edc05e6d 202 * Mark the registers we are using.
1da177e4 203 */
1da177e4 204 rdmsr(MSR_IDT_MCR_CTRL, lo, hi);
29a9994b
PC
205 for (i = 0; i < used; i++)
206 lo |= 1<<(9+i);
1da177e4 207 wrmsr(MSR_IDT_MCR_CTRL, lo, hi);
29a9994b 208
1da177e4 209 /*
edc05e6d 210 * Wipe unused MCRs
1da177e4 211 */
29a9994b
PC
212
213 for (i = used; i < 8; i++)
1da177e4
LT
214 wrmsr(MSR_IDT_MCR0+i, 0, 0);
215}
216
217/*
edc05e6d 218 * Handle the MCR key on the Winchip 2.
1da177e4 219 */
b4af3f7c 220static void __cpuinit winchip2_unprotect_mcr(void)
1da177e4
LT
221{
222 u32 lo, hi;
223 u32 key;
29a9994b 224
1da177e4 225 rdmsr(MSR_IDT_MCR_CTRL, lo, hi);
29a9994b 226 lo &= ~0x1C0; /* blank bits 8-6 */
1da177e4
LT
227 key = (lo>>17) & 7;
228 lo |= key<<6; /* replace with unlock key */
229 wrmsr(MSR_IDT_MCR_CTRL, lo, hi);
230}
231
b4af3f7c 232static void __cpuinit winchip2_protect_mcr(void)
1da177e4
LT
233{
234 u32 lo, hi;
29a9994b 235
1da177e4 236 rdmsr(MSR_IDT_MCR_CTRL, lo, hi);
29a9994b 237 lo &= ~0x1C0; /* blank bits 8-6 */
1da177e4
LT
238 wrmsr(MSR_IDT_MCR_CTRL, lo, hi);
239}
240#endif /* CONFIG_X86_OOSTORE */
241
242#define ACE_PRESENT (1 << 6)
243#define ACE_ENABLED (1 << 7)
244#define ACE_FCR (1 << 28) /* MSR_VIA_FCR */
245
246#define RNG_PRESENT (1 << 2)
247#define RNG_ENABLED (1 << 3)
248#define RNG_ENABLE (1 << 6) /* MSR_VIA_RNG */
249
b4af3f7c 250static void __cpuinit init_c3(struct cpuinfo_x86 *c)
1da177e4
LT
251{
252 u32 lo, hi;
253
254 /* Test for Centaur Extended Feature Flags presence */
255 if (cpuid_eax(0xC0000000) >= 0xC0000001) {
256 u32 tmp = cpuid_edx(0xC0000001);
257
258 /* enable ACE unit, if present and disabled */
259 if ((tmp & (ACE_PRESENT | ACE_ENABLED)) == ACE_PRESENT) {
29a9994b 260 rdmsr(MSR_VIA_FCR, lo, hi);
1da177e4 261 lo |= ACE_FCR; /* enable ACE unit */
29a9994b 262 wrmsr(MSR_VIA_FCR, lo, hi);
1da177e4
LT
263 printk(KERN_INFO "CPU: Enabled ACE h/w crypto\n");
264 }
265
266 /* enable RNG unit, if present and disabled */
267 if ((tmp & (RNG_PRESENT | RNG_ENABLED)) == RNG_PRESENT) {
29a9994b 268 rdmsr(MSR_VIA_RNG, lo, hi);
1da177e4 269 lo |= RNG_ENABLE; /* enable RNG unit */
29a9994b 270 wrmsr(MSR_VIA_RNG, lo, hi);
1da177e4
LT
271 printk(KERN_INFO "CPU: Enabled h/w RNG\n");
272 }
273
274 /* store Centaur Extended Feature Flags as
275 * word 5 of the CPU capability bit array
276 */
277 c->x86_capability[5] = cpuid_edx(0xC0000001);
278 }
48f4c485 279#ifdef CONFIG_X86_32
27b46d76 280 /* Cyrix III family needs CX8 & PGE explicitly enabled. */
cb3f718d 281 if (c->x86_model >= 6 && c->x86_model <= 13) {
29a9994b 282 rdmsr(MSR_VIA_FCR, lo, hi);
1da177e4 283 lo |= (1<<1 | 1<<7);
29a9994b 284 wrmsr(MSR_VIA_FCR, lo, hi);
e1a94a97 285 set_cpu_cap(c, X86_FEATURE_CX8);
1da177e4
LT
286 }
287
288 /* Before Nehemiah, the C3's had 3dNOW! */
29a9994b 289 if (c->x86_model >= 6 && c->x86_model < 9)
e1a94a97 290 set_cpu_cap(c, X86_FEATURE_3DNOW);
48f4c485
SAS
291#endif
292 if (c->x86 == 0x6 && c->x86_model >= 0xf) {
293 c->x86_cache_alignment = c->x86_clflush_size * 2;
294 set_cpu_cap(c, X86_FEATURE_REP_GOOD);
295 }
1da177e4 296
27c13ece 297 cpu_detect_cache_sizes(c);
1da177e4
LT
298}
299
edc05e6d
IM
300enum {
301 ECX8 = 1<<1,
302 EIERRINT = 1<<2,
303 DPM = 1<<3,
304 DMCE = 1<<4,
305 DSTPCLK = 1<<5,
306 ELINEAR = 1<<6,
307 DSMC = 1<<7,
308 DTLOCK = 1<<8,
309 EDCTLB = 1<<8,
310 EMMX = 1<<9,
311 DPDC = 1<<11,
312 EBRPRED = 1<<12,
313 DIC = 1<<13,
314 DDC = 1<<14,
315 DNA = 1<<15,
316 ERETSTK = 1<<16,
317 E2MMX = 1<<19,
318 EAMD3D = 1<<20,
319};
320
5fef55fd
YL
321static void __cpuinit early_init_centaur(struct cpuinfo_x86 *c)
322{
323 switch (c->x86) {
48f4c485 324#ifdef CONFIG_X86_32
5fef55fd
YL
325 case 5:
326 /* Emulate MTRRs using Centaur's MCR. */
327 set_cpu_cap(c, X86_FEATURE_CENTAUR_MCR);
328 break;
48f4c485
SAS
329#endif
330 case 6:
331 if (c->x86_model >= 0xf)
332 set_cpu_cap(c, X86_FEATURE_CONSTANT_TSC);
333 break;
5fef55fd 334 }
48f4c485
SAS
335#ifdef CONFIG_X86_64
336 set_cpu_cap(c, X86_FEATURE_SYSENTER32);
337#endif
5fef55fd
YL
338}
339
b4af3f7c 340static void __cpuinit init_centaur(struct cpuinfo_x86 *c)
1da177e4 341{
48f4c485 342#ifdef CONFIG_X86_32
1da177e4 343 char *name;
29a9994b
PC
344 u32 fcr_set = 0;
345 u32 fcr_clr = 0;
346 u32 lo, hi, newlo;
347 u32 aa, bb, cc, dd;
1da177e4 348
edc05e6d
IM
349 /*
350 * Bit 31 in normal CPUID used for nonstandard 3DNow ID;
351 * 3DNow is IDd by bit 31 in extended CPUID (1*32+31) anyway
352 */
e1a94a97 353 clear_cpu_cap(c, 0*32+31);
48f4c485
SAS
354#endif
355 early_init_centaur(c);
1da177e4 356 switch (c->x86) {
48f4c485 357#ifdef CONFIG_X86_32
29a9994b 358 case 5:
edc05e6d
IM
359 switch (c->x86_model) {
360 case 4:
361 name = "C6";
362 fcr_set = ECX8|DSMC|EDCTLB|EMMX|ERETSTK;
363 fcr_clr = DPDC;
364 printk(KERN_NOTICE "Disabling bugged TSC.\n");
e1a94a97 365 clear_cpu_cap(c, X86_FEATURE_TSC);
1da177e4 366#ifdef CONFIG_X86_OOSTORE
edc05e6d
IM
367 centaur_create_optimal_mcr();
368 /*
369 * Enable:
370 * write combining on non-stack, non-string
371 * write combining on string, all types
372 * weak write ordering
373 *
374 * The C6 original lacks weak read order
375 *
376 * Note 0x120 is write only on Winchip 1
377 */
378 wrmsr(MSR_IDT_MCR_CTRL, 0x01F0001F, 0);
29a9994b 379#endif
edc05e6d
IM
380 break;
381 case 8:
382 switch (c->x86_mask) {
383 default:
384 name = "2";
1da177e4 385 break;
edc05e6d
IM
386 case 7 ... 9:
387 name = "2A";
388 break;
389 case 10 ... 15:
390 name = "2B";
391 break;
392 }
393 fcr_set = ECX8|DSMC|DTLOCK|EMMX|EBRPRED|ERETSTK|
394 E2MMX|EAMD3D;
395 fcr_clr = DPDC;
1da177e4 396#ifdef CONFIG_X86_OOSTORE
edc05e6d
IM
397 winchip2_unprotect_mcr();
398 winchip2_create_optimal_mcr();
399 rdmsr(MSR_IDT_MCR_CTRL, lo, hi);
400 /*
401 * Enable:
402 * write combining on non-stack, non-string
403 * write combining on string, all types
404 * weak write ordering
405 */
406 lo |= 31;
407 wrmsr(MSR_IDT_MCR_CTRL, lo, hi);
408 winchip2_protect_mcr();
1da177e4 409#endif
edc05e6d
IM
410 break;
411 case 9:
412 name = "3";
413 fcr_set = ECX8|DSMC|DTLOCK|EMMX|EBRPRED|ERETSTK|
414 E2MMX|EAMD3D;
415 fcr_clr = DPDC;
1da177e4 416#ifdef CONFIG_X86_OOSTORE
edc05e6d
IM
417 winchip2_unprotect_mcr();
418 winchip2_create_optimal_mcr();
419 rdmsr(MSR_IDT_MCR_CTRL, lo, hi);
420 /*
421 * Enable:
422 * write combining on non-stack, non-string
423 * write combining on string, all types
424 * weak write ordering
425 */
426 lo |= 31;
427 wrmsr(MSR_IDT_MCR_CTRL, lo, hi);
428 winchip2_protect_mcr();
1da177e4 429#endif
edc05e6d
IM
430 break;
431 default:
432 name = "??";
433 }
1da177e4 434
edc05e6d
IM
435 rdmsr(MSR_IDT_FCR1, lo, hi);
436 newlo = (lo|fcr_set) & (~fcr_clr);
1da177e4 437
edc05e6d
IM
438 if (newlo != lo) {
439 printk(KERN_INFO "Centaur FCR was 0x%X now 0x%X\n",
440 lo, newlo);
441 wrmsr(MSR_IDT_FCR1, newlo, hi);
442 } else {
443 printk(KERN_INFO "Centaur FCR is 0x%X\n", lo);
444 }
445 /* Emulate MTRRs using Centaur's MCR. */
e1a94a97 446 set_cpu_cap(c, X86_FEATURE_CENTAUR_MCR);
edc05e6d 447 /* Report CX8 */
e1a94a97 448 set_cpu_cap(c, X86_FEATURE_CX8);
edc05e6d
IM
449 /* Set 3DNow! on Winchip 2 and above. */
450 if (c->x86_model >= 8)
e1a94a97 451 set_cpu_cap(c, X86_FEATURE_3DNOW);
edc05e6d
IM
452 /* See if we can find out some more. */
453 if (cpuid_eax(0x80000000) >= 0x80000005) {
454 /* Yes, we can. */
455 cpuid(0x80000005, &aa, &bb, &cc, &dd);
456 /* Add L1 data and code cache sizes. */
457 c->x86_cache_size = (cc>>24)+(dd>>24);
458 }
459 sprintf(c->x86_model_id, "WinChip %s", name);
460 break;
48f4c485 461#endif
29a9994b 462 case 6:
edc05e6d
IM
463 init_c3(c);
464 break;
1da177e4 465 }
48f4c485
SAS
466#ifdef CONFIG_X86_64
467 set_cpu_cap(c, X86_FEATURE_LFENCE_RDTSC);
468#endif
1da177e4
LT
469}
470
edc05e6d
IM
471static unsigned int __cpuinit
472centaur_size_cache(struct cpuinfo_x86 *c, unsigned int size)
1da177e4 473{
48f4c485 474#ifdef CONFIG_X86_32
1da177e4
LT
475 /* VIA C3 CPUs (670-68F) need further shifting. */
476 if ((c->x86 == 6) && ((c->x86_model == 7) || (c->x86_model == 8)))
477 size >>= 8;
478
edc05e6d
IM
479 /*
480 * There's also an erratum in Nehemiah stepping 1, which
481 * returns '65KB' instead of '64KB'
482 * - Note, it seems this may only be in engineering samples.
483 */
484 if ((c->x86 == 6) && (c->x86_model == 9) &&
485 (c->x86_mask == 1) && (size == 65))
29a9994b 486 size -= 1;
48f4c485 487#endif
1da177e4
LT
488 return size;
489}
490
02dde8b4 491static const struct cpu_dev __cpuinitconst centaur_cpu_dev = {
1da177e4
LT
492 .c_vendor = "Centaur",
493 .c_ident = { "CentaurHauls" },
5fef55fd 494 .c_early_init = early_init_centaur,
1da177e4
LT
495 .c_init = init_centaur,
496 .c_size_cache = centaur_size_cache,
10a434fc 497 .c_x86_vendor = X86_VENDOR_CENTAUR,
1da177e4
LT
498};
499
10a434fc 500cpu_dev_register(centaur_cpu_dev);