| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 1 | /* -*- linux-c -*- ------------------------------------------------------- * | 
|  | 2 | * | 
|  | 3 | *   Copyright (C) 1991, 1992 Linus Torvalds | 
|  | 4 | *   Copyright 2007 rPath, Inc. - All Rights Reserved | 
|  | 5 | * | 
|  | 6 | *   This file is part of the Linux kernel, and is made available under | 
|  | 7 | *   the terms of the GNU General Public License version 2. | 
|  | 8 | * | 
|  | 9 | * ----------------------------------------------------------------------- */ | 
|  | 10 |  | 
|  | 11 | /* | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 12 | * Check for obligatory CPU features and abort if the features are not | 
|  | 13 | * present.  This code should be compilable as 16-, 32- or 64-bit | 
|  | 14 | * code, so be very careful with types and inline assembly. | 
|  | 15 | * | 
|  | 16 | * This code should not contain any messages; that requires an | 
|  | 17 | * additional wrapper. | 
|  | 18 | * | 
|  | 19 | * As written, this code is not safe for inclusion into the kernel | 
|  | 20 | * proper (after FPU initialization, in particular). | 
|  | 21 | */ | 
|  | 22 |  | 
|  | 23 | #ifdef _SETUP | 
|  | 24 | # include "boot.h" | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 25 | #endif | 
|  | 26 | #include <linux/types.h> | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 27 | #include <asm/processor-flags.h> | 
|  | 28 | #include <asm/required-features.h> | 
|  | 29 | #include <asm/msr-index.h> | 
|  | 30 |  | 
| Joerg Roedel | 7b27718 | 2008-08-13 10:07:05 +0200 | [diff] [blame] | 31 | struct cpu_features cpu; | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 32 | static u32 cpu_vendor[3]; | 
|  | 33 | static u32 err_flags[NCAPINTS]; | 
|  | 34 |  | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 35 | static const int req_level = CONFIG_X86_MINIMUM_CPU_FAMILY; | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 36 |  | 
|  | 37 | static const u32 req_flags[NCAPINTS] = | 
|  | 38 | { | 
|  | 39 | REQUIRED_MASK0, | 
|  | 40 | REQUIRED_MASK1, | 
| H. Peter Anvin | b74b06c | 2008-08-15 15:36:31 -0700 | [diff] [blame] | 41 | 0, /* REQUIRED_MASK2 not implemented in this file */ | 
|  | 42 | 0, /* REQUIRED_MASK3 not implemented in this file */ | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 43 | REQUIRED_MASK4, | 
| H. Peter Anvin | b74b06c | 2008-08-15 15:36:31 -0700 | [diff] [blame] | 44 | 0, /* REQUIRED_MASK5 not implemented in this file */ | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 45 | REQUIRED_MASK6, | 
| H. Peter Anvin | b74b06c | 2008-08-15 15:36:31 -0700 | [diff] [blame] | 46 | 0, /* REQUIRED_MASK7 not implemented in this file */ | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 47 | }; | 
|  | 48 |  | 
| Paolo Ciarrocchi | 7030760 | 2008-02-22 23:11:12 +0100 | [diff] [blame] | 49 | #define A32(a, b, c, d) (((d) << 24)+((c) << 16)+((b) << 8)+(a)) | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 50 |  | 
|  | 51 | static int is_amd(void) | 
|  | 52 | { | 
| Paolo Ciarrocchi | 7030760 | 2008-02-22 23:11:12 +0100 | [diff] [blame] | 53 | return cpu_vendor[0] == A32('A', 'u', 't', 'h') && | 
|  | 54 | cpu_vendor[1] == A32('e', 'n', 't', 'i') && | 
|  | 55 | cpu_vendor[2] == A32('c', 'A', 'M', 'D'); | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 56 | } | 
|  | 57 |  | 
|  | 58 | static int is_centaur(void) | 
|  | 59 | { | 
| Paolo Ciarrocchi | 7030760 | 2008-02-22 23:11:12 +0100 | [diff] [blame] | 60 | return cpu_vendor[0] == A32('C', 'e', 'n', 't') && | 
|  | 61 | cpu_vendor[1] == A32('a', 'u', 'r', 'H') && | 
|  | 62 | cpu_vendor[2] == A32('a', 'u', 'l', 's'); | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 63 | } | 
|  | 64 |  | 
|  | 65 | static int is_transmeta(void) | 
|  | 66 | { | 
| Paolo Ciarrocchi | 7030760 | 2008-02-22 23:11:12 +0100 | [diff] [blame] | 67 | return cpu_vendor[0] == A32('G', 'e', 'n', 'u') && | 
|  | 68 | cpu_vendor[1] == A32('i', 'n', 'e', 'T') && | 
|  | 69 | cpu_vendor[2] == A32('M', 'x', '8', '6'); | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 70 | } | 
|  | 71 |  | 
|  | 72 | static int has_fpu(void) | 
|  | 73 | { | 
|  | 74 | u16 fcw = -1, fsw = -1; | 
|  | 75 | u32 cr0; | 
|  | 76 |  | 
|  | 77 | asm("movl %%cr0,%0" : "=r" (cr0)); | 
|  | 78 | if (cr0 & (X86_CR0_EM|X86_CR0_TS)) { | 
|  | 79 | cr0 &= ~(X86_CR0_EM|X86_CR0_TS); | 
|  | 80 | asm volatile("movl %0,%%cr0" : : "r" (cr0)); | 
|  | 81 | } | 
|  | 82 |  | 
| H. Peter Anvin | b015124 | 2007-08-22 16:28:01 -0700 | [diff] [blame] | 83 | asm volatile("fninit ; fnstsw %0 ; fnstcw %1" | 
|  | 84 | : "+m" (fsw), "+m" (fcw)); | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 85 |  | 
|  | 86 | return fsw == 0 && (fcw & 0x103f) == 0x003f; | 
|  | 87 | } | 
|  | 88 |  | 
|  | 89 | static int has_eflag(u32 mask) | 
|  | 90 | { | 
|  | 91 | u32 f0, f1; | 
|  | 92 |  | 
|  | 93 | asm("pushfl ; " | 
|  | 94 | "pushfl ; " | 
|  | 95 | "popl %0 ; " | 
|  | 96 | "movl %0,%1 ; " | 
|  | 97 | "xorl %2,%1 ; " | 
|  | 98 | "pushl %1 ; " | 
|  | 99 | "popfl ; " | 
|  | 100 | "pushfl ; " | 
|  | 101 | "popl %1 ; " | 
|  | 102 | "popfl" | 
| H. Peter Anvin | 5593eaa | 2007-07-14 16:47:13 -0700 | [diff] [blame] | 103 | : "=&r" (f0), "=&r" (f1) | 
|  | 104 | : "ri" (mask)); | 
| H. Peter Anvin | 31b54f4 | 2007-07-11 12:18:47 -0700 | [diff] [blame] | 105 |  | 
|  | 106 | return !!((f0^f1) & mask); | 
|  | 107 | } | 
|  | 108 |  | 
|  | 109 | static void get_flags(void) | 
|  | 110 | { | 
|  | 111 | u32 max_intel_level, max_amd_level; | 
|  | 112 | u32 tfms; | 
|  | 113 |  | 
|  | 114 | if (has_fpu()) | 
|  | 115 | set_bit(X86_FEATURE_FPU, cpu.flags); | 
|  | 116 |  | 
|  | 117 | if (has_eflag(X86_EFLAGS_ID)) { | 
|  | 118 | asm("cpuid" | 
|  | 119 | : "=a" (max_intel_level), | 
|  | 120 | "=b" (cpu_vendor[0]), | 
|  | 121 | "=d" (cpu_vendor[1]), | 
|  | 122 | "=c" (cpu_vendor[2]) | 
|  | 123 | : "a" (0)); | 
|  | 124 |  | 
|  | 125 | if (max_intel_level >= 0x00000001 && | 
|  | 126 | max_intel_level <= 0x0000ffff) { | 
|  | 127 | asm("cpuid" | 
|  | 128 | : "=a" (tfms), | 
|  | 129 | "=c" (cpu.flags[4]), | 
|  | 130 | "=d" (cpu.flags[0]) | 
|  | 131 | : "a" (0x00000001) | 
|  | 132 | : "ebx"); | 
|  | 133 | cpu.level = (tfms >> 8) & 15; | 
|  | 134 | cpu.model = (tfms >> 4) & 15; | 
|  | 135 | if (cpu.level >= 6) | 
|  | 136 | cpu.model += ((tfms >> 16) & 0xf) << 4; | 
|  | 137 | } | 
|  | 138 |  | 
|  | 139 | asm("cpuid" | 
|  | 140 | : "=a" (max_amd_level) | 
|  | 141 | : "a" (0x80000000) | 
|  | 142 | : "ebx", "ecx", "edx"); | 
|  | 143 |  | 
|  | 144 | if (max_amd_level >= 0x80000001 && | 
|  | 145 | max_amd_level <= 0x8000ffff) { | 
|  | 146 | u32 eax = 0x80000001; | 
|  | 147 | asm("cpuid" | 
|  | 148 | : "+a" (eax), | 
|  | 149 | "=c" (cpu.flags[6]), | 
|  | 150 | "=d" (cpu.flags[1]) | 
|  | 151 | : : "ebx"); | 
|  | 152 | } | 
|  | 153 | } | 
|  | 154 | } | 
|  | 155 |  | 
|  | 156 | /* Returns a bitmask of which words we have error bits in */ | 
|  | 157 | static int check_flags(void) | 
|  | 158 | { | 
|  | 159 | u32 err; | 
|  | 160 | int i; | 
|  | 161 |  | 
|  | 162 | err = 0; | 
|  | 163 | for (i = 0; i < NCAPINTS; i++) { | 
|  | 164 | err_flags[i] = req_flags[i] & ~cpu.flags[i]; | 
|  | 165 | if (err_flags[i]) | 
|  | 166 | err |= 1 << i; | 
|  | 167 | } | 
|  | 168 |  | 
|  | 169 | return err; | 
|  | 170 | } | 
|  | 171 |  | 
|  | 172 | /* | 
|  | 173 | * Returns -1 on error. | 
|  | 174 | * | 
|  | 175 | * *cpu_level is set to the current CPU level; *req_level to the required | 
|  | 176 | * level.  x86-64 is considered level 64 for this purpose. | 
|  | 177 | * | 
|  | 178 | * *err_flags_ptr is set to the flags error array if there are flags missing. | 
|  | 179 | */ | 
|  | 180 | int check_cpu(int *cpu_level_ptr, int *req_level_ptr, u32 **err_flags_ptr) | 
|  | 181 | { | 
|  | 182 | int err; | 
|  | 183 |  | 
|  | 184 | memset(&cpu.flags, 0, sizeof cpu.flags); | 
|  | 185 | cpu.level = 3; | 
|  | 186 |  | 
|  | 187 | if (has_eflag(X86_EFLAGS_AC)) | 
|  | 188 | cpu.level = 4; | 
|  | 189 |  | 
|  | 190 | get_flags(); | 
|  | 191 | err = check_flags(); | 
|  | 192 |  | 
|  | 193 | if (test_bit(X86_FEATURE_LM, cpu.flags)) | 
|  | 194 | cpu.level = 64; | 
|  | 195 |  | 
|  | 196 | if (err == 0x01 && | 
|  | 197 | !(err_flags[0] & | 
|  | 198 | ~((1 << X86_FEATURE_XMM)|(1 << X86_FEATURE_XMM2))) && | 
|  | 199 | is_amd()) { | 
|  | 200 | /* If this is an AMD and we're only missing SSE+SSE2, try to | 
|  | 201 | turn them on */ | 
|  | 202 |  | 
|  | 203 | u32 ecx = MSR_K7_HWCR; | 
|  | 204 | u32 eax, edx; | 
|  | 205 |  | 
|  | 206 | asm("rdmsr" : "=a" (eax), "=d" (edx) : "c" (ecx)); | 
|  | 207 | eax &= ~(1 << 15); | 
|  | 208 | asm("wrmsr" : : "a" (eax), "d" (edx), "c" (ecx)); | 
|  | 209 |  | 
|  | 210 | get_flags();	/* Make sure it really did something */ | 
|  | 211 | err = check_flags(); | 
|  | 212 | } else if (err == 0x01 && | 
|  | 213 | !(err_flags[0] & ~(1 << X86_FEATURE_CX8)) && | 
|  | 214 | is_centaur() && cpu.model >= 6) { | 
|  | 215 | /* If this is a VIA C3, we might have to enable CX8 | 
|  | 216 | explicitly */ | 
|  | 217 |  | 
|  | 218 | u32 ecx = MSR_VIA_FCR; | 
|  | 219 | u32 eax, edx; | 
|  | 220 |  | 
|  | 221 | asm("rdmsr" : "=a" (eax), "=d" (edx) : "c" (ecx)); | 
|  | 222 | eax |= (1<<1)|(1<<7); | 
|  | 223 | asm("wrmsr" : : "a" (eax), "d" (edx), "c" (ecx)); | 
|  | 224 |  | 
|  | 225 | set_bit(X86_FEATURE_CX8, cpu.flags); | 
|  | 226 | err = check_flags(); | 
|  | 227 | } else if (err == 0x01 && is_transmeta()) { | 
|  | 228 | /* Transmeta might have masked feature bits in word 0 */ | 
|  | 229 |  | 
|  | 230 | u32 ecx = 0x80860004; | 
|  | 231 | u32 eax, edx; | 
|  | 232 | u32 level = 1; | 
|  | 233 |  | 
|  | 234 | asm("rdmsr" : "=a" (eax), "=d" (edx) : "c" (ecx)); | 
|  | 235 | asm("wrmsr" : : "a" (~0), "d" (edx), "c" (ecx)); | 
|  | 236 | asm("cpuid" | 
|  | 237 | : "+a" (level), "=d" (cpu.flags[0]) | 
|  | 238 | : : "ecx", "ebx"); | 
|  | 239 | asm("wrmsr" : : "a" (eax), "d" (edx), "c" (ecx)); | 
|  | 240 |  | 
|  | 241 | err = check_flags(); | 
|  | 242 | } | 
|  | 243 |  | 
|  | 244 | if (err_flags_ptr) | 
|  | 245 | *err_flags_ptr = err ? err_flags : NULL; | 
|  | 246 | if (cpu_level_ptr) | 
|  | 247 | *cpu_level_ptr = cpu.level; | 
|  | 248 | if (req_level_ptr) | 
|  | 249 | *req_level_ptr = req_level; | 
|  | 250 |  | 
|  | 251 | return (cpu.level < req_level || err) ? -1 : 0; | 
|  | 252 | } |