1 // Copyright 2016 The SwiftShader Authors. All Rights Reserved. 2 // 3 // Licensed under the Apache License, Version 2.0 (the "License"); 4 // you may not use this file except in compliance with the License. 5 // You may obtain a copy of the License at 6 // 7 // http://www.apache.org/licenses/LICENSE-2.0 8 // 9 // Unless required by applicable law or agreed to in writing, software 10 // distributed under the License is distributed on an "AS IS" BASIS, 11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 // See the License for the specific language governing permissions and 13 // limitations under the License. 14 15 #include "CPUID.hpp" 16 17 #if defined(_WIN32) 18 #ifndef WIN32_LEAN_AND_MEAN 19 #define WIN32_LEAN_AND_MEAN 20 #endif 21 #include <windows.h> 22 #include <intrin.h> 23 #include <float.h> 24 #else 25 #include <unistd.h> 26 #include <sched.h> 27 #include <sys/types.h> 28 #endif 29 30 namespace sw 31 { 32 bool CPUID::MMX = detectMMX(); 33 bool CPUID::CMOV = detectCMOV(); 34 bool CPUID::SSE = detectSSE(); 35 bool CPUID::SSE2 = detectSSE2(); 36 bool CPUID::SSE3 = detectSSE3(); 37 bool CPUID::SSSE3 = detectSSSE3(); 38 bool CPUID::SSE4_1 = detectSSE4_1(); 39 int CPUID::cores = detectCoreCount(); 40 int CPUID::affinity = detectAffinity(); 41 42 bool CPUID::enableMMX = true; 43 bool CPUID::enableCMOV = true; 44 bool CPUID::enableSSE = true; 45 bool CPUID::enableSSE2 = true; 46 bool CPUID::enableSSE3 = true; 47 bool CPUID::enableSSSE3 = true; 48 bool CPUID::enableSSE4_1 = true; 49 setEnableMMX(bool enable)50 void CPUID::setEnableMMX(bool enable) 51 { 52 enableMMX = enable; 53 54 if(!enableMMX) 55 { 56 enableSSE = false; 57 enableSSE2 = false; 58 enableSSE3 = false; 59 enableSSSE3 = false; 60 enableSSE4_1 = false; 61 } 62 } 63 setEnableCMOV(bool enable)64 void CPUID::setEnableCMOV(bool enable) 65 { 66 enableCMOV = enable; 67 68 if(!CMOV) 69 { 70 enableSSE = false; 71 enableSSE2 = false; 72 enableSSE3 = false; 73 enableSSSE3 = false; 74 enableSSE4_1 = false; 75 } 76 } 77 setEnableSSE(bool enable)78 void CPUID::setEnableSSE(bool enable) 79 { 80 enableSSE = enable; 81 82 if(enableSSE) 83 { 84 enableMMX = true; 85 enableCMOV = true; 86 } 87 else 88 { 89 enableSSE2 = false; 90 enableSSE3 = false; 91 enableSSSE3 = false; 92 enableSSE4_1 = false; 93 } 94 } 95 setEnableSSE2(bool enable)96 void CPUID::setEnableSSE2(bool enable) 97 { 98 enableSSE2 = enable; 99 100 if(enableSSE2) 101 { 102 enableMMX = true; 103 enableCMOV = true; 104 enableSSE = true; 105 } 106 else 107 { 108 enableSSE3 = false; 109 enableSSSE3 = false; 110 enableSSE4_1 = false; 111 } 112 } 113 setEnableSSE3(bool enable)114 void CPUID::setEnableSSE3(bool enable) 115 { 116 enableSSE3 = enable; 117 118 if(enableSSE3) 119 { 120 enableMMX = true; 121 enableCMOV = true; 122 enableSSE = true; 123 enableSSE2 = true; 124 } 125 else 126 { 127 enableSSSE3 = false; 128 enableSSE4_1 = false; 129 } 130 } 131 setEnableSSSE3(bool enable)132 void CPUID::setEnableSSSE3(bool enable) 133 { 134 enableSSSE3 = enable; 135 136 if(enableSSSE3) 137 { 138 enableMMX = true; 139 enableCMOV = true; 140 enableSSE = true; 141 enableSSE2 = true; 142 enableSSE3 = true; 143 } 144 else 145 { 146 enableSSE4_1 = false; 147 } 148 } 149 setEnableSSE4_1(bool enable)150 void CPUID::setEnableSSE4_1(bool enable) 151 { 152 enableSSE4_1 = enable; 153 154 if(enableSSE4_1) 155 { 156 enableMMX = true; 157 enableCMOV = true; 158 enableSSE = true; 159 enableSSE2 = true; 160 enableSSE3 = true; 161 enableSSSE3 = true; 162 } 163 } 164 cpuid(int registers[4],int info)165 static void cpuid(int registers[4], int info) 166 { 167 #if defined(_WIN32) 168 __cpuid(registers, info); 169 #else 170 __asm volatile("cpuid": "=a" (registers[0]), "=b" (registers[1]), "=c" (registers[2]), "=d" (registers[3]): "a" (info)); 171 #endif 172 } 173 detectMMX()174 bool CPUID::detectMMX() 175 { 176 int registers[4]; 177 cpuid(registers, 1); 178 return MMX = (registers[3] & 0x00800000) != 0; 179 } 180 detectCMOV()181 bool CPUID::detectCMOV() 182 { 183 int registers[4]; 184 cpuid(registers, 1); 185 return CMOV = (registers[3] & 0x00008000) != 0; 186 } 187 detectSSE()188 bool CPUID::detectSSE() 189 { 190 int registers[4]; 191 cpuid(registers, 1); 192 return SSE = (registers[3] & 0x02000000) != 0; 193 } 194 detectSSE2()195 bool CPUID::detectSSE2() 196 { 197 int registers[4]; 198 cpuid(registers, 1); 199 return SSE2 = (registers[3] & 0x04000000) != 0; 200 } 201 detectSSE3()202 bool CPUID::detectSSE3() 203 { 204 int registers[4]; 205 cpuid(registers, 1); 206 return SSE3 = (registers[2] & 0x00000001) != 0; 207 } 208 detectSSSE3()209 bool CPUID::detectSSSE3() 210 { 211 int registers[4]; 212 cpuid(registers, 1); 213 return SSSE3 = (registers[2] & 0x00000200) != 0; 214 } 215 detectSSE4_1()216 bool CPUID::detectSSE4_1() 217 { 218 int registers[4]; 219 cpuid(registers, 1); 220 return SSE4_1 = (registers[2] & 0x00080000) != 0; 221 } 222 detectCoreCount()223 int CPUID::detectCoreCount() 224 { 225 int cores = 0; 226 227 #if defined(_WIN32) 228 DWORD_PTR processAffinityMask = 1; 229 DWORD_PTR systemAffinityMask = 1; 230 231 GetProcessAffinityMask(GetCurrentProcess(), &processAffinityMask, &systemAffinityMask); 232 233 while(systemAffinityMask) 234 { 235 if(systemAffinityMask & 1) 236 { 237 cores++; 238 } 239 240 systemAffinityMask >>= 1; 241 } 242 #else 243 cores = sysconf(_SC_NPROCESSORS_ONLN); 244 #endif 245 246 if(cores < 1) cores = 1; 247 if(cores > 16) cores = 16; 248 249 return cores; // FIXME: Number of physical cores 250 } 251 detectAffinity()252 int CPUID::detectAffinity() 253 { 254 int cores = 0; 255 256 #if defined(_WIN32) 257 DWORD_PTR processAffinityMask = 1; 258 DWORD_PTR systemAffinityMask = 1; 259 260 GetProcessAffinityMask(GetCurrentProcess(), &processAffinityMask, &systemAffinityMask); 261 262 while(processAffinityMask) 263 { 264 if(processAffinityMask & 1) 265 { 266 cores++; 267 } 268 269 processAffinityMask >>= 1; 270 } 271 #else 272 return detectCoreCount(); // FIXME: Assumes no affinity limitation 273 #endif 274 275 if(cores < 1) cores = 1; 276 if(cores > 16) cores = 16; 277 278 return cores; 279 } 280 setFlushToZero(bool enable)281 void CPUID::setFlushToZero(bool enable) 282 { 283 #if defined(_MSC_VER) 284 _controlfp(enable ? _DN_FLUSH : _DN_SAVE, _MCW_DN); 285 #else 286 // Unimplemented 287 #endif 288 } 289 setDenormalsAreZero(bool enable)290 void CPUID::setDenormalsAreZero(bool enable) 291 { 292 // Unimplemented 293 } 294 } 295