1 //===--- X86.cpp - Implement X86 target feature support -------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements X86 TargetInfo objects.
10 //
11 //===----------------------------------------------------------------------===//
12
13 #include "X86.h"
14 #include "clang/Basic/Builtins.h"
15 #include "clang/Basic/Diagnostic.h"
16 #include "clang/Basic/TargetBuiltins.h"
17 #include "llvm/ADT/StringExtras.h"
18 #include "llvm/ADT/StringRef.h"
19 #include "llvm/ADT/StringSwitch.h"
20 #include "llvm/Support/X86TargetParser.h"
21
22 namespace clang {
23 namespace targets {
24
25 const Builtin::Info BuiltinInfoX86[] = {
26 #define BUILTIN(ID, TYPE, ATTRS) \
27 {#ID, TYPE, ATTRS, nullptr, ALL_LANGUAGES, nullptr},
28 #define TARGET_BUILTIN(ID, TYPE, ATTRS, FEATURE) \
29 {#ID, TYPE, ATTRS, nullptr, ALL_LANGUAGES, FEATURE},
30 #define TARGET_HEADER_BUILTIN(ID, TYPE, ATTRS, HEADER, LANGS, FEATURE) \
31 {#ID, TYPE, ATTRS, HEADER, LANGS, FEATURE},
32 #include "clang/Basic/BuiltinsX86.def"
33
34 #define BUILTIN(ID, TYPE, ATTRS) \
35 {#ID, TYPE, ATTRS, nullptr, ALL_LANGUAGES, nullptr},
36 #define TARGET_BUILTIN(ID, TYPE, ATTRS, FEATURE) \
37 {#ID, TYPE, ATTRS, nullptr, ALL_LANGUAGES, FEATURE},
38 #define TARGET_HEADER_BUILTIN(ID, TYPE, ATTRS, HEADER, LANGS, FEATURE) \
39 {#ID, TYPE, ATTRS, HEADER, LANGS, FEATURE},
40 #include "clang/Basic/BuiltinsX86_64.def"
41 };
42
43 static const char *const GCCRegNames[] = {
44 "ax", "dx", "cx", "bx", "si", "di", "bp", "sp",
45 "st", "st(1)", "st(2)", "st(3)", "st(4)", "st(5)", "st(6)", "st(7)",
46 "argp", "flags", "fpcr", "fpsr", "dirflag", "frame", "xmm0", "xmm1",
47 "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7", "mm0", "mm1",
48 "mm2", "mm3", "mm4", "mm5", "mm6", "mm7", "r8", "r9",
49 "r10", "r11", "r12", "r13", "r14", "r15", "xmm8", "xmm9",
50 "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15", "ymm0", "ymm1",
51 "ymm2", "ymm3", "ymm4", "ymm5", "ymm6", "ymm7", "ymm8", "ymm9",
52 "ymm10", "ymm11", "ymm12", "ymm13", "ymm14", "ymm15", "xmm16", "xmm17",
53 "xmm18", "xmm19", "xmm20", "xmm21", "xmm22", "xmm23", "xmm24", "xmm25",
54 "xmm26", "xmm27", "xmm28", "xmm29", "xmm30", "xmm31", "ymm16", "ymm17",
55 "ymm18", "ymm19", "ymm20", "ymm21", "ymm22", "ymm23", "ymm24", "ymm25",
56 "ymm26", "ymm27", "ymm28", "ymm29", "ymm30", "ymm31", "zmm0", "zmm1",
57 "zmm2", "zmm3", "zmm4", "zmm5", "zmm6", "zmm7", "zmm8", "zmm9",
58 "zmm10", "zmm11", "zmm12", "zmm13", "zmm14", "zmm15", "zmm16", "zmm17",
59 "zmm18", "zmm19", "zmm20", "zmm21", "zmm22", "zmm23", "zmm24", "zmm25",
60 "zmm26", "zmm27", "zmm28", "zmm29", "zmm30", "zmm31", "k0", "k1",
61 "k2", "k3", "k4", "k5", "k6", "k7",
62 "cr0", "cr2", "cr3", "cr4", "cr8",
63 "dr0", "dr1", "dr2", "dr3", "dr6", "dr7",
64 "bnd0", "bnd1", "bnd2", "bnd3",
65 "tmm0", "tmm1", "tmm2", "tmm3", "tmm4", "tmm5", "tmm6", "tmm7",
66 };
67
68 const TargetInfo::AddlRegName AddlRegNames[] = {
69 {{"al", "ah", "eax", "rax"}, 0},
70 {{"bl", "bh", "ebx", "rbx"}, 3},
71 {{"cl", "ch", "ecx", "rcx"}, 2},
72 {{"dl", "dh", "edx", "rdx"}, 1},
73 {{"esi", "rsi"}, 4},
74 {{"edi", "rdi"}, 5},
75 {{"esp", "rsp"}, 7},
76 {{"ebp", "rbp"}, 6},
77 {{"r8d", "r8w", "r8b"}, 38},
78 {{"r9d", "r9w", "r9b"}, 39},
79 {{"r10d", "r10w", "r10b"}, 40},
80 {{"r11d", "r11w", "r11b"}, 41},
81 {{"r12d", "r12w", "r12b"}, 42},
82 {{"r13d", "r13w", "r13b"}, 43},
83 {{"r14d", "r14w", "r14b"}, 44},
84 {{"r15d", "r15w", "r15b"}, 45},
85 };
86
87 } // namespace targets
88 } // namespace clang
89
90 using namespace clang;
91 using namespace clang::targets;
92
setFPMath(StringRef Name)93 bool X86TargetInfo::setFPMath(StringRef Name) {
94 if (Name == "387") {
95 FPMath = FP_387;
96 return true;
97 }
98 if (Name == "sse") {
99 FPMath = FP_SSE;
100 return true;
101 }
102 return false;
103 }
104
initFeatureMap(llvm::StringMap<bool> & Features,DiagnosticsEngine & Diags,StringRef CPU,const std::vector<std::string> & FeaturesVec) const105 bool X86TargetInfo::initFeatureMap(
106 llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags, StringRef CPU,
107 const std::vector<std::string> &FeaturesVec) const {
108 // FIXME: This *really* should not be here.
109 // X86_64 always has SSE2.
110 if (getTriple().getArch() == llvm::Triple::x86_64)
111 setFeatureEnabled(Features, "sse2", true);
112
113 using namespace llvm::X86;
114
115 SmallVector<StringRef, 16> CPUFeatures;
116 getFeaturesForCPU(CPU, CPUFeatures);
117 for (auto &F : CPUFeatures)
118 setFeatureEnabled(Features, F, true);
119
120 if (!TargetInfo::initFeatureMap(Features, Diags, CPU, FeaturesVec))
121 return false;
122
123 // Can't do this earlier because we need to be able to explicitly enable
124 // or disable these features and the things that they depend upon.
125
126 // Enable popcnt if sse4.2 is enabled and popcnt is not explicitly disabled.
127 auto I = Features.find("sse4.2");
128 if (I != Features.end() && I->getValue() &&
129 llvm::find(FeaturesVec, "-popcnt") == FeaturesVec.end())
130 Features["popcnt"] = true;
131
132 // Additionally, if SSE is enabled and mmx is not explicitly disabled,
133 // then enable MMX.
134 I = Features.find("sse");
135 if (I != Features.end() && I->getValue() &&
136 llvm::find(FeaturesVec, "-mmx") == FeaturesVec.end())
137 Features["mmx"] = true;
138
139 // Enable xsave if avx is enabled and xsave is not explicitly disabled.
140 I = Features.find("avx");
141 if (I != Features.end() && I->getValue() &&
142 llvm::find(FeaturesVec, "-xsave") == FeaturesVec.end())
143 Features["xsave"] = true;
144
145 return true;
146 }
147
setFeatureEnabled(llvm::StringMap<bool> & Features,StringRef Name,bool Enabled) const148 void X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features,
149 StringRef Name, bool Enabled) const {
150 if (Name == "sse4") {
151 // We can get here via the __target__ attribute since that's not controlled
152 // via the -msse4/-mno-sse4 command line alias. Handle this the same way
153 // here - turn on the sse4.2 if enabled, turn off the sse4.1 level if
154 // disabled.
155 if (Enabled)
156 Name = "sse4.2";
157 else
158 Name = "sse4.1";
159 }
160
161 Features[Name] = Enabled;
162 llvm::X86::updateImpliedFeatures(Name, Enabled, Features);
163 }
164
165 /// handleTargetFeatures - Perform initialization based on the user
166 /// configured set of features.
handleTargetFeatures(std::vector<std::string> & Features,DiagnosticsEngine & Diags)167 bool X86TargetInfo::handleTargetFeatures(std::vector<std::string> &Features,
168 DiagnosticsEngine &Diags) {
169 for (const auto &Feature : Features) {
170 if (Feature[0] != '+')
171 continue;
172
173 if (Feature == "+aes") {
174 HasAES = true;
175 } else if (Feature == "+vaes") {
176 HasVAES = true;
177 } else if (Feature == "+pclmul") {
178 HasPCLMUL = true;
179 } else if (Feature == "+vpclmulqdq") {
180 HasVPCLMULQDQ = true;
181 } else if (Feature == "+lzcnt") {
182 HasLZCNT = true;
183 } else if (Feature == "+rdrnd") {
184 HasRDRND = true;
185 } else if (Feature == "+fsgsbase") {
186 HasFSGSBASE = true;
187 } else if (Feature == "+bmi") {
188 HasBMI = true;
189 } else if (Feature == "+bmi2") {
190 HasBMI2 = true;
191 } else if (Feature == "+popcnt") {
192 HasPOPCNT = true;
193 } else if (Feature == "+rtm") {
194 HasRTM = true;
195 } else if (Feature == "+prfchw") {
196 HasPRFCHW = true;
197 } else if (Feature == "+rdseed") {
198 HasRDSEED = true;
199 } else if (Feature == "+adx") {
200 HasADX = true;
201 } else if (Feature == "+tbm") {
202 HasTBM = true;
203 } else if (Feature == "+lwp") {
204 HasLWP = true;
205 } else if (Feature == "+fma") {
206 HasFMA = true;
207 } else if (Feature == "+f16c") {
208 HasF16C = true;
209 } else if (Feature == "+gfni") {
210 HasGFNI = true;
211 } else if (Feature == "+avx512cd") {
212 HasAVX512CD = true;
213 } else if (Feature == "+avx512vpopcntdq") {
214 HasAVX512VPOPCNTDQ = true;
215 } else if (Feature == "+avx512vnni") {
216 HasAVX512VNNI = true;
217 } else if (Feature == "+avx512bf16") {
218 HasAVX512BF16 = true;
219 } else if (Feature == "+avx512er") {
220 HasAVX512ER = true;
221 } else if (Feature == "+avx512pf") {
222 HasAVX512PF = true;
223 } else if (Feature == "+avx512dq") {
224 HasAVX512DQ = true;
225 } else if (Feature == "+avx512bitalg") {
226 HasAVX512BITALG = true;
227 } else if (Feature == "+avx512bw") {
228 HasAVX512BW = true;
229 } else if (Feature == "+avx512vl") {
230 HasAVX512VL = true;
231 } else if (Feature == "+avx512vbmi") {
232 HasAVX512VBMI = true;
233 } else if (Feature == "+avx512vbmi2") {
234 HasAVX512VBMI2 = true;
235 } else if (Feature == "+avx512ifma") {
236 HasAVX512IFMA = true;
237 } else if (Feature == "+avx512vp2intersect") {
238 HasAVX512VP2INTERSECT = true;
239 } else if (Feature == "+sha") {
240 HasSHA = true;
241 } else if (Feature == "+shstk") {
242 HasSHSTK = true;
243 } else if (Feature == "+movbe") {
244 HasMOVBE = true;
245 } else if (Feature == "+sgx") {
246 HasSGX = true;
247 } else if (Feature == "+cx8") {
248 HasCX8 = true;
249 } else if (Feature == "+cx16") {
250 HasCX16 = true;
251 } else if (Feature == "+fxsr") {
252 HasFXSR = true;
253 } else if (Feature == "+xsave") {
254 HasXSAVE = true;
255 } else if (Feature == "+xsaveopt") {
256 HasXSAVEOPT = true;
257 } else if (Feature == "+xsavec") {
258 HasXSAVEC = true;
259 } else if (Feature == "+xsaves") {
260 HasXSAVES = true;
261 } else if (Feature == "+mwaitx") {
262 HasMWAITX = true;
263 } else if (Feature == "+pku") {
264 HasPKU = true;
265 } else if (Feature == "+clflushopt") {
266 HasCLFLUSHOPT = true;
267 } else if (Feature == "+clwb") {
268 HasCLWB = true;
269 } else if (Feature == "+wbnoinvd") {
270 HasWBNOINVD = true;
271 } else if (Feature == "+prefetchwt1") {
272 HasPREFETCHWT1 = true;
273 } else if (Feature == "+clzero") {
274 HasCLZERO = true;
275 } else if (Feature == "+cldemote") {
276 HasCLDEMOTE = true;
277 } else if (Feature == "+rdpid") {
278 HasRDPID = true;
279 } else if (Feature == "+kl") {
280 HasKL = true;
281 } else if (Feature == "+widekl") {
282 HasWIDEKL = true;
283 } else if (Feature == "+retpoline-external-thunk") {
284 HasRetpolineExternalThunk = true;
285 } else if (Feature == "+sahf") {
286 HasLAHFSAHF = true;
287 } else if (Feature == "+waitpkg") {
288 HasWAITPKG = true;
289 } else if (Feature == "+movdiri") {
290 HasMOVDIRI = true;
291 } else if (Feature == "+movdir64b") {
292 HasMOVDIR64B = true;
293 } else if (Feature == "+pconfig") {
294 HasPCONFIG = true;
295 } else if (Feature == "+ptwrite") {
296 HasPTWRITE = true;
297 } else if (Feature == "+invpcid") {
298 HasINVPCID = true;
299 } else if (Feature == "+enqcmd") {
300 HasENQCMD = true;
301 } else if (Feature == "+hreset") {
302 HasHRESET = true;
303 } else if (Feature == "+amx-bf16") {
304 HasAMXBF16 = true;
305 } else if (Feature == "+amx-int8") {
306 HasAMXINT8 = true;
307 } else if (Feature == "+amx-tile") {
308 HasAMXTILE = true;
309 } else if (Feature == "+avxvnni") {
310 HasAVXVNNI = true;
311 } else if (Feature == "+serialize") {
312 HasSERIALIZE = true;
313 } else if (Feature == "+tsxldtrk") {
314 HasTSXLDTRK = true;
315 } else if (Feature == "+uintr") {
316 HasUINTR = true;
317 }
318
319 X86SSEEnum Level = llvm::StringSwitch<X86SSEEnum>(Feature)
320 .Case("+avx512f", AVX512F)
321 .Case("+avx2", AVX2)
322 .Case("+avx", AVX)
323 .Case("+sse4.2", SSE42)
324 .Case("+sse4.1", SSE41)
325 .Case("+ssse3", SSSE3)
326 .Case("+sse3", SSE3)
327 .Case("+sse2", SSE2)
328 .Case("+sse", SSE1)
329 .Default(NoSSE);
330 SSELevel = std::max(SSELevel, Level);
331
332 MMX3DNowEnum ThreeDNowLevel = llvm::StringSwitch<MMX3DNowEnum>(Feature)
333 .Case("+3dnowa", AMD3DNowAthlon)
334 .Case("+3dnow", AMD3DNow)
335 .Case("+mmx", MMX)
336 .Default(NoMMX3DNow);
337 MMX3DNowLevel = std::max(MMX3DNowLevel, ThreeDNowLevel);
338
339 XOPEnum XLevel = llvm::StringSwitch<XOPEnum>(Feature)
340 .Case("+xop", XOP)
341 .Case("+fma4", FMA4)
342 .Case("+sse4a", SSE4A)
343 .Default(NoXOP);
344 XOPLevel = std::max(XOPLevel, XLevel);
345 }
346
347 // LLVM doesn't have a separate switch for fpmath, so only accept it if it
348 // matches the selected sse level.
349 if ((FPMath == FP_SSE && SSELevel < SSE1) ||
350 (FPMath == FP_387 && SSELevel >= SSE1)) {
351 Diags.Report(diag::err_target_unsupported_fpmath)
352 << (FPMath == FP_SSE ? "sse" : "387");
353 return false;
354 }
355
356 SimdDefaultAlign =
357 hasFeature("avx512f") ? 512 : hasFeature("avx") ? 256 : 128;
358 return true;
359 }
360
361 /// X86TargetInfo::getTargetDefines - Return the set of the X86-specific macro
362 /// definitions for this particular subtarget.
getTargetDefines(const LangOptions & Opts,MacroBuilder & Builder) const363 void X86TargetInfo::getTargetDefines(const LangOptions &Opts,
364 MacroBuilder &Builder) const {
365 // Inline assembly supports X86 flag outputs.
366 Builder.defineMacro("__GCC_ASM_FLAG_OUTPUTS__");
367
368 std::string CodeModel = getTargetOpts().CodeModel;
369 if (CodeModel == "default")
370 CodeModel = "small";
371 Builder.defineMacro("__code_model_" + CodeModel + "__");
372
373 // Target identification.
374 if (getTriple().getArch() == llvm::Triple::x86_64) {
375 Builder.defineMacro("__amd64__");
376 Builder.defineMacro("__amd64");
377 Builder.defineMacro("__x86_64");
378 Builder.defineMacro("__x86_64__");
379 if (getTriple().getArchName() == "x86_64h") {
380 Builder.defineMacro("__x86_64h");
381 Builder.defineMacro("__x86_64h__");
382 }
383 } else {
384 DefineStd(Builder, "i386", Opts);
385 }
386
387 Builder.defineMacro("__SEG_GS");
388 Builder.defineMacro("__SEG_FS");
389 Builder.defineMacro("__seg_gs", "__attribute__((address_space(256)))");
390 Builder.defineMacro("__seg_fs", "__attribute__((address_space(257)))");
391
392 // Subtarget options.
393 // FIXME: We are hard-coding the tune parameters based on the CPU, but they
394 // truly should be based on -mtune options.
395 using namespace llvm::X86;
396 switch (CPU) {
397 case CK_None:
398 break;
399 case CK_i386:
400 // The rest are coming from the i386 define above.
401 Builder.defineMacro("__tune_i386__");
402 break;
403 case CK_i486:
404 case CK_WinChipC6:
405 case CK_WinChip2:
406 case CK_C3:
407 defineCPUMacros(Builder, "i486");
408 break;
409 case CK_PentiumMMX:
410 Builder.defineMacro("__pentium_mmx__");
411 Builder.defineMacro("__tune_pentium_mmx__");
412 LLVM_FALLTHROUGH;
413 case CK_i586:
414 case CK_Pentium:
415 defineCPUMacros(Builder, "i586");
416 defineCPUMacros(Builder, "pentium");
417 break;
418 case CK_Pentium3:
419 case CK_PentiumM:
420 Builder.defineMacro("__tune_pentium3__");
421 LLVM_FALLTHROUGH;
422 case CK_Pentium2:
423 case CK_C3_2:
424 Builder.defineMacro("__tune_pentium2__");
425 LLVM_FALLTHROUGH;
426 case CK_PentiumPro:
427 case CK_i686:
428 defineCPUMacros(Builder, "i686");
429 defineCPUMacros(Builder, "pentiumpro");
430 break;
431 case CK_Pentium4:
432 defineCPUMacros(Builder, "pentium4");
433 break;
434 case CK_Yonah:
435 case CK_Prescott:
436 case CK_Nocona:
437 defineCPUMacros(Builder, "nocona");
438 break;
439 case CK_Core2:
440 case CK_Penryn:
441 defineCPUMacros(Builder, "core2");
442 break;
443 case CK_Bonnell:
444 defineCPUMacros(Builder, "atom");
445 break;
446 case CK_Silvermont:
447 defineCPUMacros(Builder, "slm");
448 break;
449 case CK_Goldmont:
450 defineCPUMacros(Builder, "goldmont");
451 break;
452 case CK_GoldmontPlus:
453 defineCPUMacros(Builder, "goldmont_plus");
454 break;
455 case CK_Tremont:
456 defineCPUMacros(Builder, "tremont");
457 break;
458 case CK_Nehalem:
459 case CK_Westmere:
460 case CK_SandyBridge:
461 case CK_IvyBridge:
462 case CK_Haswell:
463 case CK_Broadwell:
464 case CK_SkylakeClient:
465 case CK_SkylakeServer:
466 case CK_Cascadelake:
467 case CK_Cooperlake:
468 case CK_Cannonlake:
469 case CK_IcelakeClient:
470 case CK_IcelakeServer:
471 case CK_Tigerlake:
472 case CK_SapphireRapids:
473 case CK_Alderlake:
474 // FIXME: Historically, we defined this legacy name, it would be nice to
475 // remove it at some point. We've never exposed fine-grained names for
476 // recent primary x86 CPUs, and we should keep it that way.
477 defineCPUMacros(Builder, "corei7");
478 break;
479 case CK_KNL:
480 defineCPUMacros(Builder, "knl");
481 break;
482 case CK_KNM:
483 break;
484 case CK_Lakemont:
485 defineCPUMacros(Builder, "i586", /*Tuning*/false);
486 defineCPUMacros(Builder, "pentium", /*Tuning*/false);
487 Builder.defineMacro("__tune_lakemont__");
488 break;
489 case CK_K6_2:
490 Builder.defineMacro("__k6_2__");
491 Builder.defineMacro("__tune_k6_2__");
492 LLVM_FALLTHROUGH;
493 case CK_K6_3:
494 if (CPU != CK_K6_2) { // In case of fallthrough
495 // FIXME: GCC may be enabling these in cases where some other k6
496 // architecture is specified but -m3dnow is explicitly provided. The
497 // exact semantics need to be determined and emulated here.
498 Builder.defineMacro("__k6_3__");
499 Builder.defineMacro("__tune_k6_3__");
500 }
501 LLVM_FALLTHROUGH;
502 case CK_K6:
503 defineCPUMacros(Builder, "k6");
504 break;
505 case CK_Athlon:
506 case CK_AthlonXP:
507 defineCPUMacros(Builder, "athlon");
508 if (SSELevel != NoSSE) {
509 Builder.defineMacro("__athlon_sse__");
510 Builder.defineMacro("__tune_athlon_sse__");
511 }
512 break;
513 case CK_K8:
514 case CK_K8SSE3:
515 case CK_x86_64:
516 case CK_x86_64_v2:
517 case CK_x86_64_v3:
518 case CK_x86_64_v4:
519 defineCPUMacros(Builder, "k8");
520 break;
521 case CK_AMDFAM10:
522 defineCPUMacros(Builder, "amdfam10");
523 break;
524 case CK_BTVER1:
525 defineCPUMacros(Builder, "btver1");
526 break;
527 case CK_BTVER2:
528 defineCPUMacros(Builder, "btver2");
529 break;
530 case CK_BDVER1:
531 defineCPUMacros(Builder, "bdver1");
532 break;
533 case CK_BDVER2:
534 defineCPUMacros(Builder, "bdver2");
535 break;
536 case CK_BDVER3:
537 defineCPUMacros(Builder, "bdver3");
538 break;
539 case CK_BDVER4:
540 defineCPUMacros(Builder, "bdver4");
541 break;
542 case CK_ZNVER1:
543 defineCPUMacros(Builder, "znver1");
544 break;
545 case CK_ZNVER2:
546 defineCPUMacros(Builder, "znver2");
547 break;
548 case CK_ZNVER3:
549 defineCPUMacros(Builder, "znver3");
550 break;
551 case CK_Geode:
552 defineCPUMacros(Builder, "geode");
553 break;
554 }
555
556 // Target properties.
557 Builder.defineMacro("__REGISTER_PREFIX__", "");
558
559 // Define __NO_MATH_INLINES on linux/x86 so that we don't get inline
560 // functions in glibc header files that use FP Stack inline asm which the
561 // backend can't deal with (PR879).
562 Builder.defineMacro("__NO_MATH_INLINES");
563
564 if (HasAES)
565 Builder.defineMacro("__AES__");
566
567 if (HasVAES)
568 Builder.defineMacro("__VAES__");
569
570 if (HasPCLMUL)
571 Builder.defineMacro("__PCLMUL__");
572
573 if (HasVPCLMULQDQ)
574 Builder.defineMacro("__VPCLMULQDQ__");
575
576 // Note, in 32-bit mode, GCC does not define the macro if -mno-sahf. In LLVM,
577 // the feature flag only applies to 64-bit mode.
578 if (HasLAHFSAHF || getTriple().getArch() == llvm::Triple::x86)
579 Builder.defineMacro("__LAHF_SAHF__");
580
581 if (HasLZCNT)
582 Builder.defineMacro("__LZCNT__");
583
584 if (HasRDRND)
585 Builder.defineMacro("__RDRND__");
586
587 if (HasFSGSBASE)
588 Builder.defineMacro("__FSGSBASE__");
589
590 if (HasBMI)
591 Builder.defineMacro("__BMI__");
592
593 if (HasBMI2)
594 Builder.defineMacro("__BMI2__");
595
596 if (HasPOPCNT)
597 Builder.defineMacro("__POPCNT__");
598
599 if (HasRTM)
600 Builder.defineMacro("__RTM__");
601
602 if (HasPRFCHW)
603 Builder.defineMacro("__PRFCHW__");
604
605 if (HasRDSEED)
606 Builder.defineMacro("__RDSEED__");
607
608 if (HasADX)
609 Builder.defineMacro("__ADX__");
610
611 if (HasTBM)
612 Builder.defineMacro("__TBM__");
613
614 if (HasLWP)
615 Builder.defineMacro("__LWP__");
616
617 if (HasMWAITX)
618 Builder.defineMacro("__MWAITX__");
619
620 if (HasMOVBE)
621 Builder.defineMacro("__MOVBE__");
622
623 switch (XOPLevel) {
624 case XOP:
625 Builder.defineMacro("__XOP__");
626 LLVM_FALLTHROUGH;
627 case FMA4:
628 Builder.defineMacro("__FMA4__");
629 LLVM_FALLTHROUGH;
630 case SSE4A:
631 Builder.defineMacro("__SSE4A__");
632 LLVM_FALLTHROUGH;
633 case NoXOP:
634 break;
635 }
636
637 if (HasFMA)
638 Builder.defineMacro("__FMA__");
639
640 if (HasF16C)
641 Builder.defineMacro("__F16C__");
642
643 if (HasGFNI)
644 Builder.defineMacro("__GFNI__");
645
646 if (HasAVX512CD)
647 Builder.defineMacro("__AVX512CD__");
648 if (HasAVX512VPOPCNTDQ)
649 Builder.defineMacro("__AVX512VPOPCNTDQ__");
650 if (HasAVX512VNNI)
651 Builder.defineMacro("__AVX512VNNI__");
652 if (HasAVX512BF16)
653 Builder.defineMacro("__AVX512BF16__");
654 if (HasAVX512ER)
655 Builder.defineMacro("__AVX512ER__");
656 if (HasAVX512PF)
657 Builder.defineMacro("__AVX512PF__");
658 if (HasAVX512DQ)
659 Builder.defineMacro("__AVX512DQ__");
660 if (HasAVX512BITALG)
661 Builder.defineMacro("__AVX512BITALG__");
662 if (HasAVX512BW)
663 Builder.defineMacro("__AVX512BW__");
664 if (HasAVX512VL)
665 Builder.defineMacro("__AVX512VL__");
666 if (HasAVX512VBMI)
667 Builder.defineMacro("__AVX512VBMI__");
668 if (HasAVX512VBMI2)
669 Builder.defineMacro("__AVX512VBMI2__");
670 if (HasAVX512IFMA)
671 Builder.defineMacro("__AVX512IFMA__");
672 if (HasAVX512VP2INTERSECT)
673 Builder.defineMacro("__AVX512VP2INTERSECT__");
674 if (HasSHA)
675 Builder.defineMacro("__SHA__");
676
677 if (HasFXSR)
678 Builder.defineMacro("__FXSR__");
679 if (HasXSAVE)
680 Builder.defineMacro("__XSAVE__");
681 if (HasXSAVEOPT)
682 Builder.defineMacro("__XSAVEOPT__");
683 if (HasXSAVEC)
684 Builder.defineMacro("__XSAVEC__");
685 if (HasXSAVES)
686 Builder.defineMacro("__XSAVES__");
687 if (HasPKU)
688 Builder.defineMacro("__PKU__");
689 if (HasCLFLUSHOPT)
690 Builder.defineMacro("__CLFLUSHOPT__");
691 if (HasCLWB)
692 Builder.defineMacro("__CLWB__");
693 if (HasWBNOINVD)
694 Builder.defineMacro("__WBNOINVD__");
695 if (HasSHSTK)
696 Builder.defineMacro("__SHSTK__");
697 if (HasSGX)
698 Builder.defineMacro("__SGX__");
699 if (HasPREFETCHWT1)
700 Builder.defineMacro("__PREFETCHWT1__");
701 if (HasCLZERO)
702 Builder.defineMacro("__CLZERO__");
703 if (HasKL)
704 Builder.defineMacro("__KL__");
705 if (HasWIDEKL)
706 Builder.defineMacro("__WIDEKL__");
707 if (HasRDPID)
708 Builder.defineMacro("__RDPID__");
709 if (HasCLDEMOTE)
710 Builder.defineMacro("__CLDEMOTE__");
711 if (HasWAITPKG)
712 Builder.defineMacro("__WAITPKG__");
713 if (HasMOVDIRI)
714 Builder.defineMacro("__MOVDIRI__");
715 if (HasMOVDIR64B)
716 Builder.defineMacro("__MOVDIR64B__");
717 if (HasPCONFIG)
718 Builder.defineMacro("__PCONFIG__");
719 if (HasPTWRITE)
720 Builder.defineMacro("__PTWRITE__");
721 if (HasINVPCID)
722 Builder.defineMacro("__INVPCID__");
723 if (HasENQCMD)
724 Builder.defineMacro("__ENQCMD__");
725 if (HasHRESET)
726 Builder.defineMacro("__HRESET__");
727 if (HasAMXTILE)
728 Builder.defineMacro("__AMXTILE__");
729 if (HasAMXINT8)
730 Builder.defineMacro("__AMXINT8__");
731 if (HasAMXBF16)
732 Builder.defineMacro("__AMXBF16__");
733 if (HasAVXVNNI)
734 Builder.defineMacro("__AVXVNNI__");
735 if (HasSERIALIZE)
736 Builder.defineMacro("__SERIALIZE__");
737 if (HasTSXLDTRK)
738 Builder.defineMacro("__TSXLDTRK__");
739 if (HasUINTR)
740 Builder.defineMacro("__UINTR__");
741
742 // Each case falls through to the previous one here.
743 switch (SSELevel) {
744 case AVX512F:
745 Builder.defineMacro("__AVX512F__");
746 LLVM_FALLTHROUGH;
747 case AVX2:
748 Builder.defineMacro("__AVX2__");
749 LLVM_FALLTHROUGH;
750 case AVX:
751 Builder.defineMacro("__AVX__");
752 LLVM_FALLTHROUGH;
753 case SSE42:
754 Builder.defineMacro("__SSE4_2__");
755 LLVM_FALLTHROUGH;
756 case SSE41:
757 Builder.defineMacro("__SSE4_1__");
758 LLVM_FALLTHROUGH;
759 case SSSE3:
760 Builder.defineMacro("__SSSE3__");
761 LLVM_FALLTHROUGH;
762 case SSE3:
763 Builder.defineMacro("__SSE3__");
764 LLVM_FALLTHROUGH;
765 case SSE2:
766 Builder.defineMacro("__SSE2__");
767 Builder.defineMacro("__SSE2_MATH__"); // -mfp-math=sse always implied.
768 LLVM_FALLTHROUGH;
769 case SSE1:
770 Builder.defineMacro("__SSE__");
771 Builder.defineMacro("__SSE_MATH__"); // -mfp-math=sse always implied.
772 LLVM_FALLTHROUGH;
773 case NoSSE:
774 break;
775 }
776
777 if (Opts.MicrosoftExt && getTriple().getArch() == llvm::Triple::x86) {
778 switch (SSELevel) {
779 case AVX512F:
780 case AVX2:
781 case AVX:
782 case SSE42:
783 case SSE41:
784 case SSSE3:
785 case SSE3:
786 case SSE2:
787 Builder.defineMacro("_M_IX86_FP", Twine(2));
788 break;
789 case SSE1:
790 Builder.defineMacro("_M_IX86_FP", Twine(1));
791 break;
792 default:
793 Builder.defineMacro("_M_IX86_FP", Twine(0));
794 break;
795 }
796 }
797
798 // Each case falls through to the previous one here.
799 switch (MMX3DNowLevel) {
800 case AMD3DNowAthlon:
801 Builder.defineMacro("__3dNOW_A__");
802 LLVM_FALLTHROUGH;
803 case AMD3DNow:
804 Builder.defineMacro("__3dNOW__");
805 LLVM_FALLTHROUGH;
806 case MMX:
807 Builder.defineMacro("__MMX__");
808 LLVM_FALLTHROUGH;
809 case NoMMX3DNow:
810 break;
811 }
812
813 if (CPU >= CK_i486 || CPU == CK_None) {
814 Builder.defineMacro("__GCC_HAVE_SYNC_COMPARE_AND_SWAP_1");
815 Builder.defineMacro("__GCC_HAVE_SYNC_COMPARE_AND_SWAP_2");
816 Builder.defineMacro("__GCC_HAVE_SYNC_COMPARE_AND_SWAP_4");
817 }
818 if (HasCX8)
819 Builder.defineMacro("__GCC_HAVE_SYNC_COMPARE_AND_SWAP_8");
820 if (HasCX16 && getTriple().getArch() == llvm::Triple::x86_64)
821 Builder.defineMacro("__GCC_HAVE_SYNC_COMPARE_AND_SWAP_16");
822
823 if (HasFloat128)
824 Builder.defineMacro("__SIZEOF_FLOAT128__", "16");
825 }
826
isValidFeatureName(StringRef Name) const827 bool X86TargetInfo::isValidFeatureName(StringRef Name) const {
828 return llvm::StringSwitch<bool>(Name)
829 .Case("3dnow", true)
830 .Case("3dnowa", true)
831 .Case("adx", true)
832 .Case("aes", true)
833 .Case("amx-bf16", true)
834 .Case("amx-int8", true)
835 .Case("amx-tile", true)
836 .Case("avx", true)
837 .Case("avx2", true)
838 .Case("avx512f", true)
839 .Case("avx512cd", true)
840 .Case("avx512vpopcntdq", true)
841 .Case("avx512vnni", true)
842 .Case("avx512bf16", true)
843 .Case("avx512er", true)
844 .Case("avx512pf", true)
845 .Case("avx512dq", true)
846 .Case("avx512bitalg", true)
847 .Case("avx512bw", true)
848 .Case("avx512vl", true)
849 .Case("avx512vbmi", true)
850 .Case("avx512vbmi2", true)
851 .Case("avx512ifma", true)
852 .Case("avx512vp2intersect", true)
853 .Case("avxvnni", true)
854 .Case("bmi", true)
855 .Case("bmi2", true)
856 .Case("cldemote", true)
857 .Case("clflushopt", true)
858 .Case("clwb", true)
859 .Case("clzero", true)
860 .Case("cx16", true)
861 .Case("enqcmd", true)
862 .Case("f16c", true)
863 .Case("fma", true)
864 .Case("fma4", true)
865 .Case("fsgsbase", true)
866 .Case("fxsr", true)
867 .Case("gfni", true)
868 .Case("hreset", true)
869 .Case("invpcid", true)
870 .Case("kl", true)
871 .Case("widekl", true)
872 .Case("lwp", true)
873 .Case("lzcnt", true)
874 .Case("mmx", true)
875 .Case("movbe", true)
876 .Case("movdiri", true)
877 .Case("movdir64b", true)
878 .Case("mwaitx", true)
879 .Case("pclmul", true)
880 .Case("pconfig", true)
881 .Case("pku", true)
882 .Case("popcnt", true)
883 .Case("prefetchwt1", true)
884 .Case("prfchw", true)
885 .Case("ptwrite", true)
886 .Case("rdpid", true)
887 .Case("rdrnd", true)
888 .Case("rdseed", true)
889 .Case("rtm", true)
890 .Case("sahf", true)
891 .Case("serialize", true)
892 .Case("sgx", true)
893 .Case("sha", true)
894 .Case("shstk", true)
895 .Case("sse", true)
896 .Case("sse2", true)
897 .Case("sse3", true)
898 .Case("ssse3", true)
899 .Case("sse4", true)
900 .Case("sse4.1", true)
901 .Case("sse4.2", true)
902 .Case("sse4a", true)
903 .Case("tbm", true)
904 .Case("tsxldtrk", true)
905 .Case("uintr", true)
906 .Case("vaes", true)
907 .Case("vpclmulqdq", true)
908 .Case("wbnoinvd", true)
909 .Case("waitpkg", true)
910 .Case("x87", true)
911 .Case("xop", true)
912 .Case("xsave", true)
913 .Case("xsavec", true)
914 .Case("xsaves", true)
915 .Case("xsaveopt", true)
916 .Default(false);
917 }
918
hasFeature(StringRef Feature) const919 bool X86TargetInfo::hasFeature(StringRef Feature) const {
920 return llvm::StringSwitch<bool>(Feature)
921 .Case("adx", HasADX)
922 .Case("aes", HasAES)
923 .Case("amx-bf16", HasAMXBF16)
924 .Case("amx-int8", HasAMXINT8)
925 .Case("amx-tile", HasAMXTILE)
926 .Case("avxvnni", HasAVXVNNI)
927 .Case("avx", SSELevel >= AVX)
928 .Case("avx2", SSELevel >= AVX2)
929 .Case("avx512f", SSELevel >= AVX512F)
930 .Case("avx512cd", HasAVX512CD)
931 .Case("avx512vpopcntdq", HasAVX512VPOPCNTDQ)
932 .Case("avx512vnni", HasAVX512VNNI)
933 .Case("avx512bf16", HasAVX512BF16)
934 .Case("avx512er", HasAVX512ER)
935 .Case("avx512pf", HasAVX512PF)
936 .Case("avx512dq", HasAVX512DQ)
937 .Case("avx512bitalg", HasAVX512BITALG)
938 .Case("avx512bw", HasAVX512BW)
939 .Case("avx512vl", HasAVX512VL)
940 .Case("avx512vbmi", HasAVX512VBMI)
941 .Case("avx512vbmi2", HasAVX512VBMI2)
942 .Case("avx512ifma", HasAVX512IFMA)
943 .Case("avx512vp2intersect", HasAVX512VP2INTERSECT)
944 .Case("bmi", HasBMI)
945 .Case("bmi2", HasBMI2)
946 .Case("cldemote", HasCLDEMOTE)
947 .Case("clflushopt", HasCLFLUSHOPT)
948 .Case("clwb", HasCLWB)
949 .Case("clzero", HasCLZERO)
950 .Case("cx8", HasCX8)
951 .Case("cx16", HasCX16)
952 .Case("enqcmd", HasENQCMD)
953 .Case("f16c", HasF16C)
954 .Case("fma", HasFMA)
955 .Case("fma4", XOPLevel >= FMA4)
956 .Case("fsgsbase", HasFSGSBASE)
957 .Case("fxsr", HasFXSR)
958 .Case("gfni", HasGFNI)
959 .Case("hreset", HasHRESET)
960 .Case("invpcid", HasINVPCID)
961 .Case("kl", HasKL)
962 .Case("widekl", HasWIDEKL)
963 .Case("lwp", HasLWP)
964 .Case("lzcnt", HasLZCNT)
965 .Case("mm3dnow", MMX3DNowLevel >= AMD3DNow)
966 .Case("mm3dnowa", MMX3DNowLevel >= AMD3DNowAthlon)
967 .Case("mmx", MMX3DNowLevel >= MMX)
968 .Case("movbe", HasMOVBE)
969 .Case("movdiri", HasMOVDIRI)
970 .Case("movdir64b", HasMOVDIR64B)
971 .Case("mwaitx", HasMWAITX)
972 .Case("pclmul", HasPCLMUL)
973 .Case("pconfig", HasPCONFIG)
974 .Case("pku", HasPKU)
975 .Case("popcnt", HasPOPCNT)
976 .Case("prefetchwt1", HasPREFETCHWT1)
977 .Case("prfchw", HasPRFCHW)
978 .Case("ptwrite", HasPTWRITE)
979 .Case("rdpid", HasRDPID)
980 .Case("rdrnd", HasRDRND)
981 .Case("rdseed", HasRDSEED)
982 .Case("retpoline-external-thunk", HasRetpolineExternalThunk)
983 .Case("rtm", HasRTM)
984 .Case("sahf", HasLAHFSAHF)
985 .Case("serialize", HasSERIALIZE)
986 .Case("sgx", HasSGX)
987 .Case("sha", HasSHA)
988 .Case("shstk", HasSHSTK)
989 .Case("sse", SSELevel >= SSE1)
990 .Case("sse2", SSELevel >= SSE2)
991 .Case("sse3", SSELevel >= SSE3)
992 .Case("ssse3", SSELevel >= SSSE3)
993 .Case("sse4.1", SSELevel >= SSE41)
994 .Case("sse4.2", SSELevel >= SSE42)
995 .Case("sse4a", XOPLevel >= SSE4A)
996 .Case("tbm", HasTBM)
997 .Case("tsxldtrk", HasTSXLDTRK)
998 .Case("uintr", HasUINTR)
999 .Case("vaes", HasVAES)
1000 .Case("vpclmulqdq", HasVPCLMULQDQ)
1001 .Case("wbnoinvd", HasWBNOINVD)
1002 .Case("waitpkg", HasWAITPKG)
1003 .Case("x86", true)
1004 .Case("x86_32", getTriple().getArch() == llvm::Triple::x86)
1005 .Case("x86_64", getTriple().getArch() == llvm::Triple::x86_64)
1006 .Case("xop", XOPLevel >= XOP)
1007 .Case("xsave", HasXSAVE)
1008 .Case("xsavec", HasXSAVEC)
1009 .Case("xsaves", HasXSAVES)
1010 .Case("xsaveopt", HasXSAVEOPT)
1011 .Default(false);
1012 }
1013
1014 // We can't use a generic validation scheme for the features accepted here
1015 // versus subtarget features accepted in the target attribute because the
1016 // bitfield structure that's initialized in the runtime only supports the
1017 // below currently rather than the full range of subtarget features. (See
1018 // X86TargetInfo::hasFeature for a somewhat comprehensive list).
validateCpuSupports(StringRef FeatureStr) const1019 bool X86TargetInfo::validateCpuSupports(StringRef FeatureStr) const {
1020 return llvm::StringSwitch<bool>(FeatureStr)
1021 #define X86_FEATURE_COMPAT(ENUM, STR) .Case(STR, true)
1022 #include "llvm/Support/X86TargetParser.def"
1023 .Default(false);
1024 }
1025
getFeature(StringRef Name)1026 static llvm::X86::ProcessorFeatures getFeature(StringRef Name) {
1027 return llvm::StringSwitch<llvm::X86::ProcessorFeatures>(Name)
1028 #define X86_FEATURE_COMPAT(ENUM, STR) .Case(STR, llvm::X86::FEATURE_##ENUM)
1029 #include "llvm/Support/X86TargetParser.def"
1030 ;
1031 // Note, this function should only be used after ensuring the value is
1032 // correct, so it asserts if the value is out of range.
1033 }
1034
getFeaturePriority(llvm::X86::ProcessorFeatures Feat)1035 static unsigned getFeaturePriority(llvm::X86::ProcessorFeatures Feat) {
1036 enum class FeatPriority {
1037 #define FEATURE(FEAT) FEAT,
1038 #include "clang/Basic/X86Target.def"
1039 };
1040 switch (Feat) {
1041 #define FEATURE(FEAT) \
1042 case llvm::X86::FEAT: \
1043 return static_cast<unsigned>(FeatPriority::FEAT);
1044 #include "clang/Basic/X86Target.def"
1045 default:
1046 llvm_unreachable("No Feature Priority for non-CPUSupports Features");
1047 }
1048 }
1049
multiVersionSortPriority(StringRef Name) const1050 unsigned X86TargetInfo::multiVersionSortPriority(StringRef Name) const {
1051 // Valid CPUs have a 'key feature' that compares just better than its key
1052 // feature.
1053 using namespace llvm::X86;
1054 CPUKind Kind = parseArchX86(Name);
1055 if (Kind != CK_None) {
1056 ProcessorFeatures KeyFeature = getKeyFeature(Kind);
1057 return (getFeaturePriority(KeyFeature) << 1) + 1;
1058 }
1059
1060 // Now we know we have a feature, so get its priority and shift it a few so
1061 // that we have sufficient room for the CPUs (above).
1062 return getFeaturePriority(getFeature(Name)) << 1;
1063 }
1064
validateCPUSpecificCPUDispatch(StringRef Name) const1065 bool X86TargetInfo::validateCPUSpecificCPUDispatch(StringRef Name) const {
1066 return llvm::StringSwitch<bool>(Name)
1067 #define CPU_SPECIFIC(NAME, MANGLING, FEATURES) .Case(NAME, true)
1068 #define CPU_SPECIFIC_ALIAS(NEW_NAME, NAME) .Case(NEW_NAME, true)
1069 #include "clang/Basic/X86Target.def"
1070 .Default(false);
1071 }
1072
CPUSpecificCPUDispatchNameDealias(StringRef Name)1073 static StringRef CPUSpecificCPUDispatchNameDealias(StringRef Name) {
1074 return llvm::StringSwitch<StringRef>(Name)
1075 #define CPU_SPECIFIC_ALIAS(NEW_NAME, NAME) .Case(NEW_NAME, NAME)
1076 #include "clang/Basic/X86Target.def"
1077 .Default(Name);
1078 }
1079
CPUSpecificManglingCharacter(StringRef Name) const1080 char X86TargetInfo::CPUSpecificManglingCharacter(StringRef Name) const {
1081 return llvm::StringSwitch<char>(CPUSpecificCPUDispatchNameDealias(Name))
1082 #define CPU_SPECIFIC(NAME, MANGLING, FEATURES) .Case(NAME, MANGLING)
1083 #include "clang/Basic/X86Target.def"
1084 .Default(0);
1085 }
1086
getCPUSpecificCPUDispatchFeatures(StringRef Name,llvm::SmallVectorImpl<StringRef> & Features) const1087 void X86TargetInfo::getCPUSpecificCPUDispatchFeatures(
1088 StringRef Name, llvm::SmallVectorImpl<StringRef> &Features) const {
1089 StringRef WholeList =
1090 llvm::StringSwitch<StringRef>(CPUSpecificCPUDispatchNameDealias(Name))
1091 #define CPU_SPECIFIC(NAME, MANGLING, FEATURES) .Case(NAME, FEATURES)
1092 #include "clang/Basic/X86Target.def"
1093 .Default("");
1094 WholeList.split(Features, ',', /*MaxSplit=*/-1, /*KeepEmpty=*/false);
1095 }
1096
1097 // We can't use a generic validation scheme for the cpus accepted here
1098 // versus subtarget cpus accepted in the target attribute because the
1099 // variables intitialized by the runtime only support the below currently
1100 // rather than the full range of cpus.
validateCpuIs(StringRef FeatureStr) const1101 bool X86TargetInfo::validateCpuIs(StringRef FeatureStr) const {
1102 return llvm::StringSwitch<bool>(FeatureStr)
1103 #define X86_VENDOR(ENUM, STRING) .Case(STRING, true)
1104 #define X86_CPU_TYPE_ALIAS(ENUM, ALIAS) .Case(ALIAS, true)
1105 #define X86_CPU_TYPE(ENUM, STR) .Case(STR, true)
1106 #define X86_CPU_SUBTYPE(ENUM, STR) .Case(STR, true)
1107 #include "llvm/Support/X86TargetParser.def"
1108 .Default(false);
1109 }
1110
matchAsmCCConstraint(const char * & Name)1111 static unsigned matchAsmCCConstraint(const char *&Name) {
1112 auto RV = llvm::StringSwitch<unsigned>(Name)
1113 .Case("@cca", 4)
1114 .Case("@ccae", 5)
1115 .Case("@ccb", 4)
1116 .Case("@ccbe", 5)
1117 .Case("@ccc", 4)
1118 .Case("@cce", 4)
1119 .Case("@ccz", 4)
1120 .Case("@ccg", 4)
1121 .Case("@ccge", 5)
1122 .Case("@ccl", 4)
1123 .Case("@ccle", 5)
1124 .Case("@ccna", 5)
1125 .Case("@ccnae", 6)
1126 .Case("@ccnb", 5)
1127 .Case("@ccnbe", 6)
1128 .Case("@ccnc", 5)
1129 .Case("@ccne", 5)
1130 .Case("@ccnz", 5)
1131 .Case("@ccng", 5)
1132 .Case("@ccnge", 6)
1133 .Case("@ccnl", 5)
1134 .Case("@ccnle", 6)
1135 .Case("@ccno", 5)
1136 .Case("@ccnp", 5)
1137 .Case("@ccns", 5)
1138 .Case("@cco", 4)
1139 .Case("@ccp", 4)
1140 .Case("@ccs", 4)
1141 .Default(0);
1142 return RV;
1143 }
1144
validateAsmConstraint(const char * & Name,TargetInfo::ConstraintInfo & Info) const1145 bool X86TargetInfo::validateAsmConstraint(
1146 const char *&Name, TargetInfo::ConstraintInfo &Info) const {
1147 switch (*Name) {
1148 default:
1149 return false;
1150 // Constant constraints.
1151 case 'e': // 32-bit signed integer constant for use with sign-extending x86_64
1152 // instructions.
1153 case 'Z': // 32-bit unsigned integer constant for use with zero-extending
1154 // x86_64 instructions.
1155 case 's':
1156 Info.setRequiresImmediate();
1157 return true;
1158 case 'I':
1159 Info.setRequiresImmediate(0, 31);
1160 return true;
1161 case 'J':
1162 Info.setRequiresImmediate(0, 63);
1163 return true;
1164 case 'K':
1165 Info.setRequiresImmediate(-128, 127);
1166 return true;
1167 case 'L':
1168 Info.setRequiresImmediate({int(0xff), int(0xffff), int(0xffffffff)});
1169 return true;
1170 case 'M':
1171 Info.setRequiresImmediate(0, 3);
1172 return true;
1173 case 'N':
1174 Info.setRequiresImmediate(0, 255);
1175 return true;
1176 case 'O':
1177 Info.setRequiresImmediate(0, 127);
1178 return true;
1179 // Register constraints.
1180 case 'Y': // 'Y' is the first character for several 2-character constraints.
1181 // Shift the pointer to the second character of the constraint.
1182 Name++;
1183 switch (*Name) {
1184 default:
1185 return false;
1186 case 'z': // First SSE register.
1187 case '2':
1188 case 't': // Any SSE register, when SSE2 is enabled.
1189 case 'i': // Any SSE register, when SSE2 and inter-unit moves enabled.
1190 case 'm': // Any MMX register, when inter-unit moves enabled.
1191 case 'k': // AVX512 arch mask registers: k1-k7.
1192 Info.setAllowsRegister();
1193 return true;
1194 }
1195 case 'f': // Any x87 floating point stack register.
1196 // Constraint 'f' cannot be used for output operands.
1197 if (Info.ConstraintStr[0] == '=')
1198 return false;
1199 Info.setAllowsRegister();
1200 return true;
1201 case 'a': // eax.
1202 case 'b': // ebx.
1203 case 'c': // ecx.
1204 case 'd': // edx.
1205 case 'S': // esi.
1206 case 'D': // edi.
1207 case 'A': // edx:eax.
1208 case 't': // Top of floating point stack.
1209 case 'u': // Second from top of floating point stack.
1210 case 'q': // Any register accessible as [r]l: a, b, c, and d.
1211 case 'y': // Any MMX register.
1212 case 'v': // Any {X,Y,Z}MM register (Arch & context dependent)
1213 case 'x': // Any SSE register.
1214 case 'k': // Any AVX512 mask register (same as Yk, additionally allows k0
1215 // for intermideate k reg operations).
1216 case 'Q': // Any register accessible as [r]h: a, b, c, and d.
1217 case 'R': // "Legacy" registers: ax, bx, cx, dx, di, si, sp, bp.
1218 case 'l': // "Index" registers: any general register that can be used as an
1219 // index in a base+index memory access.
1220 Info.setAllowsRegister();
1221 return true;
1222 // Floating point constant constraints.
1223 case 'C': // SSE floating point constant.
1224 case 'G': // x87 floating point constant.
1225 return true;
1226 case '@':
1227 // CC condition changes.
1228 if (auto Len = matchAsmCCConstraint(Name)) {
1229 Name += Len - 1;
1230 Info.setAllowsRegister();
1231 return true;
1232 }
1233 return false;
1234 }
1235 }
1236
1237 // Below is based on the following information:
1238 // +------------------------------------+-------------------------+--------------------------------------------------------------------------------------------------------------------------------------------------------------+
1239 // | Processor Name | Cache Line Size (Bytes) | Source |
1240 // +------------------------------------+-------------------------+--------------------------------------------------------------------------------------------------------------------------------------------------------------+
1241 // | i386 | 64 | https://www.intel.com/content/dam/www/public/us/en/documents/manuals/64-ia-32-architectures-optimization-manual.pdf |
1242 // | i486 | 16 | "four doublewords" (doubleword = 32 bits, 4 bits * 32 bits = 16 bytes) https://en.wikichip.org/w/images/d/d3/i486_MICROPROCESSOR_HARDWARE_REFERENCE_MANUAL_%281990%29.pdf and http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.126.4216&rep=rep1&type=pdf (page 29) |
1243 // | i586/Pentium MMX | 32 | https://www.7-cpu.com/cpu/P-MMX.html |
1244 // | i686/Pentium | 32 | https://www.7-cpu.com/cpu/P6.html |
1245 // | Netburst/Pentium4 | 64 | https://www.7-cpu.com/cpu/P4-180.html |
1246 // | Atom | 64 | https://www.7-cpu.com/cpu/Atom.html |
1247 // | Westmere | 64 | https://en.wikichip.org/wiki/intel/microarchitectures/sandy_bridge_(client) "Cache Architecture" |
1248 // | Sandy Bridge | 64 | https://en.wikipedia.org/wiki/Sandy_Bridge and https://www.7-cpu.com/cpu/SandyBridge.html |
1249 // | Ivy Bridge | 64 | https://blog.stuffedcow.net/2013/01/ivb-cache-replacement/ and https://www.7-cpu.com/cpu/IvyBridge.html |
1250 // | Haswell | 64 | https://www.7-cpu.com/cpu/Haswell.html |
1251 // | Boadwell | 64 | https://www.7-cpu.com/cpu/Broadwell.html |
1252 // | Skylake (including skylake-avx512) | 64 | https://www.nas.nasa.gov/hecc/support/kb/skylake-processors_550.html "Cache Hierarchy" |
1253 // | Cascade Lake | 64 | https://www.nas.nasa.gov/hecc/support/kb/cascade-lake-processors_579.html "Cache Hierarchy" |
1254 // | Skylake | 64 | https://en.wikichip.org/wiki/intel/microarchitectures/kaby_lake "Memory Hierarchy" |
1255 // | Ice Lake | 64 | https://www.7-cpu.com/cpu/Ice_Lake.html |
1256 // | Knights Landing | 64 | https://software.intel.com/en-us/articles/intel-xeon-phi-processor-7200-family-memory-management-optimizations "The Intel® Xeon Phi™ Processor Architecture" |
1257 // | Knights Mill | 64 | https://software.intel.com/sites/default/files/managed/9e/bc/64-ia-32-architectures-optimization-manual.pdf?countrylabel=Colombia "2.5.5.2 L1 DCache " |
1258 // +------------------------------------+-------------------------+--------------------------------------------------------------------------------------------------------------------------------------------------------------+
getCPUCacheLineSize() const1259 Optional<unsigned> X86TargetInfo::getCPUCacheLineSize() const {
1260 using namespace llvm::X86;
1261 switch (CPU) {
1262 // i386
1263 case CK_i386:
1264 // i486
1265 case CK_i486:
1266 case CK_WinChipC6:
1267 case CK_WinChip2:
1268 case CK_C3:
1269 // Lakemont
1270 case CK_Lakemont:
1271 return 16;
1272
1273 // i586
1274 case CK_i586:
1275 case CK_Pentium:
1276 case CK_PentiumMMX:
1277 // i686
1278 case CK_PentiumPro:
1279 case CK_i686:
1280 case CK_Pentium2:
1281 case CK_Pentium3:
1282 case CK_PentiumM:
1283 case CK_C3_2:
1284 // K6
1285 case CK_K6:
1286 case CK_K6_2:
1287 case CK_K6_3:
1288 // Geode
1289 case CK_Geode:
1290 return 32;
1291
1292 // Netburst
1293 case CK_Pentium4:
1294 case CK_Prescott:
1295 case CK_Nocona:
1296 // Atom
1297 case CK_Bonnell:
1298 case CK_Silvermont:
1299 case CK_Goldmont:
1300 case CK_GoldmontPlus:
1301 case CK_Tremont:
1302
1303 case CK_Westmere:
1304 case CK_SandyBridge:
1305 case CK_IvyBridge:
1306 case CK_Haswell:
1307 case CK_Broadwell:
1308 case CK_SkylakeClient:
1309 case CK_SkylakeServer:
1310 case CK_Cascadelake:
1311 case CK_Nehalem:
1312 case CK_Cooperlake:
1313 case CK_Cannonlake:
1314 case CK_Tigerlake:
1315 case CK_SapphireRapids:
1316 case CK_IcelakeClient:
1317 case CK_IcelakeServer:
1318 case CK_Alderlake:
1319 case CK_KNL:
1320 case CK_KNM:
1321 // K7
1322 case CK_Athlon:
1323 case CK_AthlonXP:
1324 // K8
1325 case CK_K8:
1326 case CK_K8SSE3:
1327 case CK_AMDFAM10:
1328 // Bobcat
1329 case CK_BTVER1:
1330 case CK_BTVER2:
1331 // Bulldozer
1332 case CK_BDVER1:
1333 case CK_BDVER2:
1334 case CK_BDVER3:
1335 case CK_BDVER4:
1336 // Zen
1337 case CK_ZNVER1:
1338 case CK_ZNVER2:
1339 case CK_ZNVER3:
1340 // Deprecated
1341 case CK_x86_64:
1342 case CK_x86_64_v2:
1343 case CK_x86_64_v3:
1344 case CK_x86_64_v4:
1345 case CK_Yonah:
1346 case CK_Penryn:
1347 case CK_Core2:
1348 return 64;
1349
1350 // The following currently have unknown cache line sizes (but they are probably all 64):
1351 // Core
1352 case CK_None:
1353 return None;
1354 }
1355 llvm_unreachable("Unknown CPU kind");
1356 }
1357
validateOutputSize(const llvm::StringMap<bool> & FeatureMap,StringRef Constraint,unsigned Size) const1358 bool X86TargetInfo::validateOutputSize(const llvm::StringMap<bool> &FeatureMap,
1359 StringRef Constraint,
1360 unsigned Size) const {
1361 // Strip off constraint modifiers.
1362 while (Constraint[0] == '=' || Constraint[0] == '+' || Constraint[0] == '&')
1363 Constraint = Constraint.substr(1);
1364
1365 return validateOperandSize(FeatureMap, Constraint, Size);
1366 }
1367
validateInputSize(const llvm::StringMap<bool> & FeatureMap,StringRef Constraint,unsigned Size) const1368 bool X86TargetInfo::validateInputSize(const llvm::StringMap<bool> &FeatureMap,
1369 StringRef Constraint,
1370 unsigned Size) const {
1371 return validateOperandSize(FeatureMap, Constraint, Size);
1372 }
1373
validateOperandSize(const llvm::StringMap<bool> & FeatureMap,StringRef Constraint,unsigned Size) const1374 bool X86TargetInfo::validateOperandSize(const llvm::StringMap<bool> &FeatureMap,
1375 StringRef Constraint,
1376 unsigned Size) const {
1377 switch (Constraint[0]) {
1378 default:
1379 break;
1380 case 'k':
1381 // Registers k0-k7 (AVX512) size limit is 64 bit.
1382 case 'y':
1383 return Size <= 64;
1384 case 'f':
1385 case 't':
1386 case 'u':
1387 return Size <= 128;
1388 case 'Y':
1389 // 'Y' is the first character for several 2-character constraints.
1390 switch (Constraint[1]) {
1391 default:
1392 return false;
1393 case 'm':
1394 // 'Ym' is synonymous with 'y'.
1395 case 'k':
1396 return Size <= 64;
1397 case 'z':
1398 // XMM0/YMM/ZMM0
1399 if (FeatureMap.lookup("avx512f"))
1400 // ZMM0 can be used if target supports AVX512F.
1401 return Size <= 512U;
1402 else if (FeatureMap.lookup("avx"))
1403 // YMM0 can be used if target supports AVX.
1404 return Size <= 256U;
1405 else if (FeatureMap.lookup("sse"))
1406 return Size <= 128U;
1407 return false;
1408 case 'i':
1409 case 't':
1410 case '2':
1411 // 'Yi','Yt','Y2' are synonymous with 'x' when SSE2 is enabled.
1412 if (SSELevel < SSE2)
1413 return false;
1414 break;
1415 }
1416 break;
1417 case 'v':
1418 case 'x':
1419 if (FeatureMap.lookup("avx512f"))
1420 // 512-bit zmm registers can be used if target supports AVX512F.
1421 return Size <= 512U;
1422 else if (FeatureMap.lookup("avx"))
1423 // 256-bit ymm registers can be used if target supports AVX.
1424 return Size <= 256U;
1425 return Size <= 128U;
1426
1427 }
1428
1429 return true;
1430 }
1431
convertConstraint(const char * & Constraint) const1432 std::string X86TargetInfo::convertConstraint(const char *&Constraint) const {
1433 switch (*Constraint) {
1434 case '@':
1435 if (auto Len = matchAsmCCConstraint(Constraint)) {
1436 std::string Converted = "{" + std::string(Constraint, Len) + "}";
1437 Constraint += Len - 1;
1438 return Converted;
1439 }
1440 return std::string(1, *Constraint);
1441 case 'a':
1442 return std::string("{ax}");
1443 case 'b':
1444 return std::string("{bx}");
1445 case 'c':
1446 return std::string("{cx}");
1447 case 'd':
1448 return std::string("{dx}");
1449 case 'S':
1450 return std::string("{si}");
1451 case 'D':
1452 return std::string("{di}");
1453 case 'p': // address
1454 return std::string("im");
1455 case 't': // top of floating point stack.
1456 return std::string("{st}");
1457 case 'u': // second from top of floating point stack.
1458 return std::string("{st(1)}"); // second from top of floating point stack.
1459 case 'Y':
1460 switch (Constraint[1]) {
1461 default:
1462 // Break from inner switch and fall through (copy single char),
1463 // continue parsing after copying the current constraint into
1464 // the return string.
1465 break;
1466 case 'k':
1467 case 'm':
1468 case 'i':
1469 case 't':
1470 case 'z':
1471 case '2':
1472 // "^" hints llvm that this is a 2 letter constraint.
1473 // "Constraint++" is used to promote the string iterator
1474 // to the next constraint.
1475 return std::string("^") + std::string(Constraint++, 2);
1476 }
1477 LLVM_FALLTHROUGH;
1478 default:
1479 return std::string(1, *Constraint);
1480 }
1481 }
1482
fillValidCPUList(SmallVectorImpl<StringRef> & Values) const1483 void X86TargetInfo::fillValidCPUList(SmallVectorImpl<StringRef> &Values) const {
1484 bool Only64Bit = getTriple().getArch() != llvm::Triple::x86;
1485 llvm::X86::fillValidCPUArchList(Values, Only64Bit);
1486 }
1487
fillValidTuneCPUList(SmallVectorImpl<StringRef> & Values) const1488 void X86TargetInfo::fillValidTuneCPUList(SmallVectorImpl<StringRef> &Values) const {
1489 llvm::X86::fillValidTuneCPUList(Values);
1490 }
1491
getGCCRegNames() const1492 ArrayRef<const char *> X86TargetInfo::getGCCRegNames() const {
1493 return llvm::makeArrayRef(GCCRegNames);
1494 }
1495
getGCCAddlRegNames() const1496 ArrayRef<TargetInfo::AddlRegName> X86TargetInfo::getGCCAddlRegNames() const {
1497 return llvm::makeArrayRef(AddlRegNames);
1498 }
1499
getTargetBuiltins() const1500 ArrayRef<Builtin::Info> X86_32TargetInfo::getTargetBuiltins() const {
1501 return llvm::makeArrayRef(BuiltinInfoX86, clang::X86::LastX86CommonBuiltin -
1502 Builtin::FirstTSBuiltin + 1);
1503 }
1504
getTargetBuiltins() const1505 ArrayRef<Builtin::Info> X86_64TargetInfo::getTargetBuiltins() const {
1506 return llvm::makeArrayRef(BuiltinInfoX86,
1507 X86::LastTSBuiltin - Builtin::FirstTSBuiltin);
1508 }
1509