1 //===-- X86.td - Target definition file for the Intel X86 --*- tablegen -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This is a target description file for the Intel i386 architecture, referred
10 // to here as the "X86" architecture.
12 //===----------------------------------------------------------------------===//
14 // Get the target-independent interfaces which we are implementing...
16 include "llvm/Target/Target.td"
18 //===----------------------------------------------------------------------===//
19 // X86 Subtarget state
22 def Mode64Bit : SubtargetFeature<"64bit-mode", "In64BitMode", "true",
23 "64-bit mode (x86_64)">;
24 def Mode32Bit : SubtargetFeature<"32bit-mode", "In32BitMode", "true",
25 "32-bit mode (80386)">;
26 def Mode16Bit : SubtargetFeature<"16bit-mode", "In16BitMode", "true",
27 "16-bit mode (i8086)">;
29 //===----------------------------------------------------------------------===//
30 // X86 Subtarget features
31 //===----------------------------------------------------------------------===//
33 def FeatureX87 : SubtargetFeature<"x87","HasX87", "true",
34 "Enable X87 float instructions">;
36 def FeatureNOPL : SubtargetFeature<"nopl", "HasNOPL", "true",
37 "Enable NOPL instruction">;
39 def FeatureCMOV : SubtargetFeature<"cmov","HasCMov", "true",
40 "Enable conditional move instructions">;
42 def FeatureCMPXCHG8B : SubtargetFeature<"cx8", "HasCmpxchg8b", "true",
43 "Support CMPXCHG8B instructions">;
45 def FeaturePOPCNT : SubtargetFeature<"popcnt", "HasPOPCNT", "true",
46 "Support POPCNT instruction">;
48 def FeatureFXSR : SubtargetFeature<"fxsr", "HasFXSR", "true",
49 "Support fxsave/fxrestore instructions">;
51 def FeatureXSAVE : SubtargetFeature<"xsave", "HasXSAVE", "true",
52 "Support xsave instructions">;
54 def FeatureXSAVEOPT: SubtargetFeature<"xsaveopt", "HasXSAVEOPT", "true",
55 "Support xsaveopt instructions">;
57 def FeatureXSAVEC : SubtargetFeature<"xsavec", "HasXSAVEC", "true",
58 "Support xsavec instructions">;
60 def FeatureXSAVES : SubtargetFeature<"xsaves", "HasXSAVES", "true",
61 "Support xsaves instructions">;
63 def FeatureSSE1 : SubtargetFeature<"sse", "X86SSELevel", "SSE1",
64 "Enable SSE instructions">;
65 def FeatureSSE2 : SubtargetFeature<"sse2", "X86SSELevel", "SSE2",
66 "Enable SSE2 instructions",
68 def FeatureSSE3 : SubtargetFeature<"sse3", "X86SSELevel", "SSE3",
69 "Enable SSE3 instructions",
71 def FeatureSSSE3 : SubtargetFeature<"ssse3", "X86SSELevel", "SSSE3",
72 "Enable SSSE3 instructions",
74 def FeatureSSE41 : SubtargetFeature<"sse4.1", "X86SSELevel", "SSE41",
75 "Enable SSE 4.1 instructions",
77 def FeatureSSE42 : SubtargetFeature<"sse4.2", "X86SSELevel", "SSE42",
78 "Enable SSE 4.2 instructions",
80 // The MMX subtarget feature is separate from the rest of the SSE features
81 // because it's important (for odd compatibility reasons) to be able to
82 // turn it off explicitly while allowing SSE+ to be on.
83 def FeatureMMX : SubtargetFeature<"mmx","X863DNowLevel", "MMX",
84 "Enable MMX instructions">;
85 def Feature3DNow : SubtargetFeature<"3dnow", "X863DNowLevel", "ThreeDNow",
86 "Enable 3DNow! instructions",
88 def Feature3DNowA : SubtargetFeature<"3dnowa", "X863DNowLevel", "ThreeDNowA",
89 "Enable 3DNow! Athlon instructions",
91 // All x86-64 hardware has SSE2, but we don't mark SSE2 as an implied
92 // feature, because SSE2 can be disabled (e.g. for compiling OS kernels)
93 // without disabling 64-bit mode. Nothing should imply this feature bit. It
94 // is used to enforce that only 64-bit capable CPUs are used in 64-bit mode.
95 def Feature64Bit : SubtargetFeature<"64bit", "HasX86_64", "true",
96 "Support 64-bit instructions">;
97 def FeatureCMPXCHG16B : SubtargetFeature<"cx16", "HasCmpxchg16b", "true",
98 "64-bit with cmpxchg16b",
100 def FeatureSlowSHLD : SubtargetFeature<"slow-shld", "IsSHLDSlow", "true",
101 "SHLD instruction is slow">;
102 def FeatureSlowPMULLD : SubtargetFeature<"slow-pmulld", "IsPMULLDSlow", "true",
103 "PMULLD instruction is slow">;
104 def FeatureSlowPMADDWD : SubtargetFeature<"slow-pmaddwd", "IsPMADDWDSlow",
106 "PMADDWD is slower than PMULLD">;
107 // FIXME: This should not apply to CPUs that do not have SSE.
108 def FeatureSlowUAMem16 : SubtargetFeature<"slow-unaligned-mem-16",
109 "IsUAMem16Slow", "true",
110 "Slow unaligned 16-byte memory access">;
111 def FeatureSlowUAMem32 : SubtargetFeature<"slow-unaligned-mem-32",
112 "IsUAMem32Slow", "true",
113 "Slow unaligned 32-byte memory access">;
114 def FeatureSSE4A : SubtargetFeature<"sse4a", "HasSSE4A", "true",
115 "Support SSE 4a instructions",
118 def FeatureAVX : SubtargetFeature<"avx", "X86SSELevel", "AVX",
119 "Enable AVX instructions",
121 def FeatureAVX2 : SubtargetFeature<"avx2", "X86SSELevel", "AVX2",
122 "Enable AVX2 instructions",
124 def FeatureFMA : SubtargetFeature<"fma", "HasFMA", "true",
125 "Enable three-operand fused multiple-add",
127 def FeatureF16C : SubtargetFeature<"f16c", "HasF16C", "true",
128 "Support 16-bit floating point conversion instructions",
130 def FeatureAVX512 : SubtargetFeature<"avx512f", "X86SSELevel", "AVX512F",
131 "Enable AVX-512 instructions",
132 [FeatureAVX2, FeatureFMA, FeatureF16C]>;
133 def FeatureERI : SubtargetFeature<"avx512er", "HasERI", "true",
134 "Enable AVX-512 Exponential and Reciprocal Instructions",
136 def FeatureCDI : SubtargetFeature<"avx512cd", "HasCDI", "true",
137 "Enable AVX-512 Conflict Detection Instructions",
139 def FeatureVPOPCNTDQ : SubtargetFeature<"avx512vpopcntdq", "HasVPOPCNTDQ",
140 "true", "Enable AVX-512 Population Count Instructions",
142 def FeaturePFI : SubtargetFeature<"avx512pf", "HasPFI", "true",
143 "Enable AVX-512 PreFetch Instructions",
145 def FeaturePREFETCHWT1 : SubtargetFeature<"prefetchwt1", "HasPREFETCHWT1",
147 "Prefetch with Intent to Write and T1 Hint">;
148 def FeatureDQI : SubtargetFeature<"avx512dq", "HasDQI", "true",
149 "Enable AVX-512 Doubleword and Quadword Instructions",
151 def FeatureBWI : SubtargetFeature<"avx512bw", "HasBWI", "true",
152 "Enable AVX-512 Byte and Word Instructions",
154 def FeatureVLX : SubtargetFeature<"avx512vl", "HasVLX", "true",
155 "Enable AVX-512 Vector Length eXtensions",
157 def FeatureVBMI : SubtargetFeature<"avx512vbmi", "HasVBMI", "true",
158 "Enable AVX-512 Vector Byte Manipulation Instructions",
160 def FeatureVBMI2 : SubtargetFeature<"avx512vbmi2", "HasVBMI2", "true",
161 "Enable AVX-512 further Vector Byte Manipulation Instructions",
163 def FeatureIFMA : SubtargetFeature<"avx512ifma", "HasIFMA", "true",
164 "Enable AVX-512 Integer Fused Multiple-Add",
166 def FeaturePKU : SubtargetFeature<"pku", "HasPKU", "true",
167 "Enable protection keys">;
168 def FeatureVNNI : SubtargetFeature<"avx512vnni", "HasVNNI", "true",
169 "Enable AVX-512 Vector Neural Network Instructions",
171 def FeatureBF16 : SubtargetFeature<"avx512bf16", "HasBF16", "true",
172 "Support bfloat16 floating point",
174 def FeatureBITALG : SubtargetFeature<"avx512bitalg", "HasBITALG", "true",
175 "Enable AVX-512 Bit Algorithms",
177 def FeatureVP2INTERSECT : SubtargetFeature<"avx512vp2intersect",
178 "HasVP2INTERSECT", "true",
179 "Enable AVX-512 vp2intersect",
181 def FeaturePCLMUL : SubtargetFeature<"pclmul", "HasPCLMUL", "true",
182 "Enable packed carry-less multiplication instructions",
184 def FeatureGFNI : SubtargetFeature<"gfni", "HasGFNI", "true",
185 "Enable Galois Field Arithmetic Instructions",
187 def FeatureVPCLMULQDQ : SubtargetFeature<"vpclmulqdq", "HasVPCLMULQDQ", "true",
188 "Enable vpclmulqdq instructions",
189 [FeatureAVX, FeaturePCLMUL]>;
190 def FeatureFMA4 : SubtargetFeature<"fma4", "HasFMA4", "true",
191 "Enable four-operand fused multiple-add",
192 [FeatureAVX, FeatureSSE4A]>;
193 def FeatureXOP : SubtargetFeature<"xop", "HasXOP", "true",
194 "Enable XOP instructions",
196 def FeatureSSEUnalignedMem : SubtargetFeature<"sse-unaligned-mem",
197 "HasSSEUnalignedMem", "true",
198 "Allow unaligned memory operands with SSE instructions">;
199 def FeatureAES : SubtargetFeature<"aes", "HasAES", "true",
200 "Enable AES instructions",
202 def FeatureVAES : SubtargetFeature<"vaes", "HasVAES", "true",
203 "Promote selected AES instructions to AVX512/AVX registers",
204 [FeatureAVX, FeatureAES]>;
205 def FeatureTBM : SubtargetFeature<"tbm", "HasTBM", "true",
206 "Enable TBM instructions">;
207 def FeatureLWP : SubtargetFeature<"lwp", "HasLWP", "true",
208 "Enable LWP instructions">;
209 def FeatureMOVBE : SubtargetFeature<"movbe", "HasMOVBE", "true",
210 "Support MOVBE instruction">;
211 def FeatureRDRAND : SubtargetFeature<"rdrnd", "HasRDRAND", "true",
212 "Support RDRAND instruction">;
213 def FeatureFSGSBase : SubtargetFeature<"fsgsbase", "HasFSGSBase", "true",
214 "Support FS/GS Base instructions">;
215 def FeatureLZCNT : SubtargetFeature<"lzcnt", "HasLZCNT", "true",
216 "Support LZCNT instruction">;
217 def FeatureBMI : SubtargetFeature<"bmi", "HasBMI", "true",
218 "Support BMI instructions">;
219 def FeatureBMI2 : SubtargetFeature<"bmi2", "HasBMI2", "true",
220 "Support BMI2 instructions">;
221 def FeatureRTM : SubtargetFeature<"rtm", "HasRTM", "true",
222 "Support RTM instructions">;
223 def FeatureADX : SubtargetFeature<"adx", "HasADX", "true",
224 "Support ADX instructions">;
225 def FeatureSHA : SubtargetFeature<"sha", "HasSHA", "true",
226 "Enable SHA instructions",
228 def FeatureSHSTK : SubtargetFeature<"shstk", "HasSHSTK", "true",
229 "Support CET Shadow-Stack instructions">;
230 def FeaturePRFCHW : SubtargetFeature<"prfchw", "HasPRFCHW", "true",
231 "Support PRFCHW instructions">;
232 def FeatureRDSEED : SubtargetFeature<"rdseed", "HasRDSEED", "true",
233 "Support RDSEED instruction">;
234 def FeatureLAHFSAHF : SubtargetFeature<"sahf", "HasLAHFSAHF", "true",
235 "Support LAHF and SAHF instructions">;
236 def FeatureMWAITX : SubtargetFeature<"mwaitx", "HasMWAITX", "true",
237 "Enable MONITORX/MWAITX timer functionality">;
238 def FeatureCLZERO : SubtargetFeature<"clzero", "HasCLZERO", "true",
239 "Enable Cache Line Zero">;
240 def FeatureCLDEMOTE : SubtargetFeature<"cldemote", "HasCLDEMOTE", "true",
241 "Enable Cache Demote">;
242 def FeaturePTWRITE : SubtargetFeature<"ptwrite", "HasPTWRITE", "true",
243 "Support ptwrite instruction">;
244 // FIXME: This feature is deprecated in 10.0 and should not be used for
245 // anything, but removing it would break IR files that may contain it in a
246 // target-feature attribute.
247 def FeatureDeprecatedMPX : SubtargetFeature<"mpx", "DeprecatedHasMPX", "false",
248 "Deprecated. Support MPX instructions">;
249 def FeatureLEAForSP : SubtargetFeature<"lea-sp", "UseLeaForSP", "true",
250 "Use LEA for adjusting the stack pointer">;
251 def FeatureSlowDivide32 : SubtargetFeature<"idivl-to-divb",
252 "HasSlowDivide32", "true",
253 "Use 8-bit divide for positive values less than 256">;
254 def FeatureSlowDivide64 : SubtargetFeature<"idivq-to-divl",
255 "HasSlowDivide64", "true",
256 "Use 32-bit divide for positive values less than 2^32">;
257 def FeaturePadShortFunctions : SubtargetFeature<"pad-short-functions",
258 "PadShortFunctions", "true",
259 "Pad short functions">;
260 def FeatureINVPCID : SubtargetFeature<"invpcid", "HasINVPCID", "true",
261 "Invalidate Process-Context Identifier">;
262 def FeatureSGX : SubtargetFeature<"sgx", "HasSGX", "true",
263 "Enable Software Guard Extensions">;
264 def FeatureCLFLUSHOPT : SubtargetFeature<"clflushopt", "HasCLFLUSHOPT", "true",
265 "Flush A Cache Line Optimized">;
266 def FeatureCLWB : SubtargetFeature<"clwb", "HasCLWB", "true",
267 "Cache Line Write Back">;
268 def FeatureWBNOINVD : SubtargetFeature<"wbnoinvd", "HasWBNOINVD", "true",
269 "Write Back No Invalidate">;
270 def FeatureRDPID : SubtargetFeature<"rdpid", "HasRDPID", "true",
271 "Support RDPID instructions">;
272 def FeatureWAITPKG : SubtargetFeature<"waitpkg", "HasWAITPKG", "true",
273 "Wait and pause enhancements">;
274 def FeatureENQCMD : SubtargetFeature<"enqcmd", "HasENQCMD", "true",
275 "Has ENQCMD instructions">;
276 // On some processors, instructions that implicitly take two memory operands are
277 // slow. In practice, this means that CALL, PUSH, and POP with memory operands
278 // should be avoided in favor of a MOV + register CALL/PUSH/POP.
279 def FeatureSlowTwoMemOps : SubtargetFeature<"slow-two-mem-ops",
280 "SlowTwoMemOps", "true",
281 "Two memory operand instructions are slow">;
282 def FeatureLEAUsesAG : SubtargetFeature<"lea-uses-ag", "LEAUsesAG", "true",
283 "LEA instruction needs inputs at AG stage">;
284 def FeatureSlowLEA : SubtargetFeature<"slow-lea", "SlowLEA", "true",
285 "LEA instruction with certain arguments is slow">;
286 def FeatureSlow3OpsLEA : SubtargetFeature<"slow-3ops-lea", "Slow3OpsLEA", "true",
287 "LEA instruction with 3 ops or certain registers is slow">;
288 def FeatureSlowIncDec : SubtargetFeature<"slow-incdec", "SlowIncDec", "true",
289 "INC and DEC instructions are slower than ADD and SUB">;
291 : SubtargetFeature<"soft-float", "UseSoftFloat", "true",
292 "Use software floating point features">;
293 def FeaturePOPCNTFalseDeps : SubtargetFeature<"false-deps-popcnt",
294 "HasPOPCNTFalseDeps", "true",
295 "POPCNT has a false dependency on dest register">;
296 def FeatureLZCNTFalseDeps : SubtargetFeature<"false-deps-lzcnt-tzcnt",
297 "HasLZCNTFalseDeps", "true",
298 "LZCNT/TZCNT have a false dependency on dest register">;
299 def FeaturePCONFIG : SubtargetFeature<"pconfig", "HasPCONFIG", "true",
300 "platform configuration instruction">;
301 // On recent X86 (port bound) processors, its preferable to combine to a single shuffle
302 // using a variable mask over multiple fixed shuffles.
303 def FeatureFastVariableShuffle
304 : SubtargetFeature<"fast-variable-shuffle",
305 "HasFastVariableShuffle",
306 "true", "Shuffles with variable masks are fast">;
307 // On some X86 processors, there is no performance hazard to writing only the
308 // lower parts of a YMM or ZMM register without clearing the upper part.
309 def FeatureFastPartialYMMorZMMWrite
310 : SubtargetFeature<"fast-partial-ymm-or-zmm-write",
311 "HasFastPartialYMMorZMMWrite",
312 "true", "Partial writes to YMM/ZMM registers are fast">;
313 // FeatureFastScalarFSQRT should be enabled if scalar FSQRT has shorter latency
314 // than the corresponding NR code. FeatureFastVectorFSQRT should be enabled if
315 // vector FSQRT has higher throughput than the corresponding NR code.
316 // The idea is that throughput bound code is likely to be vectorized, so for
317 // vectorized code we should care about the throughput of SQRT operations.
318 // But if the code is scalar that probably means that the code has some kind of
319 // dependency and we should care more about reducing the latency.
320 def FeatureFastScalarFSQRT
321 : SubtargetFeature<"fast-scalar-fsqrt", "HasFastScalarFSQRT",
322 "true", "Scalar SQRT is fast (disable Newton-Raphson)">;
323 def FeatureFastVectorFSQRT
324 : SubtargetFeature<"fast-vector-fsqrt", "HasFastVectorFSQRT",
325 "true", "Vector SQRT is fast (disable Newton-Raphson)">;
326 // If lzcnt has equivalent latency/throughput to most simple integer ops, it can
327 // be used to replace test/set sequences.
330 "fast-lzcnt", "HasFastLZCNT", "true",
331 "LZCNT instructions are as fast as most simple integer ops">;
332 // If the target can efficiently decode NOPs upto 11-bytes in length.
333 def FeatureFast11ByteNOP
335 "fast-11bytenop", "HasFast11ByteNOP", "true",
336 "Target can quickly decode up to 11 byte NOPs">;
337 // If the target can efficiently decode NOPs upto 15-bytes in length.
338 def FeatureFast15ByteNOP
340 "fast-15bytenop", "HasFast15ByteNOP", "true",
341 "Target can quickly decode up to 15 byte NOPs">;
342 // Sandy Bridge and newer processors can use SHLD with the same source on both
343 // inputs to implement rotate to avoid the partial flag update of the normal
344 // rotate instructions.
345 def FeatureFastSHLDRotate
347 "fast-shld-rotate", "HasFastSHLDRotate", "true",
348 "SHLD can be used as a faster rotate">;
350 // Ivy Bridge and newer processors have enhanced REP MOVSB and STOSB (aka
351 // "string operations"). See "REP String Enhancement" in the Intel Software
352 // Development Manual. This feature essentially means that REP MOVSB will copy
353 // using the largest available size instead of copying bytes one by one, making
354 // it at least as fast as REPMOVS{W,D,Q}.
357 "ermsb", "HasERMSB", "true",
358 "REP MOVS/STOS are fast">;
360 // Bulldozer and newer processors can merge CMP/TEST (but not other
361 // instructions) with conditional branches.
362 def FeatureBranchFusion
363 : SubtargetFeature<"branchfusion", "HasBranchFusion", "true",
364 "CMP/TEST can be fused with conditional branches">;
366 // Sandy Bridge and newer processors have many instructions that can be
367 // fused with conditional branches and pass through the CPU as a single
369 def FeatureMacroFusion
370 : SubtargetFeature<"macrofusion", "HasMacroFusion", "true",
371 "Various instructions can be fused with conditional branches">;
373 // Gather is available since Haswell (AVX2 set). So technically, we can
374 // generate Gathers on all AVX2 processors. But the overhead on HSW is high.
375 // Skylake Client processor has faster Gathers than HSW and performance is
376 // similar to Skylake Server (AVX-512).
377 def FeatureHasFastGather
378 : SubtargetFeature<"fast-gather", "HasFastGather", "true",
379 "Indicates if gather is reasonably fast">;
381 def FeaturePrefer128Bit
382 : SubtargetFeature<"prefer-128-bit", "Prefer128Bit", "true",
383 "Prefer 128-bit AVX instructions">;
385 def FeaturePrefer256Bit
386 : SubtargetFeature<"prefer-256-bit", "Prefer256Bit", "true",
387 "Prefer 256-bit AVX instructions">;
389 // Lower indirect calls using a special construct called a `retpoline` to
390 // mitigate potential Spectre v2 attacks against them.
391 def FeatureRetpolineIndirectCalls
393 "retpoline-indirect-calls", "UseRetpolineIndirectCalls", "true",
394 "Remove speculation of indirect calls from the generated code">;
396 // Lower indirect branches and switches either using conditional branch trees
397 // or using a special construct called a `retpoline` to mitigate potential
398 // Spectre v2 attacks against them.
399 def FeatureRetpolineIndirectBranches
401 "retpoline-indirect-branches", "UseRetpolineIndirectBranches", "true",
402 "Remove speculation of indirect branches from the generated code">;
404 // Deprecated umbrella feature for enabling both `retpoline-indirect-calls` and
405 // `retpoline-indirect-branches` above.
407 : SubtargetFeature<"retpoline", "DeprecatedUseRetpoline", "true",
408 "Remove speculation of indirect branches from the "
409 "generated code, either by avoiding them entirely or "
410 "lowering them with a speculation blocking construct",
411 [FeatureRetpolineIndirectCalls,
412 FeatureRetpolineIndirectBranches]>;
414 // Rely on external thunks for the emitted retpoline calls. This allows users
415 // to provide their own custom thunk definitions in highly specialized
416 // environments such as a kernel that does boot-time hot patching.
417 def FeatureRetpolineExternalThunk
419 "retpoline-external-thunk", "UseRetpolineExternalThunk", "true",
420 "When lowering an indirect call or branch using a `retpoline`, rely "
421 "on the specified user provided thunk rather than emitting one "
422 "ourselves. Only has effect when combined with some other retpoline "
423 "feature", [FeatureRetpolineIndirectCalls]>;
425 // Direct Move instructions.
426 def FeatureMOVDIRI : SubtargetFeature<"movdiri", "HasMOVDIRI", "true",
427 "Support movdiri instruction">;
428 def FeatureMOVDIR64B : SubtargetFeature<"movdir64b", "HasMOVDIR64B", "true",
429 "Support movdir64b instruction">;
431 def FeatureFastBEXTR : SubtargetFeature<"fast-bextr", "HasFastBEXTR", "true",
432 "Indicates that the BEXTR instruction is implemented as a single uop "
433 "with good throughput">;
435 // Combine vector math operations with shuffles into horizontal math
436 // instructions if a CPU implements horizontal operations (introduced with
437 // SSE3) with better latency/throughput than the alternative sequence.
438 def FeatureFastHorizontalOps
440 "fast-hops", "HasFastHorizontalOps", "true",
441 "Prefer horizontal vector math instructions (haddp, phsub, etc.) over "
442 "normal vector instructions with shuffles", [FeatureSSE3]>;
444 def FeatureFastScalarShiftMasks
446 "fast-scalar-shift-masks", "HasFastScalarShiftMasks", "true",
447 "Prefer a left/right scalar logical shift pair over a shift+and pair">;
449 def FeatureFastVectorShiftMasks
451 "fast-vector-shift-masks", "HasFastVectorShiftMasks", "true",
452 "Prefer a left/right vector logical shift pair over a shift+and pair">;
454 // Merge branches using three-way conditional code.
455 def FeatureMergeToThreeWayBranch : SubtargetFeature<"merge-to-threeway-branch",
456 "ThreewayBranchProfitable", "true",
457 "Merge branches to a three-way "
458 "conditional branch">;
460 // Enable use of alias analysis during code generation.
461 def FeatureUseAA : SubtargetFeature<"use-aa", "UseAA", "true",
462 "Use alias analysis during codegen">;
465 def ProcIntelAtom : SubtargetFeature<"", "X86ProcFamily", "IntelAtom", "">;
467 def ProcIntelSLM : SubtargetFeature<"", "X86ProcFamily", "IntelSLM", "">;
469 def ProcIntelGLM : SubtargetFeature<"", "X86ProcFamily", "IntelGLM", "">;
471 def ProcIntelGLP : SubtargetFeature<"", "X86ProcFamily", "IntelGLP", "">;
473 def ProcIntelTRM : SubtargetFeature<"", "X86ProcFamily", "IntelTRM", "">;
475 //===----------------------------------------------------------------------===//
476 // Register File Description
477 //===----------------------------------------------------------------------===//
479 include "X86RegisterInfo.td"
480 include "X86RegisterBanks.td"
482 //===----------------------------------------------------------------------===//
483 // Instruction Descriptions
484 //===----------------------------------------------------------------------===//
486 include "X86Schedule.td"
487 include "X86InstrInfo.td"
488 include "X86SchedPredicates.td"
490 def X86InstrInfo : InstrInfo;
492 //===----------------------------------------------------------------------===//
493 // X86 Scheduler Models
494 //===----------------------------------------------------------------------===//
496 include "X86ScheduleAtom.td"
497 include "X86SchedSandyBridge.td"
498 include "X86SchedHaswell.td"
499 include "X86SchedBroadwell.td"
500 include "X86ScheduleSLM.td"
501 include "X86ScheduleZnver1.td"
502 include "X86ScheduleBdVer2.td"
503 include "X86ScheduleBtVer2.td"
504 include "X86SchedSkylakeClient.td"
505 include "X86SchedSkylakeServer.td"
507 //===----------------------------------------------------------------------===//
508 // X86 Processor Feature Lists
509 //===----------------------------------------------------------------------===//
511 def ProcessorFeatures {
513 list<SubtargetFeature> NHMInheritableFeatures = [FeatureX87,
525 list<SubtargetFeature> NHMSpecificFeatures = [];
526 list<SubtargetFeature> NHMFeatures =
527 !listconcat(NHMInheritableFeatures, NHMSpecificFeatures);
530 list<SubtargetFeature> WSMAdditionalFeatures = [FeaturePCLMUL];
531 list<SubtargetFeature> WSMSpecificFeatures = [];
532 list<SubtargetFeature> WSMInheritableFeatures =
533 !listconcat(NHMInheritableFeatures, WSMAdditionalFeatures);
534 list<SubtargetFeature> WSMFeatures =
535 !listconcat(WSMInheritableFeatures, WSMSpecificFeatures);
538 list<SubtargetFeature> SNBAdditionalFeatures = [FeatureAVX,
543 FeatureFastScalarFSQRT,
544 FeatureFastSHLDRotate,
545 FeatureMergeToThreeWayBranch];
546 list<SubtargetFeature> SNBSpecificFeatures = [FeatureSlowUAMem32,
547 FeaturePOPCNTFalseDeps];
548 list<SubtargetFeature> SNBInheritableFeatures =
549 !listconcat(WSMInheritableFeatures, SNBAdditionalFeatures);
550 list<SubtargetFeature> SNBFeatures =
551 !listconcat(SNBInheritableFeatures, SNBSpecificFeatures);
554 list<SubtargetFeature> IVBAdditionalFeatures = [FeatureRDRAND,
557 list<SubtargetFeature> IVBSpecificFeatures = [FeatureSlowUAMem32,
558 FeaturePOPCNTFalseDeps];
559 list<SubtargetFeature> IVBInheritableFeatures =
560 !listconcat(SNBInheritableFeatures, IVBAdditionalFeatures);
561 list<SubtargetFeature> IVBFeatures =
562 !listconcat(IVBInheritableFeatures, IVBSpecificFeatures);
565 list<SubtargetFeature> HSWAdditionalFeatures = [FeatureAVX2,
573 FeatureFastVariableShuffle];
574 list<SubtargetFeature> HSWSpecificFeatures = [FeaturePOPCNTFalseDeps,
575 FeatureLZCNTFalseDeps];
576 list<SubtargetFeature> HSWInheritableFeatures =
577 !listconcat(IVBInheritableFeatures, HSWAdditionalFeatures);
578 list<SubtargetFeature> HSWFeatures =
579 !listconcat(HSWInheritableFeatures, HSWSpecificFeatures);
582 list<SubtargetFeature> BDWAdditionalFeatures = [FeatureADX,
585 list<SubtargetFeature> BDWSpecificFeatures = [FeaturePOPCNTFalseDeps,
586 FeatureLZCNTFalseDeps];
587 list<SubtargetFeature> BDWInheritableFeatures =
588 !listconcat(HSWInheritableFeatures, BDWAdditionalFeatures);
589 list<SubtargetFeature> BDWFeatures =
590 !listconcat(BDWInheritableFeatures, BDWSpecificFeatures);
593 list<SubtargetFeature> SKLAdditionalFeatures = [FeatureAES,
597 FeatureFastVectorFSQRT];
598 list<SubtargetFeature> SKLSpecificFeatures = [FeatureHasFastGather,
599 FeaturePOPCNTFalseDeps,
601 list<SubtargetFeature> SKLInheritableFeatures =
602 !listconcat(BDWInheritableFeatures, SKLAdditionalFeatures);
603 list<SubtargetFeature> SKLFeatures =
604 !listconcat(SKLInheritableFeatures, SKLSpecificFeatures);
607 list<SubtargetFeature> SKXAdditionalFeatures = [FeatureAVX512,
615 list<SubtargetFeature> SKXSpecificFeatures = [FeatureHasFastGather,
616 FeaturePOPCNTFalseDeps];
617 list<SubtargetFeature> SKXInheritableFeatures =
618 !listconcat(SKLInheritableFeatures, SKXAdditionalFeatures);
619 list<SubtargetFeature> SKXFeatures =
620 !listconcat(SKXInheritableFeatures, SKXSpecificFeatures);
623 list<SubtargetFeature> CLXAdditionalFeatures = [FeatureVNNI];
624 list<SubtargetFeature> CLXSpecificFeatures = [FeatureHasFastGather,
625 FeaturePOPCNTFalseDeps];
626 list<SubtargetFeature> CLXInheritableFeatures =
627 !listconcat(SKXInheritableFeatures, CLXAdditionalFeatures);
628 list<SubtargetFeature> CLXFeatures =
629 !listconcat(CLXInheritableFeatures, CLXSpecificFeatures);
632 list<SubtargetFeature> CPXAdditionalFeatures = [FeatureBF16];
633 list<SubtargetFeature> CPXSpecificFeatures = [FeatureHasFastGather,
634 FeaturePOPCNTFalseDeps];
635 list<SubtargetFeature> CPXInheritableFeatures =
636 !listconcat(CLXInheritableFeatures, CPXAdditionalFeatures);
637 list<SubtargetFeature> CPXFeatures =
638 !listconcat(CPXInheritableFeatures, CPXSpecificFeatures);
641 list<SubtargetFeature> CNLAdditionalFeatures = [FeatureAVX512,
652 list<SubtargetFeature> CNLSpecificFeatures = [FeatureHasFastGather];
653 list<SubtargetFeature> CNLInheritableFeatures =
654 !listconcat(SKLInheritableFeatures, CNLAdditionalFeatures);
655 list<SubtargetFeature> CNLFeatures =
656 !listconcat(CNLInheritableFeatures, CNLSpecificFeatures);
659 list<SubtargetFeature> ICLAdditionalFeatures = [FeatureBITALG,
668 list<SubtargetFeature> ICLSpecificFeatures = [FeatureHasFastGather];
669 list<SubtargetFeature> ICLInheritableFeatures =
670 !listconcat(CNLInheritableFeatures, ICLAdditionalFeatures);
671 list<SubtargetFeature> ICLFeatures =
672 !listconcat(ICLInheritableFeatures, ICLSpecificFeatures);
675 list<SubtargetFeature> ICXSpecificFeatures = [FeaturePCONFIG,
677 FeatureHasFastGather];
678 list<SubtargetFeature> ICXFeatures =
679 !listconcat(ICLInheritableFeatures, ICXSpecificFeatures);
682 list<SubtargetFeature> TGLAdditionalFeatures = [FeatureVP2INTERSECT,
686 list<SubtargetFeature> TGLSpecificFeatures = [FeatureHasFastGather];
687 list<SubtargetFeature> TGLInheritableFeatures =
688 !listconcat(TGLAdditionalFeatures ,TGLSpecificFeatures);
689 list<SubtargetFeature> TGLFeatures =
690 !listconcat(ICLFeatures, TGLInheritableFeatures );
693 list<SubtargetFeature> AtomInheritableFeatures = [FeatureX87,
703 FeatureSlowTwoMemOps,
705 list<SubtargetFeature> AtomSpecificFeatures = [ProcIntelAtom,
711 FeaturePadShortFunctions];
712 list<SubtargetFeature> AtomFeatures =
713 !listconcat(AtomInheritableFeatures, AtomSpecificFeatures);
716 list<SubtargetFeature> SLMAdditionalFeatures = [FeatureSSE42,
723 list<SubtargetFeature> SLMSpecificFeatures = [ProcIntelSLM,
726 FeaturePOPCNTFalseDeps];
727 list<SubtargetFeature> SLMInheritableFeatures =
728 !listconcat(AtomInheritableFeatures, SLMAdditionalFeatures);
729 list<SubtargetFeature> SLMFeatures =
730 !listconcat(SLMInheritableFeatures, SLMSpecificFeatures);
733 list<SubtargetFeature> GLMAdditionalFeatures = [FeatureAES,
742 list<SubtargetFeature> GLMSpecificFeatures = [ProcIntelGLM,
743 FeaturePOPCNTFalseDeps];
744 list<SubtargetFeature> GLMInheritableFeatures =
745 !listconcat(SLMInheritableFeatures, GLMAdditionalFeatures);
746 list<SubtargetFeature> GLMFeatures =
747 !listconcat(GLMInheritableFeatures, GLMSpecificFeatures);
750 list<SubtargetFeature> GLPAdditionalFeatures = [FeaturePTWRITE,
753 list<SubtargetFeature> GLPSpecificFeatures = [ProcIntelGLP];
754 list<SubtargetFeature> GLPInheritableFeatures =
755 !listconcat(GLMInheritableFeatures, GLPAdditionalFeatures);
756 list<SubtargetFeature> GLPFeatures =
757 !listconcat(GLPInheritableFeatures, GLPSpecificFeatures);
760 list<SubtargetFeature> TRMAdditionalFeatures = [FeatureCLDEMOTE,
765 list<SubtargetFeature> TRMSpecificFeatures = [ProcIntelTRM];
766 list<SubtargetFeature> TRMFeatures =
767 !listconcat(GLPInheritableFeatures, TRMAdditionalFeatures,
768 TRMSpecificFeatures);
771 list<SubtargetFeature> KNLFeatures = [FeatureX87,
804 FeatureSlowTwoMemOps,
805 FeatureFastPartialYMMorZMMWrite,
806 FeatureHasFastGather,
808 // TODO Add AVX5124FMAPS/AVX5124VNNIW features
809 list<SubtargetFeature> KNMFeatures =
810 !listconcat(KNLFeatures, [FeatureVPOPCNTDQ]);
813 list<SubtargetFeature> BarcelonaInheritableFeatures = [FeatureX87,
826 FeatureFastScalarShiftMasks];
827 list<SubtargetFeature> BarcelonaFeatures = BarcelonaInheritableFeatures;
830 list<SubtargetFeature> BtVer1InheritableFeatures = [FeatureX87,
845 FeatureFast15ByteNOP,
846 FeatureFastScalarShiftMasks,
847 FeatureFastVectorShiftMasks];
848 list<SubtargetFeature> BtVer1Features = BtVer1InheritableFeatures;
851 list<SubtargetFeature> BtVer2AdditionalFeatures = [FeatureAVX,
859 list<SubtargetFeature> BtVer2SpecificFeatures = [FeatureFastLZCNT,
861 FeatureFastPartialYMMorZMMWrite,
862 FeatureFastHorizontalOps];
863 list<SubtargetFeature> BtVer2InheritableFeatures =
864 !listconcat(BtVer1InheritableFeatures, BtVer2AdditionalFeatures);
865 list<SubtargetFeature> BtVer2Features =
866 !listconcat(BtVer2InheritableFeatures, BtVer2SpecificFeatures);
869 list<SubtargetFeature> BdVer1InheritableFeatures = [FeatureX87,
887 FeatureFast11ByteNOP,
888 FeatureFastScalarShiftMasks,
889 FeatureBranchFusion];
890 list<SubtargetFeature> BdVer1Features = BdVer1InheritableFeatures;
893 list<SubtargetFeature> BdVer2AdditionalFeatures = [FeatureF16C,
898 list<SubtargetFeature> BdVer2InheritableFeatures =
899 !listconcat(BdVer1InheritableFeatures, BdVer2AdditionalFeatures);
900 list<SubtargetFeature> BdVer2Features = BdVer2InheritableFeatures;
903 list<SubtargetFeature> BdVer3AdditionalFeatures = [FeatureXSAVEOPT,
905 list<SubtargetFeature> BdVer3InheritableFeatures =
906 !listconcat(BdVer2InheritableFeatures, BdVer3AdditionalFeatures);
907 list<SubtargetFeature> BdVer3Features = BdVer3InheritableFeatures;
910 list<SubtargetFeature> BdVer4AdditionalFeatures = [FeatureAVX2,
913 list<SubtargetFeature> BdVer4InheritableFeatures =
914 !listconcat(BdVer3InheritableFeatures, BdVer4AdditionalFeatures);
915 list<SubtargetFeature> BdVer4Features = BdVer4InheritableFeatures;
918 // AMD Zen Processors common ISAs
919 list<SubtargetFeature> ZNFeatures = [FeatureADX,
938 FeatureFast15ByteNOP,
940 FeatureFastScalarShiftMasks,
957 list<SubtargetFeature> ZN2AdditionalFeatures = [FeatureCLWB,
960 list<SubtargetFeature> ZN2Features =
961 !listconcat(ZNFeatures, ZN2AdditionalFeatures);
964 //===----------------------------------------------------------------------===//
965 // X86 processors supported.
966 //===----------------------------------------------------------------------===//
968 class Proc<string Name, list<SubtargetFeature> Features>
969 : ProcessorModel<Name, GenericModel, Features>;
971 // NOTE: CMPXCHG8B is here for legacy compatbility so that it is only disabled
972 // if i386/i486 is specifically requested.
973 def : Proc<"generic", [FeatureX87, FeatureSlowUAMem16,
975 def : Proc<"i386", [FeatureX87, FeatureSlowUAMem16]>;
976 def : Proc<"i486", [FeatureX87, FeatureSlowUAMem16]>;
977 def : Proc<"i586", [FeatureX87, FeatureSlowUAMem16,
979 def : Proc<"pentium", [FeatureX87, FeatureSlowUAMem16,
981 def : Proc<"pentium-mmx", [FeatureX87, FeatureSlowUAMem16,
982 FeatureCMPXCHG8B, FeatureMMX]>;
984 def : Proc<"i686", [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
986 def : Proc<"pentiumpro", [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
987 FeatureCMOV, FeatureNOPL]>;
989 def : Proc<"pentium2", [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
990 FeatureMMX, FeatureCMOV, FeatureFXSR,
993 foreach P = ["pentium3", "pentium3m"] in {
994 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,FeatureMMX,
995 FeatureSSE1, FeatureFXSR, FeatureNOPL, FeatureCMOV]>;
998 // Enable the PostRAScheduler for SSE2 and SSE3 class cpus.
999 // The intent is to enable it for pentium4 which is the current default
1000 // processor in a vanilla 32-bit clang compilation when no specific
1001 // architecture is specified. This generally gives a nice performance
1002 // increase on silvermont, with largely neutral behavior on other
1003 // contemporary large core processors.
1004 // pentium-m, pentium4m, prescott and nocona are included as a preventative
1005 // measure to avoid performance surprises, in case clang's default cpu
1006 // changes slightly.
1008 def : ProcessorModel<"pentium-m", GenericPostRAModel,
1009 [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1010 FeatureMMX, FeatureSSE2, FeatureFXSR, FeatureNOPL,
1013 foreach P = ["pentium4", "pentium4m"] in {
1014 def : ProcessorModel<P, GenericPostRAModel,
1015 [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1016 FeatureMMX, FeatureSSE2, FeatureFXSR, FeatureNOPL,
1021 def : Proc<"lakemont", []>;
1024 def : ProcessorModel<"yonah", SandyBridgeModel,
1025 [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1026 FeatureMMX, FeatureSSE3, FeatureFXSR, FeatureNOPL,
1030 def : ProcessorModel<"prescott", GenericPostRAModel,
1031 [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1032 FeatureMMX, FeatureSSE3, FeatureFXSR, FeatureNOPL,
1034 def : ProcessorModel<"nocona", GenericPostRAModel, [
1047 // Intel Core 2 Solo/Duo.
1048 def : ProcessorModel<"core2", SandyBridgeModel, [
1062 def : ProcessorModel<"penryn", SandyBridgeModel, [
1078 foreach P = ["bonnell", "atom"] in {
1079 def : ProcessorModel<P, AtomModel, ProcessorFeatures.AtomFeatures>;
1082 foreach P = ["silvermont", "slm"] in {
1083 def : ProcessorModel<P, SLMModel, ProcessorFeatures.SLMFeatures>;
1086 def : ProcessorModel<"goldmont", SLMModel, ProcessorFeatures.GLMFeatures>;
1087 def : ProcessorModel<"goldmont-plus", SLMModel, ProcessorFeatures.GLPFeatures>;
1088 def : ProcessorModel<"tremont", SLMModel, ProcessorFeatures.TRMFeatures>;
1090 // "Arrandale" along with corei3 and corei5
1091 foreach P = ["nehalem", "corei7"] in {
1092 def : ProcessorModel<P, SandyBridgeModel, ProcessorFeatures.NHMFeatures>;
1095 // Westmere is the corei3/i5/i7 path from nehalem to sandybridge
1096 def : ProcessorModel<"westmere", SandyBridgeModel,
1097 ProcessorFeatures.WSMFeatures>;
1099 foreach P = ["sandybridge", "corei7-avx"] in {
1100 def : ProcessorModel<P, SandyBridgeModel, ProcessorFeatures.SNBFeatures>;
1103 foreach P = ["ivybridge", "core-avx-i"] in {
1104 def : ProcessorModel<P, SandyBridgeModel, ProcessorFeatures.IVBFeatures>;
1107 foreach P = ["haswell", "core-avx2"] in {
1108 def : ProcessorModel<P, HaswellModel, ProcessorFeatures.HSWFeatures>;
1111 def : ProcessorModel<"broadwell", BroadwellModel,
1112 ProcessorFeatures.BDWFeatures>;
1114 def : ProcessorModel<"skylake", SkylakeClientModel,
1115 ProcessorFeatures.SKLFeatures>;
1117 // FIXME: define KNL scheduler model
1118 def : ProcessorModel<"knl", HaswellModel, ProcessorFeatures.KNLFeatures>;
1119 def : ProcessorModel<"knm", HaswellModel, ProcessorFeatures.KNMFeatures>;
1121 foreach P = ["skylake-avx512", "skx"] in {
1122 def : ProcessorModel<P, SkylakeServerModel, ProcessorFeatures.SKXFeatures>;
1125 def : ProcessorModel<"cascadelake", SkylakeServerModel,
1126 ProcessorFeatures.CLXFeatures>;
1127 def : ProcessorModel<"cooperlake", SkylakeServerModel,
1128 ProcessorFeatures.CPXFeatures>;
1129 def : ProcessorModel<"cannonlake", SkylakeServerModel,
1130 ProcessorFeatures.CNLFeatures>;
1131 def : ProcessorModel<"icelake-client", SkylakeServerModel,
1132 ProcessorFeatures.ICLFeatures>;
1133 def : ProcessorModel<"icelake-server", SkylakeServerModel,
1134 ProcessorFeatures.ICXFeatures>;
1135 def : ProcessorModel<"tigerlake", SkylakeServerModel,
1136 ProcessorFeatures.TGLFeatures>;
1140 def : Proc<"k6", [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1142 def : Proc<"k6-2", [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1144 def : Proc<"k6-3", [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1147 foreach P = ["athlon", "athlon-tbird"] in {
1148 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B, FeatureCMOV,
1149 Feature3DNowA, FeatureNOPL, FeatureSlowSHLD]>;
1152 foreach P = ["athlon-4", "athlon-xp", "athlon-mp"] in {
1153 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B, FeatureCMOV,
1154 FeatureSSE1, Feature3DNowA, FeatureFXSR, FeatureNOPL,
1158 foreach P = ["k8", "opteron", "athlon64", "athlon-fx"] in {
1159 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1160 FeatureSSE2, Feature3DNowA, FeatureFXSR, FeatureNOPL,
1161 Feature64Bit, FeatureSlowSHLD, FeatureCMOV,
1162 FeatureFastScalarShiftMasks]>;
1165 foreach P = ["k8-sse3", "opteron-sse3", "athlon64-sse3"] in {
1166 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B, FeatureSSE3,
1167 Feature3DNowA, FeatureFXSR, FeatureNOPL, FeatureCMPXCHG16B,
1168 FeatureSlowSHLD, FeatureCMOV, Feature64Bit,
1169 FeatureFastScalarShiftMasks]>;
1172 foreach P = ["amdfam10", "barcelona"] in {
1173 def : Proc<P, ProcessorFeatures.BarcelonaFeatures>;
1177 def : Proc<"btver1", ProcessorFeatures.BtVer1Features>;
1179 def : ProcessorModel<"btver2", BtVer2Model, ProcessorFeatures.BtVer2Features>;
1182 def : ProcessorModel<"bdver1", BdVer2Model, ProcessorFeatures.BdVer1Features>;
1184 def : ProcessorModel<"bdver2", BdVer2Model, ProcessorFeatures.BdVer2Features>;
1186 def : Proc<"bdver3", ProcessorFeatures.BdVer3Features>;
1188 def : Proc<"bdver4", ProcessorFeatures.BdVer4Features>;
1190 def : ProcessorModel<"znver1", Znver1Model, ProcessorFeatures.ZNFeatures>;
1191 def : ProcessorModel<"znver2", Znver1Model, ProcessorFeatures.ZN2Features>;
1193 def : Proc<"geode", [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1196 def : Proc<"winchip-c6", [FeatureX87, FeatureSlowUAMem16, FeatureMMX]>;
1197 def : Proc<"winchip2", [FeatureX87, FeatureSlowUAMem16, Feature3DNow]>;
1198 def : Proc<"c3", [FeatureX87, FeatureSlowUAMem16, Feature3DNow]>;
1199 def : Proc<"c3-2", [FeatureX87, FeatureSlowUAMem16, FeatureCMPXCHG8B,
1200 FeatureMMX, FeatureSSE1, FeatureFXSR,
1203 // We also provide a generic 64-bit specific x86 processor model which tries to
1204 // be good for modern chips without enabling instruction set encodings past the
1205 // basic SSE2 and 64-bit ones. It disables slow things from any mainstream and
1206 // modern 64-bit x86 chip, and enables features that are generally beneficial.
1208 // We currently use the Sandy Bridge model as the default scheduling model as
1209 // we use it across Nehalem, Westmere, Sandy Bridge, and Ivy Bridge which
1210 // covers a huge swath of x86 processors. If there are specific scheduling
1211 // knobs which need to be tuned differently for AMD chips, we might consider
1212 // forming a common base for them.
1213 def : ProcessorModel<"x86-64", SandyBridgeModel, [
1227 //===----------------------------------------------------------------------===//
1228 // Calling Conventions
1229 //===----------------------------------------------------------------------===//
1231 include "X86CallingConv.td"
1234 //===----------------------------------------------------------------------===//
1236 //===----------------------------------------------------------------------===//
1238 def ATTAsmParserVariant : AsmParserVariant {
1242 string Name = "att";
1244 // Discard comments in assembly strings.
1245 string CommentDelimiter = "#";
1247 // Recognize hard coded registers.
1248 string RegisterPrefix = "%";
1251 def IntelAsmParserVariant : AsmParserVariant {
1255 string Name = "intel";
1257 // Discard comments in assembly strings.
1258 string CommentDelimiter = ";";
1260 // Recognize hard coded registers.
1261 string RegisterPrefix = "";
1264 //===----------------------------------------------------------------------===//
1265 // Assembly Printers
1266 //===----------------------------------------------------------------------===//
1268 // The X86 target supports two different syntaxes for emitting machine code.
1269 // This is controlled by the -x86-asm-syntax={att|intel}
1270 def ATTAsmWriter : AsmWriter {
1271 string AsmWriterClassName = "ATTInstPrinter";
1274 def IntelAsmWriter : AsmWriter {
1275 string AsmWriterClassName = "IntelInstPrinter";
1280 // Information about the instructions...
1281 let InstructionSet = X86InstrInfo;
1282 let AssemblyParserVariants = [ATTAsmParserVariant, IntelAsmParserVariant];
1283 let AssemblyWriters = [ATTAsmWriter, IntelAsmWriter];
1284 let AllowRegisterRenaming = 1;
1287 //===----------------------------------------------------------------------===//
1289 //===----------------------------------------------------------------------===//
1291 include "X86PfmCounters.td"