1 //===-- HexagonTargetMachine.cpp - Define TargetMachine for Hexagon -------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // Implements the info about Hexagon target spec.
11 //===----------------------------------------------------------------------===//
13 #include "HexagonTargetMachine.h"
15 #include "HexagonISelLowering.h"
16 #include "HexagonMachineScheduler.h"
17 #include "HexagonTargetObjectFile.h"
18 #include "HexagonTargetTransformInfo.h"
19 #include "llvm/CodeGen/Passes.h"
20 #include "llvm/CodeGen/TargetPassConfig.h"
21 #include "llvm/IR/LegacyPassManager.h"
22 #include "llvm/IR/Module.h"
23 #include "llvm/Support/CommandLine.h"
24 #include "llvm/Support/TargetRegistry.h"
25 #include "llvm/Transforms/IPO/PassManagerBuilder.h"
26 #include "llvm/Transforms/Scalar.h"
30 static cl::opt
<bool> EnableCExtOpt("hexagon-cext", cl::Hidden
, cl::ZeroOrMore
,
31 cl::init(true), cl::desc("Enable Hexagon constant-extender optimization"));
33 static cl::opt
<bool> EnableRDFOpt("rdf-opt", cl::Hidden
, cl::ZeroOrMore
,
34 cl::init(true), cl::desc("Enable RDF-based optimizations"));
36 static cl::opt
<bool> DisableHardwareLoops("disable-hexagon-hwloops",
37 cl::Hidden
, cl::desc("Disable Hardware Loops for Hexagon target"));
39 static cl::opt
<bool> DisableAModeOpt("disable-hexagon-amodeopt",
40 cl::Hidden
, cl::ZeroOrMore
, cl::init(false),
41 cl::desc("Disable Hexagon Addressing Mode Optimization"));
43 static cl::opt
<bool> DisableHexagonCFGOpt("disable-hexagon-cfgopt",
44 cl::Hidden
, cl::ZeroOrMore
, cl::init(false),
45 cl::desc("Disable Hexagon CFG Optimization"));
47 static cl::opt
<bool> DisableHCP("disable-hcp", cl::init(false), cl::Hidden
,
48 cl::ZeroOrMore
, cl::desc("Disable Hexagon constant propagation"));
50 static cl::opt
<bool> DisableStoreWidening("disable-store-widen",
51 cl::Hidden
, cl::init(false), cl::desc("Disable store widening"));
53 static cl::opt
<bool> EnableExpandCondsets("hexagon-expand-condsets",
54 cl::init(true), cl::Hidden
, cl::ZeroOrMore
,
55 cl::desc("Early expansion of MUX"));
57 static cl::opt
<bool> EnableEarlyIf("hexagon-eif", cl::init(true), cl::Hidden
,
58 cl::ZeroOrMore
, cl::desc("Enable early if-conversion"));
60 static cl::opt
<bool> EnableGenInsert("hexagon-insert", cl::init(true),
61 cl::Hidden
, cl::desc("Generate \"insert\" instructions"));
63 static cl::opt
<bool> EnableCommGEP("hexagon-commgep", cl::init(true),
64 cl::Hidden
, cl::ZeroOrMore
, cl::desc("Enable commoning of GEP instructions"));
66 static cl::opt
<bool> EnableGenExtract("hexagon-extract", cl::init(true),
67 cl::Hidden
, cl::desc("Generate \"extract\" instructions"));
69 static cl::opt
<bool> EnableGenMux("hexagon-mux", cl::init(true), cl::Hidden
,
70 cl::desc("Enable converting conditional transfers into MUX instructions"));
72 static cl::opt
<bool> EnableGenPred("hexagon-gen-pred", cl::init(true),
73 cl::Hidden
, cl::desc("Enable conversion of arithmetic operations to "
74 "predicate instructions"));
76 static cl::opt
<bool> EnableLoopPrefetch("hexagon-loop-prefetch",
77 cl::init(false), cl::Hidden
, cl::ZeroOrMore
,
78 cl::desc("Enable loop data prefetch on Hexagon"));
80 static cl::opt
<bool> DisableHSDR("disable-hsdr", cl::init(false), cl::Hidden
,
81 cl::desc("Disable splitting double registers"));
83 static cl::opt
<bool> EnableBitSimplify("hexagon-bit", cl::init(true),
84 cl::Hidden
, cl::desc("Bit simplification"));
86 static cl::opt
<bool> EnableLoopResched("hexagon-loop-resched", cl::init(true),
87 cl::Hidden
, cl::desc("Loop rescheduling"));
89 static cl::opt
<bool> HexagonNoOpt("hexagon-noopt", cl::init(false),
90 cl::Hidden
, cl::desc("Disable backend optimizations"));
92 static cl::opt
<bool> EnableVectorPrint("enable-hexagon-vector-print",
93 cl::Hidden
, cl::ZeroOrMore
, cl::init(false),
94 cl::desc("Enable Hexagon Vector print instr pass"));
96 static cl::opt
<bool> EnableVExtractOpt("hexagon-opt-vextract", cl::Hidden
,
97 cl::ZeroOrMore
, cl::init(true), cl::desc("Enable vextract optimization"));
99 static cl::opt
<bool> EnableInitialCFGCleanup("hexagon-initial-cfg-cleanup",
100 cl::Hidden
, cl::ZeroOrMore
, cl::init(true),
101 cl::desc("Simplify the CFG after atomic expansion pass"));
103 /// HexagonTargetMachineModule - Note that this is used on hosts that
104 /// cannot link in a library unless there are references into the
105 /// library. In particular, it seems that it is not possible to get
106 /// things to work on Win32 without this. Though it is unused, do not
108 extern "C" int HexagonTargetMachineModule
;
109 int HexagonTargetMachineModule
= 0;
111 static ScheduleDAGInstrs
*createVLIWMachineSched(MachineSchedContext
*C
) {
112 ScheduleDAGMILive
*DAG
=
113 new VLIWMachineScheduler(C
, make_unique
<ConvergingVLIWScheduler
>());
114 DAG
->addMutation(make_unique
<HexagonSubtarget::UsrOverflowMutation
>());
115 DAG
->addMutation(make_unique
<HexagonSubtarget::HVXMemLatencyMutation
>());
116 DAG
->addMutation(make_unique
<HexagonSubtarget::CallMutation
>());
117 DAG
->addMutation(createCopyConstrainDAGMutation(DAG
->TII
, DAG
->TRI
));
121 static MachineSchedRegistry
122 SchedCustomRegistry("hexagon", "Run Hexagon's custom scheduler",
123 createVLIWMachineSched
);
126 extern char &HexagonExpandCondsetsID
;
127 void initializeHexagonBitSimplifyPass(PassRegistry
&);
128 void initializeHexagonConstExtendersPass(PassRegistry
&);
129 void initializeHexagonConstPropagationPass(PassRegistry
&);
130 void initializeHexagonEarlyIfConversionPass(PassRegistry
&);
131 void initializeHexagonExpandCondsetsPass(PassRegistry
&);
132 void initializeHexagonGenMuxPass(PassRegistry
&);
133 void initializeHexagonHardwareLoopsPass(PassRegistry
&);
134 void initializeHexagonLoopIdiomRecognizePass(PassRegistry
&);
135 void initializeHexagonVectorLoopCarriedReusePass(PassRegistry
&);
136 void initializeHexagonNewValueJumpPass(PassRegistry
&);
137 void initializeHexagonOptAddrModePass(PassRegistry
&);
138 void initializeHexagonPacketizerPass(PassRegistry
&);
139 void initializeHexagonRDFOptPass(PassRegistry
&);
140 void initializeHexagonSplitDoubleRegsPass(PassRegistry
&);
141 void initializeHexagonVExtractPass(PassRegistry
&);
142 Pass
*createHexagonLoopIdiomPass();
143 Pass
*createHexagonVectorLoopCarriedReusePass();
145 FunctionPass
*createHexagonBitSimplify();
146 FunctionPass
*createHexagonBranchRelaxation();
147 FunctionPass
*createHexagonCallFrameInformation();
148 FunctionPass
*createHexagonCFGOptimizer();
149 FunctionPass
*createHexagonCommonGEP();
150 FunctionPass
*createHexagonConstExtenders();
151 FunctionPass
*createHexagonConstPropagationPass();
152 FunctionPass
*createHexagonCopyToCombine();
153 FunctionPass
*createHexagonEarlyIfConversion();
154 FunctionPass
*createHexagonFixupHwLoops();
155 FunctionPass
*createHexagonGenExtract();
156 FunctionPass
*createHexagonGenInsert();
157 FunctionPass
*createHexagonGenMux();
158 FunctionPass
*createHexagonGenPredicate();
159 FunctionPass
*createHexagonHardwareLoops();
160 FunctionPass
*createHexagonISelDag(HexagonTargetMachine
&TM
,
161 CodeGenOpt::Level OptLevel
);
162 FunctionPass
*createHexagonLoopRescheduling();
163 FunctionPass
*createHexagonNewValueJump();
164 FunctionPass
*createHexagonOptimizeSZextends();
165 FunctionPass
*createHexagonOptAddrMode();
166 FunctionPass
*createHexagonPacketizer(bool Minimal
);
167 FunctionPass
*createHexagonPeephole();
168 FunctionPass
*createHexagonRDFOpt();
169 FunctionPass
*createHexagonSplitConst32AndConst64();
170 FunctionPass
*createHexagonSplitDoubleRegs();
171 FunctionPass
*createHexagonStoreWidening();
172 FunctionPass
*createHexagonVectorPrint();
173 FunctionPass
*createHexagonVExtract();
174 } // end namespace llvm;
176 static Reloc::Model
getEffectiveRelocModel(Optional
<Reloc::Model
> RM
) {
178 return Reloc::Static
;
182 extern "C" void LLVMInitializeHexagonTarget() {
183 // Register the target.
184 RegisterTargetMachine
<HexagonTargetMachine
> X(getTheHexagonTarget());
186 PassRegistry
&PR
= *PassRegistry::getPassRegistry();
187 initializeHexagonBitSimplifyPass(PR
);
188 initializeHexagonConstExtendersPass(PR
);
189 initializeHexagonConstPropagationPass(PR
);
190 initializeHexagonEarlyIfConversionPass(PR
);
191 initializeHexagonGenMuxPass(PR
);
192 initializeHexagonHardwareLoopsPass(PR
);
193 initializeHexagonLoopIdiomRecognizePass(PR
);
194 initializeHexagonVectorLoopCarriedReusePass(PR
);
195 initializeHexagonNewValueJumpPass(PR
);
196 initializeHexagonOptAddrModePass(PR
);
197 initializeHexagonPacketizerPass(PR
);
198 initializeHexagonRDFOptPass(PR
);
199 initializeHexagonSplitDoubleRegsPass(PR
);
200 initializeHexagonVExtractPass(PR
);
203 HexagonTargetMachine::HexagonTargetMachine(const Target
&T
, const Triple
&TT
,
204 StringRef CPU
, StringRef FS
,
205 const TargetOptions
&Options
,
206 Optional
<Reloc::Model
> RM
,
207 Optional
<CodeModel::Model
> CM
,
208 CodeGenOpt::Level OL
, bool JIT
)
209 // Specify the vector alignment explicitly. For v512x1, the calculated
210 // alignment would be 512*alignment(i1), which is 512 bytes, instead of
211 // the required minimum of 64 bytes.
214 "e-m:e-p:32:32:32-a:0-n16:32-"
215 "i64:64:64-i32:32:32-i16:16:16-i1:8:8-f32:32:32-f64:64:64-"
216 "v32:32:32-v64:64:64-v512:512:512-v1024:1024:1024-v2048:2048:2048",
217 TT
, CPU
, FS
, Options
, getEffectiveRelocModel(RM
),
218 getEffectiveCodeModel(CM
, CodeModel::Small
),
219 (HexagonNoOpt
? CodeGenOpt::None
: OL
)),
220 TLOF(make_unique
<HexagonTargetObjectFile
>()) {
221 initializeHexagonExpandCondsetsPass(*PassRegistry::getPassRegistry());
225 const HexagonSubtarget
*
226 HexagonTargetMachine::getSubtargetImpl(const Function
&F
) const {
227 AttributeList FnAttrs
= F
.getAttributes();
229 FnAttrs
.getAttribute(AttributeList::FunctionIndex
, "target-cpu");
231 FnAttrs
.getAttribute(AttributeList::FunctionIndex
, "target-features");
233 std::string CPU
= !CPUAttr
.hasAttribute(Attribute::None
)
234 ? CPUAttr
.getValueAsString().str()
236 std::string FS
= !FSAttr
.hasAttribute(Attribute::None
)
237 ? FSAttr
.getValueAsString().str()
240 auto &I
= SubtargetMap
[CPU
+ FS
];
242 // This needs to be done before we create a new subtarget since any
243 // creation will depend on the TM and the code generation flags on the
244 // function that reside in TargetOptions.
245 resetTargetOptions(F
);
246 I
= llvm::make_unique
<HexagonSubtarget
>(TargetTriple
, CPU
, FS
, *this);
251 void HexagonTargetMachine::adjustPassManager(PassManagerBuilder
&PMB
) {
253 PassManagerBuilder::EP_LateLoopOptimizations
,
254 [&](const PassManagerBuilder
&, legacy::PassManagerBase
&PM
) {
255 PM
.add(createHexagonLoopIdiomPass());
258 PassManagerBuilder::EP_LoopOptimizerEnd
,
259 [&](const PassManagerBuilder
&, legacy::PassManagerBase
&PM
) {
260 PM
.add(createHexagonVectorLoopCarriedReusePass());
265 HexagonTargetMachine::getTargetTransformInfo(const Function
&F
) {
266 return TargetTransformInfo(HexagonTTIImpl(this, F
));
270 HexagonTargetMachine::~HexagonTargetMachine() {}
273 /// Hexagon Code Generator Pass Configuration Options.
274 class HexagonPassConfig
: public TargetPassConfig
{
276 HexagonPassConfig(HexagonTargetMachine
&TM
, PassManagerBase
&PM
)
277 : TargetPassConfig(TM
, PM
) {}
279 HexagonTargetMachine
&getHexagonTargetMachine() const {
280 return getTM
<HexagonTargetMachine
>();
284 createMachineScheduler(MachineSchedContext
*C
) const override
{
285 return createVLIWMachineSched(C
);
288 void addIRPasses() override
;
289 bool addInstSelector() override
;
290 void addPreRegAlloc() override
;
291 void addPostRegAlloc() override
;
292 void addPreSched2() override
;
293 void addPreEmitPass() override
;
297 TargetPassConfig
*HexagonTargetMachine::createPassConfig(PassManagerBase
&PM
) {
298 return new HexagonPassConfig(*this, PM
);
301 void HexagonPassConfig::addIRPasses() {
302 TargetPassConfig::addIRPasses();
303 bool NoOpt
= (getOptLevel() == CodeGenOpt::None
);
306 addPass(createConstantPropagationPass());
307 addPass(createDeadCodeEliminationPass());
310 addPass(createAtomicExpandPass());
313 if (EnableInitialCFGCleanup
)
314 addPass(createCFGSimplificationPass(1, true, true, false, true));
315 if (EnableLoopPrefetch
)
316 addPass(createLoopDataPrefetchPass());
318 addPass(createHexagonCommonGEP());
319 // Replace certain combinations of shifts and ands with extracts.
320 if (EnableGenExtract
)
321 addPass(createHexagonGenExtract());
325 bool HexagonPassConfig::addInstSelector() {
326 HexagonTargetMachine
&TM
= getHexagonTargetMachine();
327 bool NoOpt
= (getOptLevel() == CodeGenOpt::None
);
330 addPass(createHexagonOptimizeSZextends());
332 addPass(createHexagonISelDag(TM
, getOptLevel()));
335 if (EnableVExtractOpt
)
336 addPass(createHexagonVExtract());
337 // Create logical operations on predicate registers.
339 addPass(createHexagonGenPredicate());
340 // Rotate loops to expose bit-simplification opportunities.
341 if (EnableLoopResched
)
342 addPass(createHexagonLoopRescheduling());
343 // Split double registers.
345 addPass(createHexagonSplitDoubleRegs());
346 // Bit simplification.
347 if (EnableBitSimplify
)
348 addPass(createHexagonBitSimplify());
349 addPass(createHexagonPeephole());
350 // Constant propagation.
352 addPass(createHexagonConstPropagationPass());
353 addPass(&UnreachableMachineBlockElimID
);
356 addPass(createHexagonGenInsert());
358 addPass(createHexagonEarlyIfConversion());
364 void HexagonPassConfig::addPreRegAlloc() {
365 if (getOptLevel() != CodeGenOpt::None
) {
367 addPass(createHexagonConstExtenders());
368 if (EnableExpandCondsets
)
369 insertPass(&RegisterCoalescerID
, &HexagonExpandCondsetsID
);
370 if (!DisableStoreWidening
)
371 addPass(createHexagonStoreWidening());
372 if (!DisableHardwareLoops
)
373 addPass(createHexagonHardwareLoops());
375 if (TM
->getOptLevel() >= CodeGenOpt::Default
)
376 addPass(&MachinePipelinerID
);
379 void HexagonPassConfig::addPostRegAlloc() {
380 if (getOptLevel() != CodeGenOpt::None
) {
382 addPass(createHexagonRDFOpt());
383 if (!DisableHexagonCFGOpt
)
384 addPass(createHexagonCFGOptimizer());
385 if (!DisableAModeOpt
)
386 addPass(createHexagonOptAddrMode());
390 void HexagonPassConfig::addPreSched2() {
391 addPass(createHexagonCopyToCombine());
392 if (getOptLevel() != CodeGenOpt::None
)
393 addPass(&IfConverterID
);
394 addPass(createHexagonSplitConst32AndConst64());
397 void HexagonPassConfig::addPreEmitPass() {
398 bool NoOpt
= (getOptLevel() == CodeGenOpt::None
);
401 addPass(createHexagonNewValueJump());
403 addPass(createHexagonBranchRelaxation());
406 if (!DisableHardwareLoops
)
407 addPass(createHexagonFixupHwLoops());
408 // Generate MUX from pairs of conditional transfers.
410 addPass(createHexagonGenMux());
413 // Packetization is mandatory: it handles gather/scatter at all opt levels.
414 addPass(createHexagonPacketizer(NoOpt
), false);
416 if (EnableVectorPrint
)
417 addPass(createHexagonVectorPrint(), false);
419 // Add CFI instructions if necessary.
420 addPass(createHexagonCallFrameInformation(), false);