1 //===--------------------- Scheduler.h ------------------------*- C++ -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
10 /// A scheduler for Processor Resource Units and Processor Resource Groups.
12 //===----------------------------------------------------------------------===//
14 #ifndef LLVM_MCA_SCHEDULER_H
15 #define LLVM_MCA_SCHEDULER_H
17 #include "llvm/ADT/SmallVector.h"
18 #include "llvm/MC/MCSchedule.h"
19 #include "llvm/MCA/HardwareUnits/HardwareUnit.h"
20 #include "llvm/MCA/HardwareUnits/LSUnit.h"
21 #include "llvm/MCA/HardwareUnits/ResourceManager.h"
22 #include "llvm/MCA/Support.h"
27 class SchedulerStrategy
{
29 SchedulerStrategy() = default;
30 virtual ~SchedulerStrategy();
32 /// Returns true if Lhs should take priority over Rhs.
34 /// This method is used by class Scheduler to select the "best" ready
35 /// instruction to issue to the underlying pipelines.
36 virtual bool compare(const InstRef
&Lhs
, const InstRef
&Rhs
) const = 0;
39 /// Default instruction selection strategy used by class Scheduler.
40 class DefaultSchedulerStrategy
: public SchedulerStrategy
{
41 /// This method ranks instructions based on their age, and the number of known
42 /// users. The lower the rank value, the better.
43 int computeRank(const InstRef
&Lhs
) const {
44 return Lhs
.getSourceIndex() - Lhs
.getInstruction()->getNumUsers();
48 DefaultSchedulerStrategy() = default;
49 virtual ~DefaultSchedulerStrategy();
51 bool compare(const InstRef
&Lhs
, const InstRef
&Rhs
) const override
{
52 int LhsRank
= computeRank(Lhs
);
53 int RhsRank
= computeRank(Rhs
);
55 /// Prioritize older instructions over younger instructions to minimize the
56 /// pressure on the reorder buffer.
57 if (LhsRank
== RhsRank
)
58 return Lhs
.getSourceIndex() < Rhs
.getSourceIndex();
59 return LhsRank
< RhsRank
;
63 /// Class Scheduler is responsible for issuing instructions to pipeline
66 /// Internally, it delegates to a ResourceManager the management of processor
67 /// resources. This class is also responsible for tracking the progress of
68 /// instructions from the dispatch stage, until the write-back stage.
70 class Scheduler
: public HardwareUnit
{
73 // Instruction selection strategy for this Scheduler.
74 std::unique_ptr
<SchedulerStrategy
> Strategy
;
76 // Hardware resources that are managed by this scheduler.
77 std::unique_ptr
<ResourceManager
> Resources
;
79 // Instructions dispatched to the Scheduler are internally classified based on
80 // the instruction stage (see Instruction::InstrStage).
82 // An Instruction dispatched to the Scheduler is added to the WaitSet if not
83 // all its register operands are available, and at least one latency is
84 // unknown. By construction, the WaitSet only contains instructions that are
85 // in the IS_DISPATCHED stage.
87 // An Instruction transitions from the WaitSet to the PendingSet if the
88 // instruction is not ready yet, but the latency of every register read is
89 // known. Instructions in the PendingSet can only be in the IS_PENDING or
90 // IS_READY stage. Only IS_READY instructions that are waiting on memory
91 // dependencies can be added to the PendingSet.
93 // Instructions in the PendingSet are immediately dominated only by
94 // instructions that have already been issued to the underlying pipelines. In
95 // the presence of bottlenecks caused by data dependencies, the PendingSet can
96 // be inspected to identify problematic data dependencies between
99 // An instruction is moved to the ReadySet when all register operands become
100 // available, and all memory dependencies are met. Instructions that are
101 // moved from the PendingSet to the ReadySet must transition to the 'IS_READY'
104 // On every cycle, the Scheduler checks if it can promote instructions from the
105 // PendingSet to the ReadySet.
107 // An Instruction is moved from the ReadySet to the `IssuedSet` when it starts
108 // exection. This event also causes an instruction state transition (i.e. from
109 // state IS_READY, to state IS_EXECUTING). An Instruction leaves the IssuedSet
110 // only when it reaches the write-back stage.
111 std::vector
<InstRef
> WaitSet
;
112 std::vector
<InstRef
> PendingSet
;
113 std::vector
<InstRef
> ReadySet
;
114 std::vector
<InstRef
> IssuedSet
;
116 // A mask of busy resource units. It defaults to the empty set (i.e. a zero
117 // mask), and it is cleared at the beginning of every cycle.
118 // It is updated every time the scheduler fails to issue an instruction from
119 // the ready set due to unavailable pipeline resources.
120 // Each bit of the mask represents an unavailable resource.
121 uint64_t BusyResourceUnits
;
123 // Counts the number of instructions in the pending set that were dispatched
124 // during this cycle.
125 unsigned NumDispatchedToThePendingSet
;
127 // True if the previous pipeline Stage was unable to dispatch a full group of
128 // opcodes because scheduler buffers (or LS queues) were unavailable.
131 /// Verify the given selection strategy and set the Strategy member
132 /// accordingly. If no strategy is provided, the DefaultSchedulerStrategy is
134 void initializeStrategy(std::unique_ptr
<SchedulerStrategy
> S
);
136 /// Issue an instruction without updating the ready queue.
137 void issueInstructionImpl(
139 SmallVectorImpl
<std::pair
<ResourceRef
, ResourceCycles
>> &Pipes
);
141 // Identify instructions that have finished executing, and remove them from
142 // the IssuedSet. References to executed instructions are added to input
143 // vector 'Executed'.
144 void updateIssuedSet(SmallVectorImpl
<InstRef
> &Executed
);
146 // Try to promote instructions from the PendingSet to the ReadySet.
147 // Add promoted instructions to the 'Ready' vector in input.
148 // Returns true if at least one instruction was promoted.
149 bool promoteToReadySet(SmallVectorImpl
<InstRef
> &Ready
);
151 // Try to promote instructions from the WaitSet to the PendingSet.
152 // Add promoted instructions to the 'Pending' vector in input.
153 // Returns true if at least one instruction was promoted.
154 bool promoteToPendingSet(SmallVectorImpl
<InstRef
> &Pending
);
157 Scheduler(const MCSchedModel
&Model
, LSUnit
&Lsu
)
158 : Scheduler(Model
, Lsu
, nullptr) {}
160 Scheduler(const MCSchedModel
&Model
, LSUnit
&Lsu
,
161 std::unique_ptr
<SchedulerStrategy
> SelectStrategy
)
162 : Scheduler(std::make_unique
<ResourceManager
>(Model
), Lsu
,
163 std::move(SelectStrategy
)) {}
165 Scheduler(std::unique_ptr
<ResourceManager
> RM
, LSUnit
&Lsu
,
166 std::unique_ptr
<SchedulerStrategy
> SelectStrategy
)
167 : LSU(Lsu
), Resources(std::move(RM
)), BusyResourceUnits(0),
168 NumDispatchedToThePendingSet(0), HadTokenStall(false) {
169 initializeStrategy(std::move(SelectStrategy
));
172 // Stalls generated by the scheduler.
178 SC_DISPATCH_GROUP_STALL
,
181 /// Check if the instruction in 'IR' can be dispatched during this cycle.
182 /// Return SC_AVAILABLE if both scheduler and LS resources are available.
184 /// This method is also responsible for setting field HadTokenStall if
185 /// IR cannot be dispatched to the Scheduler due to unavailable resources.
186 Status
isAvailable(const InstRef
&IR
);
188 /// Reserves buffer and LSUnit queue resources that are necessary to issue
189 /// this instruction.
191 /// Returns true if instruction IR is ready to be issued to the underlying
192 /// pipelines. Note that this operation cannot fail; it assumes that a
193 /// previous call to method `isAvailable(IR)` returned `SC_AVAILABLE`.
195 /// If IR is a memory operation, then the Scheduler queries the LS unit to
196 /// obtain a LS token. An LS token is used internally to track memory
198 bool dispatch(InstRef
&IR
);
200 /// Issue an instruction and populates a vector of used pipeline resources,
201 /// and a vector of instructions that transitioned to the ready state as a
202 /// result of this event.
203 void issueInstruction(
205 SmallVectorImpl
<std::pair
<ResourceRef
, ResourceCycles
>> &Used
,
206 SmallVectorImpl
<InstRef
> &Pending
,
207 SmallVectorImpl
<InstRef
> &Ready
);
209 /// Returns true if IR has to be issued immediately, or if IR is a zero
210 /// latency instruction.
211 bool mustIssueImmediately(const InstRef
&IR
) const;
213 /// This routine notifies the Scheduler that a new cycle just started.
215 /// It notifies the underlying ResourceManager that a new cycle just started.
216 /// Vector `Freed` is populated with resourceRef related to resources that
217 /// have changed in state, and that are now available to new instructions.
218 /// Instructions executed are added to vector Executed, while vector Ready is
219 /// populated with instructions that have become ready in this new cycle.
220 /// Vector Pending is popluated by instructions that have transitioned through
221 /// the pending stat during this cycle. The Pending and Ready sets may not be
222 /// disjoint. An instruction is allowed to transition from the WAIT state to
223 /// the READY state (going through the PENDING state) within a single cycle.
224 /// That means, instructions may appear in both the Pending and Ready set.
225 void cycleEvent(SmallVectorImpl
<ResourceRef
> &Freed
,
226 SmallVectorImpl
<InstRef
> &Executed
,
227 SmallVectorImpl
<InstRef
> &Pending
,
228 SmallVectorImpl
<InstRef
> &Ready
);
230 /// Convert a resource mask into a valid llvm processor resource identifier.
232 /// Only the most significant bit of the Mask is used by this method to
233 /// identify the processor resource.
234 unsigned getResourceID(uint64_t Mask
) const {
235 return Resources
->resolveResourceMask(Mask
);
238 /// Select the next instruction to issue from the ReadySet. Returns an invalid
239 /// instruction reference if there are no ready instructions, or if processor
240 /// resources are not available.
243 bool isReadySetEmpty() const { return ReadySet
.empty(); }
244 bool isWaitSetEmpty() const { return WaitSet
.empty(); }
246 /// This method is called by the ExecuteStage at the end of each cycle to
247 /// identify bottlenecks caused by data dependencies. Vector RegDeps is
248 /// populated by instructions that were not issued because of unsolved
249 /// register dependencies. Vector MemDeps is populated by instructions that
250 /// were not issued because of unsolved memory dependencies.
251 void analyzeDataDependencies(SmallVectorImpl
<InstRef
> &RegDeps
,
252 SmallVectorImpl
<InstRef
> &MemDeps
);
254 /// Returns a mask of busy resources, and populates vector Insts with
255 /// instructions that could not be issued to the underlying pipelines because
256 /// not all pipeline resources were available.
257 uint64_t analyzeResourcePressure(SmallVectorImpl
<InstRef
> &Insts
);
259 // Returns true if the dispatch logic couldn't dispatch a full group due to
260 // unavailable scheduler and/or LS resources.
261 bool hadTokenStall() const { return HadTokenStall
; }
264 // Update the ready queues.
267 // This routine performs a sanity check. This routine should only be called
268 // when we know that 'IR' is not in the scheduler's instruction queues.
269 void sanityCheck(const InstRef
&IR
) const {
270 assert(find(WaitSet
, IR
) == WaitSet
.end() && "Already in the wait set!");
271 assert(find(ReadySet
, IR
) == ReadySet
.end() && "Already in the ready set!");
272 assert(find(IssuedSet
, IR
) == IssuedSet
.end() && "Already executing!");
279 #endif // LLVM_MCA_SCHEDULER_H