1 //===--------------------- ResourceManager.h --------------------*- C++ -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
10 /// The classes here represent processor resource units and their management
11 /// strategy. These classes are managed by the Scheduler.
13 //===----------------------------------------------------------------------===//
15 #ifndef LLVM_MCA_RESOURCE_MANAGER_H
16 #define LLVM_MCA_RESOURCE_MANAGER_H
18 #include "llvm/ADT/ArrayRef.h"
19 #include "llvm/ADT/DenseMap.h"
20 #include "llvm/ADT/SmallVector.h"
21 #include "llvm/MC/MCSchedule.h"
22 #include "llvm/MCA/Instruction.h"
23 #include "llvm/MCA/Support.h"
28 /// Used to notify the internal state of a processor resource.
30 /// A processor resource is available if it is not reserved, and there are
31 /// available slots in the buffer. A processor resource is unavailable if it
32 /// is either reserved, or the associated buffer is full. A processor resource
33 /// with a buffer size of -1 is always available if it is not reserved.
35 /// Values of type ResourceStateEvent are returned by method
36 /// ResourceManager::canBeDispatched()
38 /// The naming convention for resource state events is:
39 /// * Event names start with prefix RS_
40 /// * Prefix RS_ is followed by a string describing the actual resource state.
41 enum ResourceStateEvent
{
43 RS_BUFFER_UNAVAILABLE
,
47 /// Resource allocation strategy used by hardware scheduler resources.
48 class ResourceStrategy
{
49 ResourceStrategy(const ResourceStrategy
&) = delete;
50 ResourceStrategy
&operator=(const ResourceStrategy
&) = delete;
54 virtual ~ResourceStrategy();
56 /// Selects a processor resource unit from a ReadyMask.
57 virtual uint64_t select(uint64_t ReadyMask
) = 0;
59 /// Called by the ResourceManager when a processor resource group, or a
60 /// processor resource with multiple units has become unavailable.
62 /// The default strategy uses this information to bias its selection logic.
63 virtual void used(uint64_t ResourceMask
) {}
66 /// Default resource allocation strategy used by processor resource groups and
67 /// processor resources with multiple units.
68 class DefaultResourceStrategy final
: public ResourceStrategy
{
69 /// A Mask of resource unit identifiers.
71 /// There is one bit set for every available resource unit.
72 /// It defaults to the value of field ResourceSizeMask in ResourceState.
73 const uint64_t ResourceUnitMask
;
75 /// A simple round-robin selector for processor resource units.
76 /// Each bit of this mask identifies a sub resource within a group.
78 /// As an example, lets assume that this is a default policy for a
79 /// processor resource group composed by the following three units:
80 /// ResourceA -- 0b001
81 /// ResourceB -- 0b010
82 /// ResourceC -- 0b100
84 /// Field NextInSequenceMask is used to select the next unit from the set of
85 /// resource units. It defaults to the value of field `ResourceUnitMasks` (in
86 /// this example, it defaults to mask '0b111').
88 /// The round-robin selector would firstly select 'ResourceC', then
89 /// 'ResourceB', and eventually 'ResourceA'. When a resource R is used, the
90 /// corresponding bit in NextInSequenceMask is cleared. For example, if
91 /// 'ResourceC' is selected, then the new value of NextInSequenceMask becomes
94 /// When NextInSequenceMask becomes zero, it is automatically reset to the
95 /// default value (i.e. ResourceUnitMask).
96 uint64_t NextInSequenceMask
;
98 /// This field is used to track resource units that are used (i.e. selected)
99 /// by other groups other than the one associated with this strategy object.
101 /// In LLVM processor resource groups are allowed to partially (or fully)
102 /// overlap. That means, a same unit may be visible to multiple groups.
103 /// This field keeps track of uses that have originated from outside of
104 /// this group. The idea is to bias the selection strategy, so that resources
105 /// that haven't been used by other groups get prioritized.
107 /// The end goal is to (try to) keep the resource distribution as much uniform
108 /// as possible. By construction, this mask only tracks one-level of resource
109 /// usage. Therefore, this strategy is expected to be less accurate when same
110 /// units are used multiple times by other groups within a single round of
113 /// Note: an LRU selector would have a better accuracy at the cost of being
114 /// slightly more expensive (mostly in terms of runtime cost). Methods
115 /// 'select' and 'used', are always in the hot execution path of llvm-mca.
116 /// Therefore, a slow implementation of 'select' would have a negative impact
117 /// on the overall performance of the tool.
118 uint64_t RemovedFromNextInSequence
;
121 DefaultResourceStrategy(uint64_t UnitMask
)
122 : ResourceStrategy(), ResourceUnitMask(UnitMask
),
123 NextInSequenceMask(UnitMask
), RemovedFromNextInSequence(0) {}
124 virtual ~DefaultResourceStrategy() = default;
126 uint64_t select(uint64_t ReadyMask
) override
;
127 void used(uint64_t Mask
) override
;
130 /// A processor resource descriptor.
132 /// There is an instance of this class for every processor resource defined by
133 /// the machine scheduling model.
134 /// Objects of class ResourceState dynamically track the usage of processor
136 class ResourceState
{
137 /// An index to the MCProcResourceDesc entry in the processor model.
138 const unsigned ProcResourceDescIndex
;
139 /// A resource mask. This is generated by the tool with the help of
140 /// function `mca::computeProcResourceMasks' (see Support.h).
142 /// Field ResourceMask only has one bit set if this resource state describes a
143 /// processor resource unit (i.e. this is not a group). That means, we can
144 /// quickly check if a resource is a group by simply counting the number of
145 /// bits that are set in the mask.
147 /// The most significant bit of a mask (MSB) uniquely identifies a resource.
148 /// Remaining bits are used to describe the composition of a group (Group).
150 /// Example (little endian):
151 /// Resource | Mask | MSB | Group
152 /// ---------+------------+------------+------------
153 /// A | 0b000001 | 0b000001 | 0b000000
155 /// B | 0b000010 | 0b000010 | 0b000000
157 /// C | 0b010000 | 0b010000 | 0b000000
159 /// D | 0b110010 | 0b100000 | 0b010010
161 /// In this example, resources A, B and C are processor resource units.
162 /// Only resource D is a group resource, and it contains resources B and C.
163 /// That is because MSB(B) and MSB(C) are both contained within Group(D).
164 const uint64_t ResourceMask
;
166 /// A ProcResource can have multiple units.
168 /// For processor resource groups this field is a mask of contained resource
169 /// units. It is obtained from ResourceMask by clearing the highest set bit.
170 /// The number of resource units in a group can be simply computed as the
171 /// population count of this field.
173 /// For normal (i.e. non-group) resources, the number of bits set in this mask
174 /// is equivalent to the number of units declared by the processor model (see
175 /// field 'NumUnits' in 'ProcResourceUnits').
176 uint64_t ResourceSizeMask
;
178 /// A mask of ready units.
181 /// Buffered resources will have this field set to a positive number different
182 /// than zero. A buffered resource behaves like a reservation station
183 /// implementing its own buffer for out-of-order execution.
185 /// A BufferSize of 1 is used by scheduler resources that force in-order
188 /// A BufferSize of 0 is used to model in-order issue/dispatch resources.
189 /// Since in-order issue/dispatch resources don't implement buffers, dispatch
190 /// events coincide with issue events.
191 /// Also, no other instruction ca be dispatched/issue while this resource is
192 /// in use. Only when all the "resource cycles" are consumed (after the issue
193 /// event), a new instruction ca be dispatched.
194 const int BufferSize
;
196 /// Available slots in the buffer (zero, if this is not a buffered resource).
197 unsigned AvailableSlots
;
199 /// This field is set if this resource is currently reserved.
201 /// Resources can be reserved for a number of cycles.
202 /// Instructions can still be dispatched to reserved resources. However,
203 /// istructions dispatched to a reserved resource cannot be issued to the
204 /// underlying units (i.e. pipelines) until the resource is released.
209 /// Checks for the availability of unit 'SubResMask' in the group.
210 bool isSubResourceReady(uint64_t SubResMask
) const {
211 return ReadyMask
& SubResMask
;
215 ResourceState(const MCProcResourceDesc
&Desc
, unsigned Index
, uint64_t Mask
);
217 unsigned getProcResourceID() const { return ProcResourceDescIndex
; }
218 uint64_t getResourceMask() const { return ResourceMask
; }
219 uint64_t getReadyMask() const { return ReadyMask
; }
220 int getBufferSize() const { return BufferSize
; }
222 bool isBuffered() const { return BufferSize
> 0; }
223 bool isInOrder() const { return BufferSize
== 1; }
225 /// Returns true if this is an in-order dispatch/issue resource.
226 bool isADispatchHazard() const { return BufferSize
== 0; }
227 bool isReserved() const { return Unavailable
; }
229 void setReserved() { Unavailable
= true; }
230 void clearReserved() { Unavailable
= false; }
232 /// Returs true if this resource is not reserved, and if there are at least
233 /// `NumUnits` available units.
234 bool isReady(unsigned NumUnits
= 1) const;
236 bool isAResourceGroup() const { return IsAGroup
; }
238 bool containsResource(uint64_t ID
) const { return ResourceMask
& ID
; }
240 void markSubResourceAsUsed(uint64_t ID
) {
241 assert(isSubResourceReady(ID
));
245 void releaseSubResource(uint64_t ID
) {
246 assert(!isSubResourceReady(ID
));
250 unsigned getNumUnits() const {
251 return isAResourceGroup() ? 1U : countPopulation(ResourceSizeMask
);
254 /// Checks if there is an available slot in the resource buffer.
256 /// Returns RS_BUFFER_AVAILABLE if this is not a buffered resource, or if
257 /// there is a slot available.
259 /// Returns RS_RESERVED if this buffered resource is a dispatch hazard, and it
262 /// Returns RS_BUFFER_UNAVAILABLE if there are no available slots.
263 ResourceStateEvent
isBufferAvailable() const;
265 /// Reserve a buffer slot.
267 /// Returns true if the buffer is not full.
268 /// It always returns true if BufferSize is set to zero.
269 bool reserveBuffer() {
274 assert(AvailableSlots
<= static_cast<unsigned>(BufferSize
));
275 return AvailableSlots
;
278 /// Releases a slot in the buffer.
279 void releaseBuffer() {
280 // Ignore dispatch hazards or invalid buffer sizes.
285 assert(AvailableSlots
<= static_cast<unsigned>(BufferSize
));
293 /// A resource unit identifier.
295 /// This is used to identify a specific processor resource unit using a pair
296 /// of indices where the 'first' index is a processor resource mask, and the
297 /// 'second' index is an index for a "sub-resource" (i.e. unit).
298 typedef std::pair
<uint64_t, uint64_t> ResourceRef
;
300 // First: a MCProcResourceDesc index identifying a buffered resource.
301 // Second: max number of buffer entries used in this resource.
302 typedef std::pair
<unsigned, unsigned> BufferUsageEntry
;
304 /// A resource manager for processor resource units and groups.
306 /// This class owns all the ResourceState objects, and it is responsible for
307 /// acting on requests from a Scheduler by updating the internal state of
308 /// ResourceState objects.
309 /// This class doesn't know about instruction itineraries and functional units.
310 /// In future, it can be extended to support itineraries too through the same
311 /// public interface.
312 class ResourceManager
{
313 // Set of resources available on the subtarget.
315 // There is an instance of ResourceState for every resource declared by the
316 // target scheduling model.
318 // Elements of this vector are ordered by resource kind. In particular,
319 // resource units take precedence over resource groups.
321 // The index of a processor resource in this vector depends on the value of
322 // its mask (see the description of field ResourceState::ResourceMask). In
323 // particular, it is computed as the position of the most significant bit set
324 // (MSB) in the mask plus one (since we want to ignore the invalid resource
325 // descriptor at index zero).
327 // Example (little endian):
329 // Resource | Mask | MSB | Index
330 // ---------+---------+---------+-------
331 // A | 0b00001 | 0b00001 | 1
333 // B | 0b00100 | 0b00100 | 3
335 // C | 0b10010 | 0b10000 | 5
338 // The same index is also used to address elements within vector `Strategies`
339 // and vector `Resource2Groups`.
340 std::vector
<std::unique_ptr
<ResourceState
>> Resources
;
341 std::vector
<std::unique_ptr
<ResourceStrategy
>> Strategies
;
343 // Used to quickly identify groups that own a particular resource unit.
344 std::vector
<uint64_t> Resource2Groups
;
346 // A table that maps processor resource IDs to processor resource masks.
347 SmallVector
<uint64_t, 8> ProcResID2Mask
;
349 // A table that maps resource indices to actual processor resource IDs in the
351 SmallVector
<unsigned, 8> ResIndex2ProcResID
;
353 // Keeps track of which resources are busy, and how many cycles are left
354 // before those become usable again.
355 SmallDenseMap
<ResourceRef
, unsigned> BusyResources
;
357 // Set of processor resource units available on the target.
358 uint64_t ProcResUnitMask
;
360 // Set of processor resource units that are available during this cycle.
361 uint64_t AvailableProcResUnits
;
363 // Set of processor resources that are currently reserved.
364 uint64_t ReservedResourceGroups
;
366 // Set of unavailable scheduler buffer resources. This is used internally to
367 // speedup `canBeDispatched()` queries.
368 uint64_t AvailableBuffers
;
370 // Set of dispatch hazard buffer resources that are currently unavailable.
371 uint64_t ReservedBuffers
;
373 // Returns the actual resource unit that will be used.
374 ResourceRef
selectPipe(uint64_t ResourceID
);
376 void use(const ResourceRef
&RR
);
377 void release(const ResourceRef
&RR
);
379 unsigned getNumUnits(uint64_t ResourceID
) const;
381 // Overrides the selection strategy for the processor resource with the given
383 void setCustomStrategyImpl(std::unique_ptr
<ResourceStrategy
> S
,
384 uint64_t ResourceMask
);
387 ResourceManager(const MCSchedModel
&SM
);
388 virtual ~ResourceManager() = default;
390 // Overrides the selection strategy for the resource at index ResourceID in
391 // the MCProcResourceDesc table.
392 void setCustomStrategy(std::unique_ptr
<ResourceStrategy
> S
,
393 unsigned ResourceID
) {
394 assert(ResourceID
< ProcResID2Mask
.size() &&
395 "Invalid resource index in input!");
396 return setCustomStrategyImpl(std::move(S
), ProcResID2Mask
[ResourceID
]);
399 // Returns RS_BUFFER_AVAILABLE if buffered resources are not reserved, and if
400 // there are enough available slots in the buffers.
401 ResourceStateEvent
canBeDispatched(uint64_t ConsumedBuffers
) const;
403 // Return the processor resource identifier associated to this Mask.
404 unsigned resolveResourceMask(uint64_t Mask
) const;
406 // Acquires a slot from every buffered resource in mask `ConsumedBuffers`.
407 // Units that are dispatch hazards (i.e. BufferSize=0) are marked as reserved.
408 void reserveBuffers(uint64_t ConsumedBuffers
);
410 // Releases a slot from every buffered resource in mask `ConsumedBuffers`.
411 // ConsumedBuffers is a bitmask of previously acquired buffers (using method
412 // `reserveBuffers`). Units that are dispatch hazards (i.e. BufferSize=0) are
413 // not automatically unreserved by this method.
414 void releaseBuffers(uint64_t ConsumedBuffers
);
416 // Reserve a processor resource. A reserved resource is not available for
417 // instruction issue until it is released.
418 void reserveResource(uint64_t ResourceID
);
420 // Release a previously reserved processor resource.
421 void releaseResource(uint64_t ResourceID
);
423 // Returns a zero mask if resources requested by Desc are all available during
424 // this cycle. It returns a non-zero mask value only if there are unavailable
425 // processor resources; each bit set in the mask represents a busy processor
426 // resource unit or a reserved processor resource group.
427 uint64_t checkAvailability(const InstrDesc
&Desc
) const;
429 uint64_t getProcResUnitMask() const { return ProcResUnitMask
; }
430 uint64_t getAvailableProcResUnits() const { return AvailableProcResUnits
; }
432 void issueInstruction(
433 const InstrDesc
&Desc
,
434 SmallVectorImpl
<std::pair
<ResourceRef
, ResourceCycles
>> &Pipes
);
436 void cycleEvent(SmallVectorImpl
<ResourceRef
> &ResourcesFreed
);
440 for (const std::unique_ptr
<ResourceState
> &Resource
: Resources
)
448 #endif // LLVM_MCA_RESOURCE_MANAGER_H