Details | Last modification | View Log | RSS feed
Rev | Author | Line No. | Line |
---|---|---|---|
14 | pmbaty | 1 | //===--------------------- Scheduler.h ------------------------*- C++ -*-===// |
2 | // |
||
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
||
4 | // See https://llvm.org/LICENSE.txt for license information. |
||
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
||
6 | // |
||
7 | //===----------------------------------------------------------------------===// |
||
8 | /// \file |
||
9 | /// |
||
10 | /// A scheduler for Processor Resource Units and Processor Resource Groups. |
||
11 | /// |
||
12 | //===----------------------------------------------------------------------===// |
||
13 | |||
14 | #ifndef LLVM_MCA_HARDWAREUNITS_SCHEDULER_H |
||
15 | #define LLVM_MCA_HARDWAREUNITS_SCHEDULER_H |
||
16 | |||
17 | #include "llvm/ADT/SmallVector.h" |
||
18 | #include "llvm/MC/MCSchedule.h" |
||
19 | #include "llvm/MCA/HardwareUnits/HardwareUnit.h" |
||
20 | #include "llvm/MCA/HardwareUnits/LSUnit.h" |
||
21 | #include "llvm/MCA/HardwareUnits/ResourceManager.h" |
||
22 | #include "llvm/MCA/Support.h" |
||
23 | |||
24 | namespace llvm { |
||
25 | namespace mca { |
||
26 | |||
27 | class SchedulerStrategy { |
||
28 | public: |
||
29 | SchedulerStrategy() = default; |
||
30 | virtual ~SchedulerStrategy(); |
||
31 | |||
32 | /// Returns true if Lhs should take priority over Rhs. |
||
33 | /// |
||
34 | /// This method is used by class Scheduler to select the "best" ready |
||
35 | /// instruction to issue to the underlying pipelines. |
||
36 | virtual bool compare(const InstRef &Lhs, const InstRef &Rhs) const = 0; |
||
37 | }; |
||
38 | |||
39 | /// Default instruction selection strategy used by class Scheduler. |
||
40 | class DefaultSchedulerStrategy : public SchedulerStrategy { |
||
41 | /// This method ranks instructions based on their age, and the number of known |
||
42 | /// users. The lower the rank value, the better. |
||
43 | int computeRank(const InstRef &Lhs) const { |
||
44 | return Lhs.getSourceIndex() - Lhs.getInstruction()->getNumUsers(); |
||
45 | } |
||
46 | |||
47 | public: |
||
48 | DefaultSchedulerStrategy() = default; |
||
49 | virtual ~DefaultSchedulerStrategy(); |
||
50 | |||
51 | bool compare(const InstRef &Lhs, const InstRef &Rhs) const override { |
||
52 | int LhsRank = computeRank(Lhs); |
||
53 | int RhsRank = computeRank(Rhs); |
||
54 | |||
55 | /// Prioritize older instructions over younger instructions to minimize the |
||
56 | /// pressure on the reorder buffer. |
||
57 | if (LhsRank == RhsRank) |
||
58 | return Lhs.getSourceIndex() < Rhs.getSourceIndex(); |
||
59 | return LhsRank < RhsRank; |
||
60 | } |
||
61 | }; |
||
62 | |||
63 | /// Class Scheduler is responsible for issuing instructions to pipeline |
||
64 | /// resources. |
||
65 | /// |
||
66 | /// Internally, it delegates to a ResourceManager the management of processor |
||
67 | /// resources. This class is also responsible for tracking the progress of |
||
68 | /// instructions from the dispatch stage, until the write-back stage. |
||
69 | /// |
||
70 | class Scheduler : public HardwareUnit { |
||
71 | LSUnitBase &LSU; |
||
72 | |||
73 | // Instruction selection strategy for this Scheduler. |
||
74 | std::unique_ptr<SchedulerStrategy> Strategy; |
||
75 | |||
76 | // Hardware resources that are managed by this scheduler. |
||
77 | std::unique_ptr<ResourceManager> Resources; |
||
78 | |||
79 | // Instructions dispatched to the Scheduler are internally classified based on |
||
80 | // the instruction stage (see Instruction::InstrStage). |
||
81 | // |
||
82 | // An Instruction dispatched to the Scheduler is added to the WaitSet if not |
||
83 | // all its register operands are available, and at least one latency is |
||
84 | // unknown. By construction, the WaitSet only contains instructions that are |
||
85 | // in the IS_DISPATCHED stage. |
||
86 | // |
||
87 | // An Instruction transitions from the WaitSet to the PendingSet if the |
||
88 | // instruction is not ready yet, but the latency of every register read is |
||
89 | // known. Instructions in the PendingSet can only be in the IS_PENDING or |
||
90 | // IS_READY stage. Only IS_READY instructions that are waiting on memory |
||
91 | // dependencies can be added to the PendingSet. |
||
92 | // |
||
93 | // Instructions in the PendingSet are immediately dominated only by |
||
94 | // instructions that have already been issued to the underlying pipelines. In |
||
95 | // the presence of bottlenecks caused by data dependencies, the PendingSet can |
||
96 | // be inspected to identify problematic data dependencies between |
||
97 | // instructions. |
||
98 | // |
||
99 | // An instruction is moved to the ReadySet when all register operands become |
||
100 | // available, and all memory dependencies are met. Instructions that are |
||
101 | // moved from the PendingSet to the ReadySet must transition to the 'IS_READY' |
||
102 | // stage. |
||
103 | // |
||
104 | // On every cycle, the Scheduler checks if it can promote instructions from the |
||
105 | // PendingSet to the ReadySet. |
||
106 | // |
||
107 | // An Instruction is moved from the ReadySet to the `IssuedSet` when it starts |
||
108 | // exection. This event also causes an instruction state transition (i.e. from |
||
109 | // state IS_READY, to state IS_EXECUTING). An Instruction leaves the IssuedSet |
||
110 | // only when it reaches the write-back stage. |
||
111 | std::vector<InstRef> WaitSet; |
||
112 | std::vector<InstRef> PendingSet; |
||
113 | std::vector<InstRef> ReadySet; |
||
114 | std::vector<InstRef> IssuedSet; |
||
115 | |||
116 | // A mask of busy resource units. It defaults to the empty set (i.e. a zero |
||
117 | // mask), and it is cleared at the beginning of every cycle. |
||
118 | // It is updated every time the scheduler fails to issue an instruction from |
||
119 | // the ready set due to unavailable pipeline resources. |
||
120 | // Each bit of the mask represents an unavailable resource. |
||
121 | uint64_t BusyResourceUnits; |
||
122 | |||
123 | // Counts the number of instructions in the pending set that were dispatched |
||
124 | // during this cycle. |
||
125 | unsigned NumDispatchedToThePendingSet; |
||
126 | |||
127 | // True if the previous pipeline Stage was unable to dispatch a full group of |
||
128 | // opcodes because scheduler buffers (or LS queues) were unavailable. |
||
129 | bool HadTokenStall; |
||
130 | |||
131 | /// Verify the given selection strategy and set the Strategy member |
||
132 | /// accordingly. If no strategy is provided, the DefaultSchedulerStrategy is |
||
133 | /// used. |
||
134 | void initializeStrategy(std::unique_ptr<SchedulerStrategy> S); |
||
135 | |||
136 | /// Issue an instruction without updating the ready queue. |
||
137 | void issueInstructionImpl( |
||
138 | InstRef &IR, |
||
139 | SmallVectorImpl<std::pair<ResourceRef, ResourceCycles>> &Pipes); |
||
140 | |||
141 | // Identify instructions that have finished executing, and remove them from |
||
142 | // the IssuedSet. References to executed instructions are added to input |
||
143 | // vector 'Executed'. |
||
144 | void updateIssuedSet(SmallVectorImpl<InstRef> &Executed); |
||
145 | |||
146 | // Try to promote instructions from the PendingSet to the ReadySet. |
||
147 | // Add promoted instructions to the 'Ready' vector in input. |
||
148 | // Returns true if at least one instruction was promoted. |
||
149 | bool promoteToReadySet(SmallVectorImpl<InstRef> &Ready); |
||
150 | |||
151 | // Try to promote instructions from the WaitSet to the PendingSet. |
||
152 | // Add promoted instructions to the 'Pending' vector in input. |
||
153 | // Returns true if at least one instruction was promoted. |
||
154 | bool promoteToPendingSet(SmallVectorImpl<InstRef> &Pending); |
||
155 | |||
156 | public: |
||
157 | Scheduler(const MCSchedModel &Model, LSUnitBase &Lsu) |
||
158 | : Scheduler(Model, Lsu, nullptr) {} |
||
159 | |||
160 | Scheduler(const MCSchedModel &Model, LSUnitBase &Lsu, |
||
161 | std::unique_ptr<SchedulerStrategy> SelectStrategy) |
||
162 | : Scheduler(std::make_unique<ResourceManager>(Model), Lsu, |
||
163 | std::move(SelectStrategy)) {} |
||
164 | |||
165 | Scheduler(std::unique_ptr<ResourceManager> RM, LSUnitBase &Lsu, |
||
166 | std::unique_ptr<SchedulerStrategy> SelectStrategy) |
||
167 | : LSU(Lsu), Resources(std::move(RM)), BusyResourceUnits(0), |
||
168 | NumDispatchedToThePendingSet(0), HadTokenStall(false) { |
||
169 | initializeStrategy(std::move(SelectStrategy)); |
||
170 | } |
||
171 | |||
172 | // Stalls generated by the scheduler. |
||
173 | enum Status { |
||
174 | SC_AVAILABLE, |
||
175 | SC_LOAD_QUEUE_FULL, |
||
176 | SC_STORE_QUEUE_FULL, |
||
177 | SC_BUFFERS_FULL, |
||
178 | SC_DISPATCH_GROUP_STALL, |
||
179 | }; |
||
180 | |||
181 | /// Check if the instruction in 'IR' can be dispatched during this cycle. |
||
182 | /// Return SC_AVAILABLE if both scheduler and LS resources are available. |
||
183 | /// |
||
184 | /// This method is also responsible for setting field HadTokenStall if |
||
185 | /// IR cannot be dispatched to the Scheduler due to unavailable resources. |
||
186 | Status isAvailable(const InstRef &IR); |
||
187 | |||
188 | /// Reserves buffer and LSUnit queue resources that are necessary to issue |
||
189 | /// this instruction. |
||
190 | /// |
||
191 | /// Returns true if instruction IR is ready to be issued to the underlying |
||
192 | /// pipelines. Note that this operation cannot fail; it assumes that a |
||
193 | /// previous call to method `isAvailable(IR)` returned `SC_AVAILABLE`. |
||
194 | /// |
||
195 | /// If IR is a memory operation, then the Scheduler queries the LS unit to |
||
196 | /// obtain a LS token. An LS token is used internally to track memory |
||
197 | /// dependencies. |
||
198 | bool dispatch(InstRef &IR); |
||
199 | |||
200 | /// Issue an instruction and populates a vector of used pipeline resources, |
||
201 | /// and a vector of instructions that transitioned to the ready state as a |
||
202 | /// result of this event. |
||
203 | void issueInstruction( |
||
204 | InstRef &IR, |
||
205 | SmallVectorImpl<std::pair<ResourceRef, ResourceCycles>> &Used, |
||
206 | SmallVectorImpl<InstRef> &Pending, |
||
207 | SmallVectorImpl<InstRef> &Ready); |
||
208 | |||
209 | /// Returns true if IR has to be issued immediately, or if IR is a zero |
||
210 | /// latency instruction. |
||
211 | bool mustIssueImmediately(const InstRef &IR) const; |
||
212 | |||
213 | /// This routine notifies the Scheduler that a new cycle just started. |
||
214 | /// |
||
215 | /// It notifies the underlying ResourceManager that a new cycle just started. |
||
216 | /// Vector `Freed` is populated with resourceRef related to resources that |
||
217 | /// have changed in state, and that are now available to new instructions. |
||
218 | /// Instructions executed are added to vector Executed, while vector Ready is |
||
219 | /// populated with instructions that have become ready in this new cycle. |
||
220 | /// Vector Pending is popluated by instructions that have transitioned through |
||
221 | /// the pending stat during this cycle. The Pending and Ready sets may not be |
||
222 | /// disjoint. An instruction is allowed to transition from the WAIT state to |
||
223 | /// the READY state (going through the PENDING state) within a single cycle. |
||
224 | /// That means, instructions may appear in both the Pending and Ready set. |
||
225 | void cycleEvent(SmallVectorImpl<ResourceRef> &Freed, |
||
226 | SmallVectorImpl<InstRef> &Executed, |
||
227 | SmallVectorImpl<InstRef> &Pending, |
||
228 | SmallVectorImpl<InstRef> &Ready); |
||
229 | |||
230 | /// Convert a resource mask into a valid llvm processor resource identifier. |
||
231 | /// |
||
232 | /// Only the most significant bit of the Mask is used by this method to |
||
233 | /// identify the processor resource. |
||
234 | unsigned getResourceID(uint64_t Mask) const { |
||
235 | return Resources->resolveResourceMask(Mask); |
||
236 | } |
||
237 | |||
238 | /// Select the next instruction to issue from the ReadySet. Returns an invalid |
||
239 | /// instruction reference if there are no ready instructions, or if processor |
||
240 | /// resources are not available. |
||
241 | InstRef select(); |
||
242 | |||
243 | bool isReadySetEmpty() const { return ReadySet.empty(); } |
||
244 | bool isWaitSetEmpty() const { return WaitSet.empty(); } |
||
245 | |||
246 | /// This method is called by the ExecuteStage at the end of each cycle to |
||
247 | /// identify bottlenecks caused by data dependencies. Vector RegDeps is |
||
248 | /// populated by instructions that were not issued because of unsolved |
||
249 | /// register dependencies. Vector MemDeps is populated by instructions that |
||
250 | /// were not issued because of unsolved memory dependencies. |
||
251 | void analyzeDataDependencies(SmallVectorImpl<InstRef> &RegDeps, |
||
252 | SmallVectorImpl<InstRef> &MemDeps); |
||
253 | |||
254 | /// Returns a mask of busy resources, and populates vector Insts with |
||
255 | /// instructions that could not be issued to the underlying pipelines because |
||
256 | /// not all pipeline resources were available. |
||
257 | uint64_t analyzeResourcePressure(SmallVectorImpl<InstRef> &Insts); |
||
258 | |||
259 | // Returns true if the dispatch logic couldn't dispatch a full group due to |
||
260 | // unavailable scheduler and/or LS resources. |
||
261 | bool hadTokenStall() const { return HadTokenStall; } |
||
262 | |||
263 | #ifndef NDEBUG |
||
264 | // Update the ready queues. |
||
265 | void dump() const; |
||
266 | |||
267 | // This routine performs a basic correctness check. This routine should only |
||
268 | // be called when we know that 'IR' is not in the scheduler's instruction |
||
269 | // queues. |
||
270 | void instructionCheck(const InstRef &IR) const { |
||
271 | assert(!is_contained(WaitSet, IR) && "Already in the wait set!"); |
||
272 | assert(!is_contained(ReadySet, IR) && "Already in the ready set!"); |
||
273 | assert(!is_contained(IssuedSet, IR) && "Already executing!"); |
||
274 | } |
||
275 | #endif // !NDEBUG |
||
276 | }; |
||
277 | } // namespace mca |
||
278 | } // namespace llvm |
||
279 | |||
280 | #endif // LLVM_MCA_HARDWAREUNITS_SCHEDULER_H |