Details | Last modification | View Log | RSS feed
| Rev | Author | Line No. | Line |
|---|---|---|---|
| 14 | pmbaty | 1 | //===--------------------- Scheduler.h ------------------------*- C++ -*-===// |
| 2 | // |
||
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
||
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
||
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
||
| 6 | // |
||
| 7 | //===----------------------------------------------------------------------===// |
||
| 8 | /// \file |
||
| 9 | /// |
||
| 10 | /// A scheduler for Processor Resource Units and Processor Resource Groups. |
||
| 11 | /// |
||
| 12 | //===----------------------------------------------------------------------===// |
||
| 13 | |||
| 14 | #ifndef LLVM_MCA_HARDWAREUNITS_SCHEDULER_H |
||
| 15 | #define LLVM_MCA_HARDWAREUNITS_SCHEDULER_H |
||
| 16 | |||
| 17 | #include "llvm/ADT/SmallVector.h" |
||
| 18 | #include "llvm/MC/MCSchedule.h" |
||
| 19 | #include "llvm/MCA/HardwareUnits/HardwareUnit.h" |
||
| 20 | #include "llvm/MCA/HardwareUnits/LSUnit.h" |
||
| 21 | #include "llvm/MCA/HardwareUnits/ResourceManager.h" |
||
| 22 | #include "llvm/MCA/Support.h" |
||
| 23 | |||
| 24 | namespace llvm { |
||
| 25 | namespace mca { |
||
| 26 | |||
| 27 | class SchedulerStrategy { |
||
| 28 | public: |
||
| 29 | SchedulerStrategy() = default; |
||
| 30 | virtual ~SchedulerStrategy(); |
||
| 31 | |||
| 32 | /// Returns true if Lhs should take priority over Rhs. |
||
| 33 | /// |
||
| 34 | /// This method is used by class Scheduler to select the "best" ready |
||
| 35 | /// instruction to issue to the underlying pipelines. |
||
| 36 | virtual bool compare(const InstRef &Lhs, const InstRef &Rhs) const = 0; |
||
| 37 | }; |
||
| 38 | |||
| 39 | /// Default instruction selection strategy used by class Scheduler. |
||
| 40 | class DefaultSchedulerStrategy : public SchedulerStrategy { |
||
| 41 | /// This method ranks instructions based on their age, and the number of known |
||
| 42 | /// users. The lower the rank value, the better. |
||
| 43 | int computeRank(const InstRef &Lhs) const { |
||
| 44 | return Lhs.getSourceIndex() - Lhs.getInstruction()->getNumUsers(); |
||
| 45 | } |
||
| 46 | |||
| 47 | public: |
||
| 48 | DefaultSchedulerStrategy() = default; |
||
| 49 | virtual ~DefaultSchedulerStrategy(); |
||
| 50 | |||
| 51 | bool compare(const InstRef &Lhs, const InstRef &Rhs) const override { |
||
| 52 | int LhsRank = computeRank(Lhs); |
||
| 53 | int RhsRank = computeRank(Rhs); |
||
| 54 | |||
| 55 | /// Prioritize older instructions over younger instructions to minimize the |
||
| 56 | /// pressure on the reorder buffer. |
||
| 57 | if (LhsRank == RhsRank) |
||
| 58 | return Lhs.getSourceIndex() < Rhs.getSourceIndex(); |
||
| 59 | return LhsRank < RhsRank; |
||
| 60 | } |
||
| 61 | }; |
||
| 62 | |||
| 63 | /// Class Scheduler is responsible for issuing instructions to pipeline |
||
| 64 | /// resources. |
||
| 65 | /// |
||
| 66 | /// Internally, it delegates to a ResourceManager the management of processor |
||
| 67 | /// resources. This class is also responsible for tracking the progress of |
||
| 68 | /// instructions from the dispatch stage, until the write-back stage. |
||
| 69 | /// |
||
| 70 | class Scheduler : public HardwareUnit { |
||
| 71 | LSUnitBase &LSU; |
||
| 72 | |||
| 73 | // Instruction selection strategy for this Scheduler. |
||
| 74 | std::unique_ptr<SchedulerStrategy> Strategy; |
||
| 75 | |||
| 76 | // Hardware resources that are managed by this scheduler. |
||
| 77 | std::unique_ptr<ResourceManager> Resources; |
||
| 78 | |||
| 79 | // Instructions dispatched to the Scheduler are internally classified based on |
||
| 80 | // the instruction stage (see Instruction::InstrStage). |
||
| 81 | // |
||
| 82 | // An Instruction dispatched to the Scheduler is added to the WaitSet if not |
||
| 83 | // all its register operands are available, and at least one latency is |
||
| 84 | // unknown. By construction, the WaitSet only contains instructions that are |
||
| 85 | // in the IS_DISPATCHED stage. |
||
| 86 | // |
||
| 87 | // An Instruction transitions from the WaitSet to the PendingSet if the |
||
| 88 | // instruction is not ready yet, but the latency of every register read is |
||
| 89 | // known. Instructions in the PendingSet can only be in the IS_PENDING or |
||
| 90 | // IS_READY stage. Only IS_READY instructions that are waiting on memory |
||
| 91 | // dependencies can be added to the PendingSet. |
||
| 92 | // |
||
| 93 | // Instructions in the PendingSet are immediately dominated only by |
||
| 94 | // instructions that have already been issued to the underlying pipelines. In |
||
| 95 | // the presence of bottlenecks caused by data dependencies, the PendingSet can |
||
| 96 | // be inspected to identify problematic data dependencies between |
||
| 97 | // instructions. |
||
| 98 | // |
||
| 99 | // An instruction is moved to the ReadySet when all register operands become |
||
| 100 | // available, and all memory dependencies are met. Instructions that are |
||
| 101 | // moved from the PendingSet to the ReadySet must transition to the 'IS_READY' |
||
| 102 | // stage. |
||
| 103 | // |
||
| 104 | // On every cycle, the Scheduler checks if it can promote instructions from the |
||
| 105 | // PendingSet to the ReadySet. |
||
| 106 | // |
||
| 107 | // An Instruction is moved from the ReadySet to the `IssuedSet` when it starts |
||
| 108 | // exection. This event also causes an instruction state transition (i.e. from |
||
| 109 | // state IS_READY, to state IS_EXECUTING). An Instruction leaves the IssuedSet |
||
| 110 | // only when it reaches the write-back stage. |
||
| 111 | std::vector<InstRef> WaitSet; |
||
| 112 | std::vector<InstRef> PendingSet; |
||
| 113 | std::vector<InstRef> ReadySet; |
||
| 114 | std::vector<InstRef> IssuedSet; |
||
| 115 | |||
| 116 | // A mask of busy resource units. It defaults to the empty set (i.e. a zero |
||
| 117 | // mask), and it is cleared at the beginning of every cycle. |
||
| 118 | // It is updated every time the scheduler fails to issue an instruction from |
||
| 119 | // the ready set due to unavailable pipeline resources. |
||
| 120 | // Each bit of the mask represents an unavailable resource. |
||
| 121 | uint64_t BusyResourceUnits; |
||
| 122 | |||
| 123 | // Counts the number of instructions in the pending set that were dispatched |
||
| 124 | // during this cycle. |
||
| 125 | unsigned NumDispatchedToThePendingSet; |
||
| 126 | |||
| 127 | // True if the previous pipeline Stage was unable to dispatch a full group of |
||
| 128 | // opcodes because scheduler buffers (or LS queues) were unavailable. |
||
| 129 | bool HadTokenStall; |
||
| 130 | |||
| 131 | /// Verify the given selection strategy and set the Strategy member |
||
| 132 | /// accordingly. If no strategy is provided, the DefaultSchedulerStrategy is |
||
| 133 | /// used. |
||
| 134 | void initializeStrategy(std::unique_ptr<SchedulerStrategy> S); |
||
| 135 | |||
| 136 | /// Issue an instruction without updating the ready queue. |
||
| 137 | void issueInstructionImpl( |
||
| 138 | InstRef &IR, |
||
| 139 | SmallVectorImpl<std::pair<ResourceRef, ResourceCycles>> &Pipes); |
||
| 140 | |||
| 141 | // Identify instructions that have finished executing, and remove them from |
||
| 142 | // the IssuedSet. References to executed instructions are added to input |
||
| 143 | // vector 'Executed'. |
||
| 144 | void updateIssuedSet(SmallVectorImpl<InstRef> &Executed); |
||
| 145 | |||
| 146 | // Try to promote instructions from the PendingSet to the ReadySet. |
||
| 147 | // Add promoted instructions to the 'Ready' vector in input. |
||
| 148 | // Returns true if at least one instruction was promoted. |
||
| 149 | bool promoteToReadySet(SmallVectorImpl<InstRef> &Ready); |
||
| 150 | |||
| 151 | // Try to promote instructions from the WaitSet to the PendingSet. |
||
| 152 | // Add promoted instructions to the 'Pending' vector in input. |
||
| 153 | // Returns true if at least one instruction was promoted. |
||
| 154 | bool promoteToPendingSet(SmallVectorImpl<InstRef> &Pending); |
||
| 155 | |||
| 156 | public: |
||
| 157 | Scheduler(const MCSchedModel &Model, LSUnitBase &Lsu) |
||
| 158 | : Scheduler(Model, Lsu, nullptr) {} |
||
| 159 | |||
| 160 | Scheduler(const MCSchedModel &Model, LSUnitBase &Lsu, |
||
| 161 | std::unique_ptr<SchedulerStrategy> SelectStrategy) |
||
| 162 | : Scheduler(std::make_unique<ResourceManager>(Model), Lsu, |
||
| 163 | std::move(SelectStrategy)) {} |
||
| 164 | |||
| 165 | Scheduler(std::unique_ptr<ResourceManager> RM, LSUnitBase &Lsu, |
||
| 166 | std::unique_ptr<SchedulerStrategy> SelectStrategy) |
||
| 167 | : LSU(Lsu), Resources(std::move(RM)), BusyResourceUnits(0), |
||
| 168 | NumDispatchedToThePendingSet(0), HadTokenStall(false) { |
||
| 169 | initializeStrategy(std::move(SelectStrategy)); |
||
| 170 | } |
||
| 171 | |||
| 172 | // Stalls generated by the scheduler. |
||
| 173 | enum Status { |
||
| 174 | SC_AVAILABLE, |
||
| 175 | SC_LOAD_QUEUE_FULL, |
||
| 176 | SC_STORE_QUEUE_FULL, |
||
| 177 | SC_BUFFERS_FULL, |
||
| 178 | SC_DISPATCH_GROUP_STALL, |
||
| 179 | }; |
||
| 180 | |||
| 181 | /// Check if the instruction in 'IR' can be dispatched during this cycle. |
||
| 182 | /// Return SC_AVAILABLE if both scheduler and LS resources are available. |
||
| 183 | /// |
||
| 184 | /// This method is also responsible for setting field HadTokenStall if |
||
| 185 | /// IR cannot be dispatched to the Scheduler due to unavailable resources. |
||
| 186 | Status isAvailable(const InstRef &IR); |
||
| 187 | |||
| 188 | /// Reserves buffer and LSUnit queue resources that are necessary to issue |
||
| 189 | /// this instruction. |
||
| 190 | /// |
||
| 191 | /// Returns true if instruction IR is ready to be issued to the underlying |
||
| 192 | /// pipelines. Note that this operation cannot fail; it assumes that a |
||
| 193 | /// previous call to method `isAvailable(IR)` returned `SC_AVAILABLE`. |
||
| 194 | /// |
||
| 195 | /// If IR is a memory operation, then the Scheduler queries the LS unit to |
||
| 196 | /// obtain a LS token. An LS token is used internally to track memory |
||
| 197 | /// dependencies. |
||
| 198 | bool dispatch(InstRef &IR); |
||
| 199 | |||
| 200 | /// Issue an instruction and populates a vector of used pipeline resources, |
||
| 201 | /// and a vector of instructions that transitioned to the ready state as a |
||
| 202 | /// result of this event. |
||
| 203 | void issueInstruction( |
||
| 204 | InstRef &IR, |
||
| 205 | SmallVectorImpl<std::pair<ResourceRef, ResourceCycles>> &Used, |
||
| 206 | SmallVectorImpl<InstRef> &Pending, |
||
| 207 | SmallVectorImpl<InstRef> &Ready); |
||
| 208 | |||
| 209 | /// Returns true if IR has to be issued immediately, or if IR is a zero |
||
| 210 | /// latency instruction. |
||
| 211 | bool mustIssueImmediately(const InstRef &IR) const; |
||
| 212 | |||
| 213 | /// This routine notifies the Scheduler that a new cycle just started. |
||
| 214 | /// |
||
| 215 | /// It notifies the underlying ResourceManager that a new cycle just started. |
||
| 216 | /// Vector `Freed` is populated with resourceRef related to resources that |
||
| 217 | /// have changed in state, and that are now available to new instructions. |
||
| 218 | /// Instructions executed are added to vector Executed, while vector Ready is |
||
| 219 | /// populated with instructions that have become ready in this new cycle. |
||
| 220 | /// Vector Pending is popluated by instructions that have transitioned through |
||
| 221 | /// the pending stat during this cycle. The Pending and Ready sets may not be |
||
| 222 | /// disjoint. An instruction is allowed to transition from the WAIT state to |
||
| 223 | /// the READY state (going through the PENDING state) within a single cycle. |
||
| 224 | /// That means, instructions may appear in both the Pending and Ready set. |
||
| 225 | void cycleEvent(SmallVectorImpl<ResourceRef> &Freed, |
||
| 226 | SmallVectorImpl<InstRef> &Executed, |
||
| 227 | SmallVectorImpl<InstRef> &Pending, |
||
| 228 | SmallVectorImpl<InstRef> &Ready); |
||
| 229 | |||
| 230 | /// Convert a resource mask into a valid llvm processor resource identifier. |
||
| 231 | /// |
||
| 232 | /// Only the most significant bit of the Mask is used by this method to |
||
| 233 | /// identify the processor resource. |
||
| 234 | unsigned getResourceID(uint64_t Mask) const { |
||
| 235 | return Resources->resolveResourceMask(Mask); |
||
| 236 | } |
||
| 237 | |||
| 238 | /// Select the next instruction to issue from the ReadySet. Returns an invalid |
||
| 239 | /// instruction reference if there are no ready instructions, or if processor |
||
| 240 | /// resources are not available. |
||
| 241 | InstRef select(); |
||
| 242 | |||
| 243 | bool isReadySetEmpty() const { return ReadySet.empty(); } |
||
| 244 | bool isWaitSetEmpty() const { return WaitSet.empty(); } |
||
| 245 | |||
| 246 | /// This method is called by the ExecuteStage at the end of each cycle to |
||
| 247 | /// identify bottlenecks caused by data dependencies. Vector RegDeps is |
||
| 248 | /// populated by instructions that were not issued because of unsolved |
||
| 249 | /// register dependencies. Vector MemDeps is populated by instructions that |
||
| 250 | /// were not issued because of unsolved memory dependencies. |
||
| 251 | void analyzeDataDependencies(SmallVectorImpl<InstRef> &RegDeps, |
||
| 252 | SmallVectorImpl<InstRef> &MemDeps); |
||
| 253 | |||
| 254 | /// Returns a mask of busy resources, and populates vector Insts with |
||
| 255 | /// instructions that could not be issued to the underlying pipelines because |
||
| 256 | /// not all pipeline resources were available. |
||
| 257 | uint64_t analyzeResourcePressure(SmallVectorImpl<InstRef> &Insts); |
||
| 258 | |||
| 259 | // Returns true if the dispatch logic couldn't dispatch a full group due to |
||
| 260 | // unavailable scheduler and/or LS resources. |
||
| 261 | bool hadTokenStall() const { return HadTokenStall; } |
||
| 262 | |||
| 263 | #ifndef NDEBUG |
||
| 264 | // Update the ready queues. |
||
| 265 | void dump() const; |
||
| 266 | |||
| 267 | // This routine performs a basic correctness check. This routine should only |
||
| 268 | // be called when we know that 'IR' is not in the scheduler's instruction |
||
| 269 | // queues. |
||
| 270 | void instructionCheck(const InstRef &IR) const { |
||
| 271 | assert(!is_contained(WaitSet, IR) && "Already in the wait set!"); |
||
| 272 | assert(!is_contained(ReadySet, IR) && "Already in the ready set!"); |
||
| 273 | assert(!is_contained(IssuedSet, IR) && "Already executing!"); |
||
| 274 | } |
||
| 275 | #endif // !NDEBUG |
||
| 276 | }; |
||
| 277 | } // namespace mca |
||
| 278 | } // namespace llvm |
||
| 279 | |||
| 280 | #endif // LLVM_MCA_HARDWAREUNITS_SCHEDULER_H |