Details | Last modification | View Log | RSS feed
| Rev | Author | Line No. | Line | 
|---|---|---|---|
| 14 | pmbaty | 1 | //===- LoopGeneratorsGOMP.h - IR helper to create loops ---------*- C++ -*-===// | 
| 2 | // | ||
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | ||
| 4 | // See https://llvm.org/LICENSE.txt for license information. | ||
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | ||
| 6 | // | ||
| 7 | //===----------------------------------------------------------------------===// | ||
| 8 | // | ||
| 9 | // This file declares the ParallelLoopGenerator subclass that creates OpenMP | ||
| 10 | // parallel loops as LLVM-IR, utilizing the GNU OpenMP library. | ||
| 11 | // | ||
| 12 | //===----------------------------------------------------------------------===// | ||
| 13 | #ifndef POLLY_LOOP_GENERATORS_GOMP_H | ||
| 14 | #define POLLY_LOOP_GENERATORS_GOMP_H | ||
| 15 | |||
| 16 | #include "polly/CodeGen/IRBuilder.h" | ||
| 17 | #include "polly/CodeGen/LoopGenerators.h" | ||
| 18 | #include "polly/Support/ScopHelper.h" | ||
| 19 | #include "llvm/ADT/SetVector.h" | ||
| 20 | |||
| 21 | namespace polly { | ||
| 22 | |||
| 23 | /// This ParallelLoopGenerator subclass handles the generation of parallelized | ||
| 24 | /// code, utilizing the GNU OpenMP library. | ||
| 25 | class ParallelLoopGeneratorGOMP final : public ParallelLoopGenerator { | ||
| 26 | public: | ||
| 27 |   /// Create a parallel loop generator for the current function. | ||
| 28 | ParallelLoopGeneratorGOMP(PollyIRBuilder &Builder, LoopInfo &LI, | ||
| 29 | DominatorTree &DT, const DataLayout &DL) | ||
| 30 | : ParallelLoopGenerator(Builder, LI, DT, DL) {} | ||
| 31 | |||
| 32 |   // The functions below may be used if one does not want to generate a | ||
| 33 |   // specific OpenMP parallel loop, but generate individual parts of it | ||
| 34 |   // (e.g. the subfunction definition). | ||
| 35 | |||
| 36 |   /// Create a runtime library call to spawn the worker threads. | ||
| 37 |   /// | ||
| 38 |   /// @param SubFn      The subfunction which holds the loop body. | ||
| 39 |   /// @param SubFnParam The parameter for the subfunction (basically the struct | ||
| 40 |   ///                   filled with the outside values). | ||
| 41 |   /// @param LB         The lower bound for the loop we parallelize. | ||
| 42 |   /// @param UB         The upper bound for the loop we parallelize. | ||
| 43 |   /// @param Stride     The stride of the loop we parallelize. | ||
| 44 | void createCallSpawnThreads(Value *SubFn, Value *SubFnParam, Value *LB, | ||
| 45 | Value *UB, Value *Stride); | ||
| 46 |   /** Override of the ParallelLoopGenerator hook; its parameters carry the same names as those documented for createCallSpawnThreads(). NOTE(review): presumably emits the spawn/join runtime calls -- confirm in the implementation. */ |||
| 47 | void deployParallelExecution(Function *SubFn, Value *SubFnParam, Value *LB, | ||
| 48 | Value *UB, Value *Stride) override; | ||
| 49 |   /** Override of the ParallelLoopGenerator hook, declared const: takes a Function F and returns a Function pointer. NOTE(review): presumably builds the subfunction definition for F -- confirm in the implementation. */ |||
| 50 | Function *prepareSubFnDefinition(Function *F) const override; | ||
| 51 |   /** Override of the ParallelLoopGenerator hook: returns a (Value *, Function *) tuple. UsedValues is passed by value (a copy per call), as the overridden signature requires. NOTE(review): the meaning of the returned Value is not visible here -- see the base class. */ |||
| 52 | std::tuple<Value *, Function *> createSubFn(Value *Stride, AllocaInst *Struct, | ||
| 53 | SetVector<Value *> UsedValues, | ||
| 54 | ValueMapT &VMap) override; | ||
| 55 | |||
| 56 |   /// Create a runtime library call to join the worker threads. | ||
| 57 | void createCallJoinThreads(); | ||
| 58 | |||
| 59 |   /// Create a runtime library call to get the next work item. | ||
| 60 |   /// | ||
| 61 |   /// @param LBPtr A pointer value to store the work item begin in. | ||
| 62 |   /// @param UBPtr A pointer value to store the work item end in. | ||
| 63 |   /// | ||
| 64 |   /// @returns A true value if the work item is not empty. | ||
| 65 | Value *createCallGetWorkItem(Value *LBPtr, Value *UBPtr); | ||
| 66 | |||
| 67 |   /// Create a runtime library call to allow cleanup of the thread. | ||
| 68 |   /// | ||
| 69 |   /// @note This function is called right before the thread will exit the | ||
| 70 |   ///       subfunction and only if the runtime system depends on it. | ||
| 71 | void createCallCleanupThread(); | ||
| 72 | }; | ||
| 73 | } // end namespace polly | ||
| 74 | #endif |