//===- LoopGeneratorsGOMP.h - IR helper to create loops ---------*- C++ -*-===//
 
//
 
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 
// See https://llvm.org/LICENSE.txt for license information.
 
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 
//
 
//===----------------------------------------------------------------------===//
 
//
 
// This file contains functions to create scalar and OpenMP parallel loops
 
// as LLVM-IR.
 
//
 
//===----------------------------------------------------------------------===//
 
#ifndef POLLY_LOOP_GENERATORS_GOMP_H
 
#define POLLY_LOOP_GENERATORS_GOMP_H
 
 
 
#include "polly/CodeGen/IRBuilder.h"
 
#include "polly/CodeGen/LoopGenerators.h"
 
#include "polly/Support/ScopHelper.h"
 
#include "llvm/ADT/SetVector.h"
 
 
 
namespace polly {
 
 
 
/// This ParallelLoopGenerator subclass handles the generation of parallelized
 
/// code, utilizing the GNU OpenMP library.
 
class ParallelLoopGeneratorGOMP final : public ParallelLoopGenerator {
 
public:
 
  /// Create a parallel loop generator for the current function.
 
  ParallelLoopGeneratorGOMP(PollyIRBuilder &Builder, LoopInfo &LI,
 
                            DominatorTree &DT, const DataLayout &DL)
 
      : ParallelLoopGenerator(Builder, LI, DT, DL) {}
 
 
 
  // The functions below may be used if one does not want to generate a
 
  // specific OpenMP parallel loop, but generate individual parts of it
 
  // (e.g. the subfunction definition).
 
 
 
  /// Create a runtime library call to spawn the worker threads.
 
  ///
 
  /// @param SubFn      The subfunction which holds the loop body.
 
  /// @param SubFnParam The parameter for the subfunction (basically the struct
 
  ///                   filled with the outside values).
 
  /// @param LB         The lower bound for the loop we parallelize.
 
  /// @param UB         The upper bound for the loop we parallelize.
 
  /// @param Stride     The stride of the loop we parallelize.
 
  void createCallSpawnThreads(Value *SubFn, Value *SubFnParam, Value *LB,
 
                              Value *UB, Value *Stride);
 
 
 
  void deployParallelExecution(Function *SubFn, Value *SubFnParam, Value *LB,
 
                               Value *UB, Value *Stride) override;
 
 
 
  Function *prepareSubFnDefinition(Function *F) const override;
 
 
 
  std::tuple<Value *, Function *> createSubFn(Value *Stride, AllocaInst *Struct,
 
                                              SetVector<Value *> UsedValues,
 
                                              ValueMapT &VMap) override;
 
 
 
  /// Create a runtime library call to join the worker threads.
 
  void createCallJoinThreads();
 
 
 
  /// Create a runtime library call to get the next work item.
 
  ///
 
  /// @param LBPtr A pointer value to store the work item begin in.
 
  /// @param UBPtr A pointer value to store the work item end in.
 
  ///
 
  /// @returns A true value if the work item is not empty.
 
  Value *createCallGetWorkItem(Value *LBPtr, Value *UBPtr);
 
 
 
  /// Create a runtime library call to allow cleanup of the thread.
 
  ///
 
  /// @note This function is called right before the thread will exit the
 
  ///       subfunction and only if the runtime system depends on it.
 
  void createCallCleanupThread();
 
};
 
} // end namespace polly
 
#endif