Details | Last modification | View Log | RSS feed
| Rev | Author | Line No. | Line |
|---|---|---|---|
| 14 | pmbaty | 1 | //===-------- LLVM-provided High-Level Optimization levels -*- C++ -*------===// |
| 2 | // |
||
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
||
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
||
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
||
| 6 | // |
||
| 7 | //===----------------------------------------------------------------------===// |
||
| 8 | /// \file |
||
| 9 | /// |
||
| 10 | /// This header enumerates the LLVM-provided high-level optimization levels. |
||
| 11 | /// Each level has a specific goal and rationale. |
||
| 12 | /// |
||
| 13 | //===----------------------------------------------------------------------===// |
||
| 14 | |||
| 15 | #ifndef LLVM_PASSES_OPTIMIZATIONLEVEL_H |
||
| 16 | #define LLVM_PASSES_OPTIMIZATIONLEVEL_H |
||
| 17 | |||
| 18 | #include <assert.h> |
||
| 19 | |||
| 20 | namespace llvm { |
||
| 21 | |||
| 22 | class OptimizationLevel final { |
||
| 23 | unsigned SpeedLevel = 2; |
||
| 24 | unsigned SizeLevel = 0; |
||
| 25 | OptimizationLevel(unsigned SpeedLevel, unsigned SizeLevel) |
||
| 26 | : SpeedLevel(SpeedLevel), SizeLevel(SizeLevel) { |
||
| 27 | // Check that only valid combinations are passed. |
||
| 28 | assert(SpeedLevel <= 3 && |
||
| 29 | "Optimization level for speed should be 0, 1, 2, or 3"); |
||
| 30 | assert(SizeLevel <= 2 && |
||
| 31 | "Optimization level for size should be 0, 1, or 2"); |
||
| 32 | assert((SizeLevel == 0 || SpeedLevel == 2) && |
||
| 33 | "Optimize for size should be encoded with speedup level == 2"); |
||
| 34 | } |
||
| 35 | |||
| 36 | public: |
||
| 37 | OptimizationLevel() = default; |
||
| 38 | /// Disable as many optimizations as possible. This doesn't completely |
||
| 39 | /// disable the optimizer in all cases, for example always_inline functions |
||
| 40 | /// can be required to be inlined for correctness. |
||
| 41 | static const OptimizationLevel O0; |
||
| 42 | |||
| 43 | /// Optimize quickly without destroying debuggability. |
||
| 44 | /// |
||
| 45 | /// This level is tuned to produce a result from the optimizer as quickly |
||
| 46 | /// as possible and to avoid destroying debuggability. This tends to result |
||
| 47 | /// in a very good development mode where the compiled code will be |
||
| 48 | /// immediately executed as part of testing. As a consequence, where |
||
| 49 | /// possible, we would like to produce efficient-to-execute code, but not |
||
| 50 | /// if it significantly slows down compilation or would prevent even basic |
||
| 51 | /// debugging of the resulting binary. |
||
| 52 | /// |
||
| 53 | /// As an example, complex loop transformations such as versioning, |
||
| 54 | /// vectorization, or fusion don't make sense here due to the degree to |
||
| 55 | /// which the executed code differs from the source code, and the compile |
||
| 56 | /// time cost. |
||
| 57 | static const OptimizationLevel O1; |
||
| 58 | /// Optimize for fast execution as much as possible without triggering |
||
| 59 | /// significant incremental compile time or code size growth. |
||
| 60 | /// |
||
| 61 | /// The key idea is that optimizations at this level should "pay for |
||
| 62 | /// themselves". So if an optimization increases compile time by 5% or |
||
| 63 | /// increases code size by 5% for a particular benchmark, that benchmark |
||
| 64 | /// should also be one which sees a 5% runtime improvement. If the compile |
||
| 65 | /// time or code size penalties happen on average across a diverse range of |
||
| 66 | /// LLVM users' benchmarks, then the improvements should as well. |
||
| 67 | /// |
||
| 68 | /// And no matter what, the compile time needs to not grow superlinearly |
||
| 69 | /// with the size of input to LLVM so that users can control the runtime of |
||
| 70 | /// the optimizer in this mode. |
||
| 71 | /// |
||
| 72 | /// This is expected to be a good default optimization level for the vast |
||
| 73 | /// majority of users. |
||
| 74 | static const OptimizationLevel O2; |
||
| 75 | /// Optimize for fast execution as much as possible. |
||
| 76 | /// |
||
| 77 | /// This mode is significantly more aggressive in trading off compile time |
||
| 78 | /// and code size to get execution time improvements. The core idea is that |
||
| 79 | /// this mode should include any optimization that helps execution time on |
||
| 80 | /// balance across a diverse collection of benchmarks, even if it increases |
||
| 81 | /// code size or compile time for some benchmarks without corresponding |
||
| 82 | /// improvements to execution time. |
||
| 83 | /// |
||
| 84 | /// Despite being willing to trade more compile time off to get improved |
||
| 85 | /// execution time, this mode still tries to avoid superlinear growth in |
||
| 86 | /// order to make even significantly slower compile times at least scale |
||
| 87 | /// reasonably. This does not preclude very substantial constant factor |
||
| 88 | /// costs though. |
||
| 89 | static const OptimizationLevel O3; |
||
| 90 | /// Similar to \c O2 but tries to optimize for small code size instead of |
||
| 91 | /// fast execution without triggering significant incremental execution |
||
| 92 | /// time slowdowns. |
||
| 93 | /// |
||
| 94 | /// The logic here is exactly the same as \c O2, but with code size and |
||
| 95 | /// execution time metrics swapped. |
||
| 96 | /// |
||
| 97 | /// A consequence of the different core goal is that this should in general |
||
| 98 | /// produce substantially smaller executables that still run in |
||
| 99 | /// a reasonable amount of time. |
||
| 100 | static const OptimizationLevel Os; |
||
| 101 | /// A very specialized mode that will optimize for code size at any and all |
||
| 102 | /// costs. |
||
| 103 | /// |
||
| 104 | /// This is useful primarily when there are absolute size limitations and |
||
| 105 | /// any effort taken to reduce the size is worth it regardless of the |
||
| 106 | /// execution time impact. You should expect this level to produce rather |
||
| 107 | /// slow, but very small, code. |
||
| 108 | static const OptimizationLevel Oz; |
||
| 109 | |||
| 110 | bool isOptimizingForSpeed() const { return SizeLevel == 0 && SpeedLevel > 0; } |
||
| 111 | |||
| 112 | bool isOptimizingForSize() const { return SizeLevel > 0; } |
||
| 113 | |||
| 114 | bool operator==(const OptimizationLevel &Other) const { |
||
| 115 | return SizeLevel == Other.SizeLevel && SpeedLevel == Other.SpeedLevel; |
||
| 116 | } |
||
| 117 | bool operator!=(const OptimizationLevel &Other) const { |
||
| 118 | return SizeLevel != Other.SizeLevel || SpeedLevel != Other.SpeedLevel; |
||
| 119 | } |
||
| 120 | |||
| 121 | unsigned getSpeedupLevel() const { return SpeedLevel; } |
||
| 122 | |||
| 123 | unsigned getSizeLevel() const { return SizeLevel; } |
||
| 124 | }; |
||
| 125 | } // namespace llvm |
||
| 126 | |||
| 127 | #endif |