Details | Last modification | View Log | RSS feed
| Rev | Author | Line No. | Line |
|---|---|---|---|
| 14 | pmbaty | 1 | //===- MemoryLocation.h - Memory location descriptions ----------*- C++ -*-===// |
| 2 | // |
||
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
||
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
||
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
||
| 6 | // |
||
| 7 | //===----------------------------------------------------------------------===// |
||
| 8 | /// \file |
||
| 9 | /// This file provides utility analysis objects describing memory locations. |
||
| 10 | /// These are used both by the Alias Analysis infrastructure and more |
||
| 11 | /// specialized memory analysis layers. |
||
| 12 | /// |
||
| 13 | //===----------------------------------------------------------------------===// |
||
| 14 | |||
| 15 | #ifndef LLVM_ANALYSIS_MEMORYLOCATION_H |
||
| 16 | #define LLVM_ANALYSIS_MEMORYLOCATION_H |
||
| 17 | |||
| 18 | #include "llvm/ADT/DenseMapInfo.h" |
||
| 19 | #include "llvm/IR/Metadata.h" |
||
| 20 | #include "llvm/Support/TypeSize.h" |
||
| 21 | |||
| 22 | #include <optional> |
||
| 23 | |||
| 24 | namespace llvm { |
||
| 25 | |||
// Forward declarations. Every type listed here is only named in a declaration
// in this header, so naming the class is enough for those uses.
//
// raw_ostream is included in the list because the print() declarations and the
// stream-insertion operator further down name it; declaring it here keeps the
// name from depending on a transitive include. (Inline bodies that actually
// stream through it still need the full definition from an included header.)
class AnyMemIntrinsic;
class AnyMemTransferInst;
class AtomicCmpXchgInst;
class AtomicMemIntrinsic;
class AtomicMemTransferInst;
class AtomicRMWInst;
class CallBase;
class Instruction;
class LoadInst;
class MemIntrinsic;
class MemTransferInst;
class StoreInst;
class TargetLibraryInfo;
class VAArgInst;
class Value;
class raw_ostream;
||
| 41 | |||
| 42 | // Represents the size of a MemoryLocation. Logically, it's an |
||
| 43 | // std::optional<uint63_t> that also carries a bit to represent whether the |
||
| 44 | // integer it contains, N, is 'precise'. Precise, in this context, means that we |
||
| 45 | // know that the area of storage referenced by the given MemoryLocation must be |
||
| 46 | // precisely N bytes. An imprecise value is formed as the union of two or more |
||
| 47 | // precise values, and can conservatively represent all of the values unioned |
||
| 48 | // into it. Importantly, imprecise values are an *upper-bound* on the size of a |
||
| 49 | // MemoryLocation. |
||
| 50 | // |
||
| 51 | // Concretely, a precise MemoryLocation is (%p, 4) in |
||
| 52 | // store i32 0, i32* %p |
||
| 53 | // |
||
| 54 | // Since we know that %p must be at least 4 bytes large at this point. |
||
| 55 | // Otherwise, we have UB. An example of an imprecise MemoryLocation is (%p, 4) |
||
| 56 | // at the memcpy in |
||
| 57 | // |
||
| 58 | // %n = select i1 %foo, i64 1, i64 4 |
||
| 59 | // call void @llvm.memcpy.p0i8.p0i8.i64(i8* %p, i8* %baz, i64 %n, i32 1, |
||
| 60 | // i1 false) |
||
| 61 | // |
||
| 62 | // ...Since we'll copy *up to* 4 bytes into %p, but we can't guarantee that |
||
| 63 | // we'll ever actually do so. |
||
| 64 | // |
||
| 65 | // If asked to represent a pathologically large value, this will degrade to |
||
| 66 | // std::nullopt. |
||
| 67 | class LocationSize { |
||
| 68 | enum : uint64_t { |
||
| 69 | BeforeOrAfterPointer = ~uint64_t(0), |
||
| 70 | AfterPointer = BeforeOrAfterPointer - 1, |
||
| 71 | MapEmpty = BeforeOrAfterPointer - 2, |
||
| 72 | MapTombstone = BeforeOrAfterPointer - 3, |
||
| 73 | ImpreciseBit = uint64_t(1) << 63, |
||
| 74 | |||
| 75 | // The maximum value we can represent without falling back to 'unknown'. |
||
| 76 | MaxValue = (MapTombstone - 1) & ~ImpreciseBit, |
||
| 77 | }; |
||
| 78 | |||
| 79 | uint64_t Value; |
||
| 80 | |||
| 81 | // Hack to support implicit construction. This should disappear when the |
||
| 82 | // public LocationSize ctor goes away. |
||
| 83 | enum DirectConstruction { Direct }; |
||
| 84 | |||
| 85 | constexpr LocationSize(uint64_t Raw, DirectConstruction): Value(Raw) {} |
||
| 86 | |||
| 87 | static_assert(AfterPointer & ImpreciseBit, |
||
| 88 | "AfterPointer is imprecise by definition."); |
||
| 89 | static_assert(BeforeOrAfterPointer & ImpreciseBit, |
||
| 90 | "BeforeOrAfterPointer is imprecise by definition."); |
||
| 91 | |||
| 92 | public: |
||
| 93 | // FIXME: Migrate all users to construct via either `precise` or `upperBound`, |
||
| 94 | // to make it more obvious at the callsite the kind of size that they're |
||
| 95 | // providing. |
||
| 96 | // |
||
| 97 | // Since the overwhelming majority of users of this provide precise values, |
||
| 98 | // this assumes the provided value is precise. |
||
| 99 | constexpr LocationSize(uint64_t Raw) |
||
| 100 | : Value(Raw > MaxValue ? AfterPointer : Raw) {} |
||
| 101 | |||
| 102 | static LocationSize precise(uint64_t Value) { return LocationSize(Value); } |
||
| 103 | static LocationSize precise(TypeSize Value) { |
||
| 104 | if (Value.isScalable()) |
||
| 105 | return afterPointer(); |
||
| 106 | return precise(Value.getFixedValue()); |
||
| 107 | } |
||
| 108 | |||
| 109 | static LocationSize upperBound(uint64_t Value) { |
||
| 110 | // You can't go lower than 0, so give a precise result. |
||
| 111 | if (LLVM_UNLIKELY(Value == 0)) |
||
| 112 | return precise(0); |
||
| 113 | if (LLVM_UNLIKELY(Value > MaxValue)) |
||
| 114 | return afterPointer(); |
||
| 115 | return LocationSize(Value | ImpreciseBit, Direct); |
||
| 116 | } |
||
| 117 | static LocationSize upperBound(TypeSize Value) { |
||
| 118 | if (Value.isScalable()) |
||
| 119 | return afterPointer(); |
||
| 120 | return upperBound(Value.getFixedValue()); |
||
| 121 | } |
||
| 122 | |||
| 123 | /// Any location after the base pointer (but still within the underlying |
||
| 124 | /// object). |
||
| 125 | constexpr static LocationSize afterPointer() { |
||
| 126 | return LocationSize(AfterPointer, Direct); |
||
| 127 | } |
||
| 128 | |||
| 129 | /// Any location before or after the base pointer (but still within the |
||
| 130 | /// underlying object). |
||
| 131 | constexpr static LocationSize beforeOrAfterPointer() { |
||
| 132 | return LocationSize(BeforeOrAfterPointer, Direct); |
||
| 133 | } |
||
| 134 | |||
| 135 | // Sentinel values, generally used for maps. |
||
| 136 | constexpr static LocationSize mapTombstone() { |
||
| 137 | return LocationSize(MapTombstone, Direct); |
||
| 138 | } |
||
| 139 | constexpr static LocationSize mapEmpty() { |
||
| 140 | return LocationSize(MapEmpty, Direct); |
||
| 141 | } |
||
| 142 | |||
| 143 | // Returns a LocationSize that can correctly represent either `*this` or |
||
| 144 | // `Other`. |
||
| 145 | LocationSize unionWith(LocationSize Other) const { |
||
| 146 | if (Other == *this) |
||
| 147 | return *this; |
||
| 148 | |||
| 149 | if (Value == BeforeOrAfterPointer || Other.Value == BeforeOrAfterPointer) |
||
| 150 | return beforeOrAfterPointer(); |
||
| 151 | if (Value == AfterPointer || Other.Value == AfterPointer) |
||
| 152 | return afterPointer(); |
||
| 153 | |||
| 154 | return upperBound(std::max(getValue(), Other.getValue())); |
||
| 155 | } |
||
| 156 | |||
| 157 | bool hasValue() const { |
||
| 158 | return Value != AfterPointer && Value != BeforeOrAfterPointer; |
||
| 159 | } |
||
| 160 | uint64_t getValue() const { |
||
| 161 | assert(hasValue() && "Getting value from an unknown LocationSize!"); |
||
| 162 | return Value & ~ImpreciseBit; |
||
| 163 | } |
||
| 164 | |||
| 165 | // Returns whether or not this value is precise. Note that if a value is |
||
| 166 | // precise, it's guaranteed to not be unknown. |
||
| 167 | bool isPrecise() const { |
||
| 168 | return (Value & ImpreciseBit) == 0; |
||
| 169 | } |
||
| 170 | |||
| 171 | // Convenience method to check if this LocationSize's value is 0. |
||
| 172 | bool isZero() const { return hasValue() && getValue() == 0; } |
||
| 173 | |||
| 174 | /// Whether accesses before the base pointer are possible. |
||
| 175 | bool mayBeBeforePointer() const { return Value == BeforeOrAfterPointer; } |
||
| 176 | |||
| 177 | bool operator==(const LocationSize &Other) const { |
||
| 178 | return Value == Other.Value; |
||
| 179 | } |
||
| 180 | |||
| 181 | bool operator!=(const LocationSize &Other) const { |
||
| 182 | return !(*this == Other); |
||
| 183 | } |
||
| 184 | |||
| 185 | // Ordering operators are not provided, since it's unclear if there's only one |
||
| 186 | // reasonable way to compare: |
||
| 187 | // - values that don't exist against values that do, and |
||
| 188 | // - precise values to imprecise values |
||
| 189 | |||
| 190 | void print(raw_ostream &OS) const; |
||
| 191 | |||
| 192 | // Returns an opaque value that represents this LocationSize. Cannot be |
||
| 193 | // reliably converted back into a LocationSize. |
||
| 194 | uint64_t toRaw() const { return Value; } |
||
| 195 | }; |
||
| 196 | |||
| 197 | inline raw_ostream &operator<<(raw_ostream &OS, LocationSize Size) { |
||
| 198 | Size.print(OS); |
||
| 199 | return OS; |
||
| 200 | } |
||
| 201 | |||
| 202 | /// Representation for a specific memory location. |
||
| 203 | /// |
||
| 204 | /// This abstraction can be used to represent a specific location in memory. |
||
| 205 | /// The goal of the location is to represent enough information to describe |
||
| 206 | /// abstract aliasing, modification, and reference behaviors of whatever |
||
| 207 | /// value(s) are stored in memory at the particular location. |
||
| 208 | /// |
||
| 209 | /// The primary user of this interface is LLVM's Alias Analysis, but other |
||
| 210 | /// memory analyses such as MemoryDependence can use it as well. |
||
| 211 | class MemoryLocation { |
||
| 212 | public: |
||
| 213 | /// UnknownSize - This is a special value which can be used with the |
||
| 214 | /// size arguments in alias queries to indicate that the caller does not |
||
| 215 | /// know the sizes of the potential memory references. |
||
| 216 | enum : uint64_t { UnknownSize = ~UINT64_C(0) }; |
||
| 217 | |||
| 218 | /// The address of the start of the location. |
||
| 219 | const Value *Ptr; |
||
| 220 | |||
| 221 | /// The maximum size of the location, in address-units, or |
||
| 222 | /// UnknownSize if the size is not known. |
||
| 223 | /// |
||
| 224 | /// Note that an unknown size does not mean the pointer aliases the entire |
||
| 225 | /// virtual address space, because there are restrictions on stepping out of |
||
| 226 | /// one object and into another. See |
||
| 227 | /// http://llvm.org/docs/LangRef.html#pointeraliasing |
||
| 228 | LocationSize Size; |
||
| 229 | |||
| 230 | /// The metadata nodes which describes the aliasing of the location (each |
||
| 231 | /// member is null if that kind of information is unavailable). |
||
| 232 | AAMDNodes AATags; |
||
| 233 | |||
| 234 | void print(raw_ostream &OS) const { OS << *Ptr << " " << Size << "\n"; } |
||
| 235 | |||
| 236 | /// Return a location with information about the memory reference by the given |
||
| 237 | /// instruction. |
||
| 238 | static MemoryLocation get(const LoadInst *LI); |
||
| 239 | static MemoryLocation get(const StoreInst *SI); |
||
| 240 | static MemoryLocation get(const VAArgInst *VI); |
||
| 241 | static MemoryLocation get(const AtomicCmpXchgInst *CXI); |
||
| 242 | static MemoryLocation get(const AtomicRMWInst *RMWI); |
||
| 243 | static MemoryLocation get(const Instruction *Inst) { |
||
| 244 | return *MemoryLocation::getOrNone(Inst); |
||
| 245 | } |
||
| 246 | static std::optional<MemoryLocation> getOrNone(const Instruction *Inst); |
||
| 247 | |||
| 248 | /// Return a location representing the source of a memory transfer. |
||
| 249 | static MemoryLocation getForSource(const MemTransferInst *MTI); |
||
| 250 | static MemoryLocation getForSource(const AtomicMemTransferInst *MTI); |
||
| 251 | static MemoryLocation getForSource(const AnyMemTransferInst *MTI); |
||
| 252 | |||
| 253 | /// Return a location representing the destination of a memory set or |
||
| 254 | /// transfer. |
||
| 255 | static MemoryLocation getForDest(const MemIntrinsic *MI); |
||
| 256 | static MemoryLocation getForDest(const AtomicMemIntrinsic *MI); |
||
| 257 | static MemoryLocation getForDest(const AnyMemIntrinsic *MI); |
||
| 258 | static std::optional<MemoryLocation> getForDest(const CallBase *CI, |
||
| 259 | const TargetLibraryInfo &TLI); |
||
| 260 | |||
| 261 | /// Return a location representing a particular argument of a call. |
||
| 262 | static MemoryLocation getForArgument(const CallBase *Call, unsigned ArgIdx, |
||
| 263 | const TargetLibraryInfo *TLI); |
||
| 264 | static MemoryLocation getForArgument(const CallBase *Call, unsigned ArgIdx, |
||
| 265 | const TargetLibraryInfo &TLI) { |
||
| 266 | return getForArgument(Call, ArgIdx, &TLI); |
||
| 267 | } |
||
| 268 | |||
| 269 | /// Return a location that may access any location after Ptr, while remaining |
||
| 270 | /// within the underlying object. |
||
| 271 | static MemoryLocation getAfter(const Value *Ptr, |
||
| 272 | const AAMDNodes &AATags = AAMDNodes()) { |
||
| 273 | return MemoryLocation(Ptr, LocationSize::afterPointer(), AATags); |
||
| 274 | } |
||
| 275 | |||
| 276 | /// Return a location that may access any location before or after Ptr, while |
||
| 277 | /// remaining within the underlying object. |
||
| 278 | static MemoryLocation |
||
| 279 | getBeforeOrAfter(const Value *Ptr, const AAMDNodes &AATags = AAMDNodes()) { |
||
| 280 | return MemoryLocation(Ptr, LocationSize::beforeOrAfterPointer(), AATags); |
||
| 281 | } |
||
| 282 | |||
| 283 | // Return the exact size if the exact size is known at compiletime, |
||
| 284 | // otherwise return MemoryLocation::UnknownSize. |
||
| 285 | static uint64_t getSizeOrUnknown(const TypeSize &T) { |
||
| 286 | return T.isScalable() ? UnknownSize : T.getFixedValue(); |
||
| 287 | } |
||
| 288 | |||
| 289 | MemoryLocation() : Ptr(nullptr), Size(LocationSize::beforeOrAfterPointer()) {} |
||
| 290 | |||
| 291 | explicit MemoryLocation(const Value *Ptr, LocationSize Size, |
||
| 292 | const AAMDNodes &AATags = AAMDNodes()) |
||
| 293 | : Ptr(Ptr), Size(Size), AATags(AATags) {} |
||
| 294 | |||
| 295 | MemoryLocation getWithNewPtr(const Value *NewPtr) const { |
||
| 296 | MemoryLocation Copy(*this); |
||
| 297 | Copy.Ptr = NewPtr; |
||
| 298 | return Copy; |
||
| 299 | } |
||
| 300 | |||
| 301 | MemoryLocation getWithNewSize(LocationSize NewSize) const { |
||
| 302 | MemoryLocation Copy(*this); |
||
| 303 | Copy.Size = NewSize; |
||
| 304 | return Copy; |
||
| 305 | } |
||
| 306 | |||
| 307 | MemoryLocation getWithoutAATags() const { |
||
| 308 | MemoryLocation Copy(*this); |
||
| 309 | Copy.AATags = AAMDNodes(); |
||
| 310 | return Copy; |
||
| 311 | } |
||
| 312 | |||
| 313 | bool operator==(const MemoryLocation &Other) const { |
||
| 314 | return Ptr == Other.Ptr && Size == Other.Size && AATags == Other.AATags; |
||
| 315 | } |
||
| 316 | }; |
||
| 317 | |||
| 318 | // Specialize DenseMapInfo. |
||
| 319 | template <> struct DenseMapInfo<LocationSize> { |
||
| 320 | static inline LocationSize getEmptyKey() { |
||
| 321 | return LocationSize::mapEmpty(); |
||
| 322 | } |
||
| 323 | static inline LocationSize getTombstoneKey() { |
||
| 324 | return LocationSize::mapTombstone(); |
||
| 325 | } |
||
| 326 | static unsigned getHashValue(const LocationSize &Val) { |
||
| 327 | return DenseMapInfo<uint64_t>::getHashValue(Val.toRaw()); |
||
| 328 | } |
||
| 329 | static bool isEqual(const LocationSize &LHS, const LocationSize &RHS) { |
||
| 330 | return LHS == RHS; |
||
| 331 | } |
||
| 332 | }; |
||
| 333 | |||
| 334 | template <> struct DenseMapInfo<MemoryLocation> { |
||
| 335 | static inline MemoryLocation getEmptyKey() { |
||
| 336 | return MemoryLocation(DenseMapInfo<const Value *>::getEmptyKey(), |
||
| 337 | DenseMapInfo<LocationSize>::getEmptyKey()); |
||
| 338 | } |
||
| 339 | static inline MemoryLocation getTombstoneKey() { |
||
| 340 | return MemoryLocation(DenseMapInfo<const Value *>::getTombstoneKey(), |
||
| 341 | DenseMapInfo<LocationSize>::getTombstoneKey()); |
||
| 342 | } |
||
| 343 | static unsigned getHashValue(const MemoryLocation &Val) { |
||
| 344 | return DenseMapInfo<const Value *>::getHashValue(Val.Ptr) ^ |
||
| 345 | DenseMapInfo<LocationSize>::getHashValue(Val.Size) ^ |
||
| 346 | DenseMapInfo<AAMDNodes>::getHashValue(Val.AATags); |
||
| 347 | } |
||
| 348 | static bool isEqual(const MemoryLocation &LHS, const MemoryLocation &RHS) { |
||
| 349 | return LHS == RHS; |
||
| 350 | } |
||
| 351 | }; |
||
| 352 | } |
||
| 353 | |||
| 354 | #endif |