Details | Last modification | View Log | RSS feed
| Rev | Author | Line No. | Line | 
|---|---|---|---|
| 14 | pmbaty | 1 | //===- MsgPackReader.h - Simple MsgPack reader ------------------*- C++ -*-===// | 
| 2 | // | ||
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | ||
| 4 | // See https://llvm.org/LICENSE.txt for license information. | ||
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | ||
| 6 | // | ||
| 7 | //===----------------------------------------------------------------------===// | ||
| 8 | /// | ||
| 9 | ///  \file | ||
| 10 | ///  This is a MessagePack reader. | ||
| 11 | /// | ||
| 12 | ///  See https://github.com/msgpack/msgpack/blob/master/spec.md for the full | ||
| 13 | ///  standard. | ||
| 14 | /// | ||
| 15 | ///  Typical usage: | ||
| 16 | ///  \code | ||
| 17 | ///  StringRef input = GetInput(); | ||
| 18 | ///  msgpack::Reader MPReader(input); | ||
| 19 | ///  msgpack::Object Obj; | ||
| 20 | /// | ||
| 21 | ///  while (MPReader.read(Obj)) { | ||
| 22 | ///    switch (Obj.Kind) { | ||
| 23 | ///    case msgpack::Type::Int: | ||
| 24 | ///      // Use Obj.Int | ||
| 25 | ///      break; | ||
| 26 | ///    // ... | ||
| 27 | ///    } | ||
| 28 | ///  } | ||
| 29 | ///  \endcode | ||
| 30 | /// | ||
| 31 | //===----------------------------------------------------------------------===// | ||
| 32 | |||
| 33 | #ifndef LLVM_BINARYFORMAT_MSGPACKREADER_H | ||
| 34 | #define LLVM_BINARYFORMAT_MSGPACKREADER_H | ||
| 35 | |||
| 36 | #include "llvm/Support/Error.h" | ||
| 37 | #include "llvm/Support/MemoryBufferRef.h" | ||
| 38 | #include <cstdint> | ||
| 39 | |||
| 40 | namespace llvm { | ||
| 41 | namespace msgpack { | ||
| 42 | |||
| 43 | /// MessagePack types as defined in the standard, with the exception of Integer | ||
| 44 | /// being divided into a signed Int and unsigned UInt variant in order to map | ||
| 45 | /// directly to C++ types. | ||
| 46 | /// | ||
| 47 | /// Each type maps onto the corresponding union member of the \c Object struct. | ||
| 48 | enum class Type : uint8_t { | ||
| 49 | Int, | ||
| 50 | UInt, | ||
| 51 | Nil, | ||
| 52 | Boolean, | ||
| 53 | Float, | ||
| 54 | String, | ||
| 55 | Binary, | ||
| 56 | Array, | ||
| 57 | Map, | ||
| 58 | Extension, | ||
| 59 |   Empty, // Used by MsgPackDocument to represent an empty node | ||
| 60 | }; | ||
| 61 | |||
| 62 | /// Extension types are composed of a user-defined type ID and an uninterpreted | ||
| 63 | /// sequence of bytes. | ||
| 64 | struct ExtensionType { | ||
| 65 |   /// User-defined extension type ID. | ||
| 66 | int8_t Type; | ||
| 67 |   /// Raw, uninterpreted bytes of the extension object. | ||
| 68 |   StringRef Bytes; | ||
| 69 | }; | ||
| 70 | |||
| 71 | /// MessagePack object, represented as a tagged union of C++ types. | ||
| 72 | /// | ||
| 73 | /// All types except \c Type::Nil (which has only one value, and so is | ||
| 74 | /// completely represented by the \c Kind itself) map to exactly one union | ||
| 75 | /// member. | ||
| 76 | struct Object { | ||
| 77 |   Type Kind; | ||
| 78 | union { | ||
| 79 |     /// Value for \c Type::Int. | ||
| 80 | int64_t Int; | ||
| 81 |     /// Value for \c Type::UInt. | ||
| 82 | uint64_t UInt; | ||
| 83 |     /// Value for \c Type::Boolean. | ||
| 84 | bool Bool; | ||
| 85 |     /// Value for \c Type::Float. | ||
| 86 | double Float; | ||
| 87 |     /// Value for \c Type::String and \c Type::Binary. | ||
| 88 |     StringRef Raw; | ||
| 89 |     /// Value for \c Type::Array and \c Type::Map. | ||
| 90 | size_t Length; | ||
| 91 |     /// Value for \c Type::Extension. | ||
| 92 |     ExtensionType Extension; | ||
| 93 | }; | ||
| 94 | |||
| 95 | Object() : Kind(Type::Int), Int(0) {} | ||
| 96 | }; | ||
| 97 | |||
| 98 | /// Reads MessagePack objects from memory, one at a time. | ||
| 99 | class Reader { | ||
| 100 | public: | ||
| 101 |   /// Construct a reader, keeping a reference to the \p InputBuffer. | ||
| 102 | Reader(MemoryBufferRef InputBuffer); | ||
| 103 |   /// Construct a reader, keeping a reference to the \p Input. | ||
| 104 | Reader(StringRef Input); | ||
| 105 | |||
| 106 | Reader(const Reader &) = delete; | ||
| 107 | Reader &operator=(const Reader &) = delete; | ||
| 108 | |||
| 109 |   /// Read one object from the input buffer, advancing past it. | ||
| 110 |   /// | ||
| 111 |   /// The \p Obj is updated with the kind of the object read, and the | ||
| 112 |   /// corresponding union member is updated. | ||
| 113 |   /// | ||
| 114 |   /// For the collection objects (Array and Map), only the length is read, and | ||
| 115 |   /// the caller must make an additional \c N calls (in the case of Array) or | ||
| 116 |   /// \c N*2 calls (in the case of Map) to \c read to retrieve the collection | ||
| 117 |   /// elements. | ||
| 118 |   /// | ||
| 119 |   /// \param [out] Obj filled with next object on success. | ||
| 120 |   /// | ||
| 121 |   /// \returns true when object successfully read, false when at end of | ||
| 122 |   /// input (and so \p Obj was not updated), otherwise an error. | ||
| 123 | Expected<bool> read(Object &Obj); | ||
| 124 | |||
| 125 | private: | ||
| 126 |   MemoryBufferRef InputBuffer; | ||
| 127 | StringRef::iterator Current; | ||
| 128 | StringRef::iterator End; | ||
| 129 | |||
| 130 | size_t remainingSpace() const { | ||
| 131 |     // Distance from Current to End. The rest of the code maintains the | ||
| 132 |     // invariant that End >= Current, so this cast is always defined behavior. | ||
| 133 | return static_cast<size_t>(End - Current); | ||
| 134 |   } | ||
| 135 | |||
| 136 | template <class T> Expected<bool> readRaw(Object &Obj); | ||
| 137 | template <class T> Expected<bool> readInt(Object &Obj); | ||
| 138 | template <class T> Expected<bool> readUInt(Object &Obj); | ||
| 139 | template <class T> Expected<bool> readLength(Object &Obj); | ||
| 140 | template <class T> Expected<bool> readExt(Object &Obj); | ||
| 141 | Expected<bool> createRaw(Object &Obj, uint32_t Size); | ||
| 142 | Expected<bool> createExt(Object &Obj, uint32_t Size); | ||
| 143 | }; | ||
| 144 | |||
| 145 | } // end namespace msgpack | ||
| 146 | } // end namespace llvm | ||
| 147 | |||
| 148 | #endif // LLVM_BINARYFORMAT_MSGPACKREADER_H |