Details | Last modification | View Log | RSS feed
Rev | Author | Line No. | Line |
---|---|---|---|
14 | pmbaty | 1 | //===- MsgPackReader.h - Simple MsgPack reader ------------------*- C++ -*-===// |
2 | // |
||
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
||
4 | // See https://llvm.org/LICENSE.txt for license information. |
||
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
||
6 | // |
||
7 | //===----------------------------------------------------------------------===// |
||
8 | /// |
||
9 | /// \file |
||
10 | /// This is a MessagePack reader. |
||
11 | /// |
||
12 | /// See https://github.com/msgpack/msgpack/blob/master/spec.md for the full |
||
13 | /// standard. |
||
14 | /// |
||
15 | /// Typical usage: |
||
16 | /// \code |
||
17 | /// StringRef input = GetInput(); |
||
18 | /// msgpack::Reader MPReader(input); |
||
19 | /// msgpack::Object Obj; |
||
20 | /// |
||
21 | /// while (MPReader.read(Obj)) { |
||
22 | /// switch (Obj.Kind) { |
||
23 | /// case msgpack::Type::Int: |
||
24 | /// // Use Obj.Int |
||
25 | /// break; |
||
26 | /// // ... |
||
27 | /// } |
||
28 | /// } |
||
29 | /// \endcode |
||
30 | /// |
||
31 | //===----------------------------------------------------------------------===// |
||
32 | |||
33 | #ifndef LLVM_BINARYFORMAT_MSGPACKREADER_H |
||
34 | #define LLVM_BINARYFORMAT_MSGPACKREADER_H |
||
35 | |||
36 | #include "llvm/Support/Error.h" |
||
37 | #include "llvm/Support/MemoryBufferRef.h" |
||
38 | #include <cstdint> |
||
39 | |||
40 | namespace llvm { |
||
41 | namespace msgpack { |
||
42 | |||
43 | /// MessagePack types as defined in the standard, with the exception of Integer |
||
44 | /// being divided into a signed Int and unsigned UInt variant in order to map |
||
45 | /// directly to C++ types. |
||
46 | /// |
||
47 | /// Each type other than \c Nil and \c Empty maps onto a union member of \c Object. |
||
48 | enum class Type : uint8_t { |
||
49 | Int, |
||
50 | UInt, |
||
51 | Nil, |
||
52 | Boolean, |
||
53 | Float, |
||
54 | String, |
||
55 | Binary, |
||
56 | Array, |
||
57 | Map, |
||
58 | Extension, |
||
59 | Empty, // Used by MsgPackDocument to represent an empty node. |
||
60 | }; |
||
61 | |||
62 | /// Extension types are composed of a user-defined type ID and an uninterpreted |
||
63 | /// sequence of bytes. |
||
64 | struct ExtensionType { |
||
65 | /// User-defined extension type ID. |
||
66 | int8_t Type; |
||
67 | /// Raw, uninterpreted bytes of the extension object. |
||
68 | StringRef Bytes; |
||
69 | }; |
||
70 | |||
71 | /// MessagePack object, represented as a tagged union of C++ types. |
||
72 | /// |
||
73 | /// All types except \c Type::Nil (which has only one value, and so is |
||
74 | /// completely represented by the \c Kind itself) map to exactly one union |
||
75 | /// member. |
||
76 | struct Object { |
||
77 | Type Kind; |
||
78 | union { |
||
79 | /// Value for \c Type::Int. |
||
80 | int64_t Int; |
||
81 | /// Value for \c Type::UInt. |
||
82 | uint64_t UInt; |
||
83 | /// Value for \c Type::Boolean. |
||
84 | bool Bool; |
||
85 | /// Value for \c Type::Float. |
||
86 | double Float; |
||
87 | /// Value for \c Type::String and \c Type::Binary. |
||
88 | StringRef Raw; |
||
89 | /// Value for \c Type::Array and \c Type::Map. |
||
90 | size_t Length; |
||
91 | /// Value for \c Type::Extension. |
||
92 | ExtensionType Extension; |
||
93 | }; |
||
94 | |||
95 | Object() : Kind(Type::Int), Int(0) {} |
||
96 | }; |
||
97 | |||
98 | /// Reads MessagePack objects from memory, one at a time. |
||
99 | class Reader { |
||
100 | public: |
||
101 | /// Construct a reader, keeping a reference to the \p InputBuffer. |
||
102 | Reader(MemoryBufferRef InputBuffer); |
||
103 | /// Construct a reader, keeping a reference to the \p Input. |
||
104 | Reader(StringRef Input); |
||
105 | |||
106 | Reader(const Reader &) = delete; |
||
107 | Reader &operator=(const Reader &) = delete; |
||
108 | |||
109 | /// Read one object from the input buffer, advancing past it. |
||
110 | /// |
||
111 | /// The \p Obj is updated with the kind of the object read, and the |
||
112 | /// corresponding union member is updated. |
||
113 | /// |
||
114 | /// For the collection objects (Array and Map), only the length is read, and |
||
115 | /// the caller must make an additional \c N calls (in the case of Array) or |
||
116 | /// \c N*2 calls (in the case of Map) to \c read to retrieve the collection |
||
117 | /// elements. |
||
118 | /// |
||
119 | /// \param [out] Obj filled with next object on success. |
||
120 | /// |
||
121 | /// \returns true when object successfully read, false when at end of |
||
122 | /// input (and so \p Obj was not updated), otherwise an error. |
||
123 | Expected<bool> read(Object &Obj); |
||
124 | |||
125 | private: |
||
126 | MemoryBufferRef InputBuffer; |
||
127 | StringRef::iterator Current; |
||
128 | StringRef::iterator End; |
||
129 | |||
130 | size_t remainingSpace() { |
||
131 | // The rest of the code maintains the invariant that End >= Current, so |
||
132 | // that this cast is always defined behavior. |
||
133 | return static_cast<size_t>(End - Current); |
||
134 | } |
||
135 | |||
136 | template <class T> Expected<bool> readRaw(Object &Obj); |
||
137 | template <class T> Expected<bool> readInt(Object &Obj); |
||
138 | template <class T> Expected<bool> readUInt(Object &Obj); |
||
139 | template <class T> Expected<bool> readLength(Object &Obj); |
||
140 | template <class T> Expected<bool> readExt(Object &Obj); |
||
141 | Expected<bool> createRaw(Object &Obj, uint32_t Size); |
||
142 | Expected<bool> createExt(Object &Obj, uint32_t Size); |
||
143 | }; |
||
144 | |||
145 | } // end namespace msgpack |
||
146 | } // end namespace llvm |
||
147 | |||
148 | #endif // LLVM_BINARYFORMAT_MSGPACKREADER_H |