1 | // Protocol Buffers - Google's data interchange format |
2 | // Copyright 2008 Google Inc. All rights reserved. |
3 | // https://developers.google.com/protocol-buffers/ |
4 | // |
5 | // Redistribution and use in source and binary forms, with or without |
6 | // modification, are permitted provided that the following conditions are |
7 | // met: |
8 | // |
9 | // * Redistributions of source code must retain the above copyright |
10 | // notice, this list of conditions and the following disclaimer. |
11 | // * Redistributions in binary form must reproduce the above |
12 | // copyright notice, this list of conditions and the following disclaimer |
13 | // in the documentation and/or other materials provided with the |
14 | // distribution. |
15 | // * Neither the name of Google Inc. nor the names of its |
16 | // contributors may be used to endorse or promote products derived from |
17 | // this software without specific prior written permission. |
18 | // |
19 | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
20 | // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
21 | // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
22 | // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
23 | // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
24 | // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
25 | // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
26 | // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
27 | // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
28 | // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
29 | // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
30 | |
31 | #ifndef GOOGLE_PROTOBUF_GENERATED_MESSAGE_TABLE_DRIVEN_H__ |
32 | #define GOOGLE_PROTOBUF_GENERATED_MESSAGE_TABLE_DRIVEN_H__ |
33 | |
34 | #include <google/protobuf/map.h> |
35 | #include <google/protobuf/map_entry_lite.h> |
36 | #include <google/protobuf/map_field_lite.h> |
37 | #include <google/protobuf/message_lite.h> |
38 | #include <google/protobuf/wire_format_lite.h> |
39 | |
40 | // We require C++11 and Clang to use constexpr for variables, as GCC 4.8 |
41 | // requires constexpr to be consistent between declarations of variables |
42 | // unnecessarily (see https://gcc.gnu.org/bugzilla/show_bug.cgi?id=58541). |
43 | // VS 2017 Update 3 also supports this usage of constexpr. |
44 | #if defined(__clang__) || (defined(_MSC_VER) && _MSC_VER >= 1911) |
45 | #define PROTOBUF_CONSTEXPR_VAR constexpr |
46 | #else // !__clang__ |
47 | #define PROTOBUF_CONSTEXPR_VAR |
48 | #endif // !_clang |
49 | |
50 | #ifdef SWIG |
51 | #error "You cannot SWIG proto headers" |
52 | #endif |
53 | |
54 | #include <google/protobuf/port_def.inc> |
55 | |
56 | namespace google { |
57 | namespace protobuf { |
58 | namespace internal { |
59 | |
60 | // Processing-type masks. |
61 | static constexpr const unsigned char kOneofMask = 0x40; |
62 | static constexpr const unsigned char kRepeatedMask = 0x20; |
63 | // Mask for the raw type: either a WireFormatLite::FieldType or one of the |
64 | // ProcessingTypes below, without the oneof or repeated flag. |
65 | static constexpr const unsigned char kTypeMask = 0x1f; |
66 | |
67 | // Wire type masks. |
68 | static constexpr const unsigned char kNotPackedMask = 0x10; |
69 | static constexpr const unsigned char kInvalidMask = 0x20; |
70 | |
71 | enum ProcessingTypes { |
72 | TYPE_STRING_CORD = 19, |
73 | TYPE_STRING_STRING_PIECE = 20, |
74 | TYPE_BYTES_CORD = 21, |
75 | TYPE_BYTES_STRING_PIECE = 22, |
76 | TYPE_STRING_INLINED = 23, |
77 | TYPE_BYTES_INLINED = 24, |
78 | TYPE_MAP = 25, |
79 | }; |
80 | |
81 | static_assert(TYPE_MAP < kRepeatedMask, "Invalid enum" ); |
82 | |
83 | struct PROTOBUF_EXPORT FieldMetadata { |
84 | uint32 offset; // offset of this field in the struct |
85 | uint32 tag; // field * 8 + wire_type |
86 | // byte offset * 8 + bit_offset; |
87 | // if the high bit is set then this is the byte offset of the oneof_case |
88 | // for this field. |
89 | uint32 has_offset; |
90 | uint32 type; // the type of this field. |
91 | const void* ptr; // auxiliary data |
92 | |
93 | // From the serializer point of view each fundamental type can occur in |
94 | // 4 different ways. For simplicity we treat all combinations as a cartesion |
95 | // product although not all combinations are allowed. |
96 | enum FieldTypeClass { |
97 | kPresence, |
98 | kNoPresence, |
99 | kRepeated, |
100 | kPacked, |
101 | kOneOf, |
102 | kNumTypeClasses // must be last enum |
103 | }; |
104 | // C++ protobuf has 20 fundamental types, were we added Cord and StringPiece |
105 | // and also distinquish the same types if they have different wire format. |
106 | enum { |
107 | kCordType = 19, |
108 | kStringPieceType = 20, |
109 | kInlinedType = 21, |
110 | kNumTypes = 21, |
111 | kSpecial = kNumTypes * kNumTypeClasses, |
112 | }; |
113 | |
114 | static int CalculateType(int fundamental_type, FieldTypeClass type_class); |
115 | }; |
116 | |
117 | // TODO(ckennelly): Add a static assertion to ensure that these masks do not |
118 | // conflict with wiretypes. |
119 | |
120 | // ParseTableField is kept small to help simplify instructions for computing |
121 | // offsets, as we will always need this information to parse a field. |
122 | // Additional data, needed for some types, is stored in |
123 | // AuxillaryParseTableField. |
124 | struct ParseTableField { |
125 | uint32 offset; |
126 | // The presence_index ordinarily represents a has_bit index, but for fields |
127 | // inside a oneof it represents the index in _oneof_case_. |
128 | uint32 presence_index; |
129 | unsigned char normal_wiretype; |
130 | unsigned char packed_wiretype; |
131 | |
132 | // processing_type is given by: |
133 | // (FieldDescriptor->type() << 1) | FieldDescriptor->is_packed() |
134 | unsigned char processing_type; |
135 | |
136 | unsigned char tag_size; |
137 | }; |
138 | |
139 | struct ParseTable; |
140 | |
141 | union AuxillaryParseTableField { |
142 | typedef bool (*EnumValidator)(int); |
143 | |
144 | // Enums |
145 | struct enum_aux { |
146 | EnumValidator validator; |
147 | }; |
148 | enum_aux enums; |
149 | // Group, messages |
150 | struct message_aux { |
151 | // ExplicitlyInitialized<T> -> T requires a reinterpret_cast, which prevents |
152 | // the tables from being constructed as a constexpr. We use void to avoid |
153 | // the cast. |
154 | const void* default_message_void; |
155 | const MessageLite* default_message() const { |
156 | return static_cast<const MessageLite*>(default_message_void); |
157 | } |
158 | }; |
159 | message_aux messages; |
160 | // Strings |
161 | struct string_aux { |
162 | const void* default_ptr; |
163 | const char* field_name; |
164 | }; |
165 | string_aux strings; |
166 | |
167 | struct map_aux { |
168 | bool (*parse_map)(io::CodedInputStream*, void*); |
169 | }; |
170 | map_aux maps; |
171 | |
172 | AuxillaryParseTableField() = default; |
173 | constexpr AuxillaryParseTableField(AuxillaryParseTableField::enum_aux e) |
174 | : enums(e) {} |
175 | constexpr AuxillaryParseTableField(AuxillaryParseTableField::message_aux m) |
176 | : messages(m) {} |
177 | constexpr AuxillaryParseTableField(AuxillaryParseTableField::string_aux s) |
178 | : strings(s) {} |
179 | constexpr AuxillaryParseTableField(AuxillaryParseTableField::map_aux m) |
180 | : maps(m) {} |
181 | }; |
182 | |
183 | struct ParseTable { |
184 | const ParseTableField* fields; |
185 | const AuxillaryParseTableField* aux; |
186 | int max_field_number; |
187 | // TODO(ckennelly): Do something with this padding. |
188 | |
189 | // TODO(ckennelly): Vet these for sign extension. |
190 | int64 has_bits_offset; |
191 | int64 oneof_case_offset; |
192 | int64 extension_offset; |
193 | int64 arena_offset; |
194 | |
195 | // ExplicitlyInitialized<T> -> T requires a reinterpret_cast, which prevents |
196 | // the tables from being constructed as a constexpr. We use void to avoid |
197 | // the cast. |
198 | const void* default_instance_void; |
199 | const MessageLite* default_instance() const { |
200 | return static_cast<const MessageLite*>(default_instance_void); |
201 | } |
202 | |
203 | bool unknown_field_set; |
204 | }; |
205 | |
206 | static_assert(sizeof(ParseTableField) <= 16, "ParseTableField is too large" ); |
207 | // The tables must be composed of POD components to ensure link-time |
208 | // initialization. |
209 | static_assert(std::is_pod<ParseTableField>::value, "" ); |
210 | static_assert(std::is_pod<AuxillaryParseTableField>::value, "" ); |
211 | static_assert(std::is_pod<AuxillaryParseTableField::enum_aux>::value, "" ); |
212 | static_assert(std::is_pod<AuxillaryParseTableField::message_aux>::value, "" ); |
213 | static_assert(std::is_pod<AuxillaryParseTableField::string_aux>::value, "" ); |
214 | static_assert(std::is_pod<ParseTable>::value, "" ); |
215 | |
216 | // TODO(ckennelly): Consolidate these implementations into a single one, using |
217 | // dynamic dispatch to the appropriate unknown field handler. |
218 | bool MergePartialFromCodedStream(MessageLite* msg, const ParseTable& table, |
219 | io::CodedInputStream* input); |
220 | bool MergePartialFromCodedStreamLite(MessageLite* msg, const ParseTable& table, |
221 | io::CodedInputStream* input); |
222 | |
223 | template <typename Entry> |
224 | bool ParseMap(io::CodedInputStream* input, void* map_field) { |
225 | typedef typename MapEntryToMapField<Entry>::MapFieldType MapFieldType; |
226 | typedef Map<typename Entry::EntryKeyType, typename Entry::EntryValueType> |
227 | MapType; |
228 | typedef typename Entry::template Parser<MapFieldType, MapType> ParserType; |
229 | |
230 | ParserType parser(static_cast<MapFieldType*>(map_field)); |
231 | return WireFormatLite::ReadMessageNoVirtual(input, &parser); |
232 | } |
233 | |
234 | struct SerializationTable { |
235 | int num_fields; |
236 | const FieldMetadata* field_table; |
237 | }; |
238 | |
239 | PROTOBUF_EXPORT void SerializeInternal(const uint8* base, |
240 | const FieldMetadata* table, |
241 | int32 num_fields, |
242 | io::CodedOutputStream* output); |
243 | |
244 | inline void TableSerialize(const MessageLite& msg, |
245 | const SerializationTable* table, |
246 | io::CodedOutputStream* output) { |
247 | const FieldMetadata* field_table = table->field_table; |
248 | int num_fields = table->num_fields - 1; |
249 | const uint8* base = reinterpret_cast<const uint8*>(&msg); |
250 | // TODO(gerbens) This skips the first test if we could use the fast |
251 | // array serialization path, we should make this |
252 | // int cached_size = |
253 | // *reinterpret_cast<const int32*>(base + field_table->offset); |
254 | // SerializeWithCachedSize(msg, field_table + 1, num_fields, cached_size, ...) |
255 | // But we keep conformance with the old way for now. |
256 | SerializeInternal(base, table: field_table + 1, num_fields, output); |
257 | } |
258 | |
259 | uint8* SerializeInternalToArray(const uint8* base, const FieldMetadata* table, |
260 | int32 num_fields, bool is_deterministic, |
261 | uint8* buffer); |
262 | |
263 | inline uint8* TableSerializeToArray(const MessageLite& msg, |
264 | const SerializationTable* table, |
265 | bool is_deterministic, uint8* buffer) { |
266 | const uint8* base = reinterpret_cast<const uint8*>(&msg); |
267 | const FieldMetadata* field_table = table->field_table + 1; |
268 | int num_fields = table->num_fields - 1; |
269 | return SerializeInternalToArray(base, table: field_table, num_fields, |
270 | is_deterministic, buffer); |
271 | } |
272 | |
273 | template <typename T> |
274 | struct CompareHelper { |
275 | bool operator()(const T& a, const T& b) const { return a < b; } |
276 | }; |
277 | |
278 | template <> |
279 | struct CompareHelper<ArenaStringPtr> { |
280 | bool operator()(const ArenaStringPtr& a, const ArenaStringPtr& b) const { |
281 | return a.Get() < b.Get(); |
282 | } |
283 | }; |
284 | |
285 | struct CompareMapKey { |
286 | template <typename T> |
287 | bool operator()(const MapEntryHelper<T>& a, |
288 | const MapEntryHelper<T>& b) const { |
289 | return Compare(a.key_, b.key_); |
290 | } |
291 | template <typename T> |
292 | bool Compare(const T& a, const T& b) const { |
293 | return CompareHelper<T>()(a, b); |
294 | } |
295 | }; |
296 | |
297 | template <typename MapFieldType, const SerializationTable* table> |
298 | void MapFieldSerializer(const uint8* base, uint32 offset, uint32 tag, |
299 | uint32 has_offset, io::CodedOutputStream* output) { |
300 | typedef MapEntryHelper<typename MapFieldType::EntryTypeTrait> Entry; |
301 | typedef typename MapFieldType::MapType::const_iterator Iter; |
302 | |
303 | const MapFieldType& map_field = |
304 | *reinterpret_cast<const MapFieldType*>(base + offset); |
305 | const SerializationTable* t = |
306 | table + |
307 | has_offset; // has_offset is overloaded for maps to mean table offset |
308 | if (!output->IsSerializationDeterministic()) { |
309 | for (Iter it = map_field.GetMap().begin(); it != map_field.GetMap().end(); |
310 | ++it) { |
311 | Entry map_entry(*it); |
312 | output->WriteVarint32(value: tag); |
313 | output->WriteVarint32(value: map_entry._cached_size_); |
314 | SerializeInternal(base: reinterpret_cast<const uint8*>(&map_entry), |
315 | table: t->field_table, num_fields: t->num_fields, output); |
316 | } |
317 | } else { |
318 | std::vector<Entry> v; |
319 | for (Iter it = map_field.GetMap().begin(); it != map_field.GetMap().end(); |
320 | ++it) { |
321 | v.push_back(Entry(*it)); |
322 | } |
323 | std::sort(v.begin(), v.end(), CompareMapKey()); |
324 | for (int i = 0; i < v.size(); i++) { |
325 | output->WriteVarint32(value: tag); |
326 | output->WriteVarint32(value: v[i]._cached_size_); |
327 | SerializeInternal(base: reinterpret_cast<const uint8*>(&v[i]), table: t->field_table, |
328 | num_fields: t->num_fields, output); |
329 | } |
330 | } |
331 | } |
332 | |
333 | } // namespace internal |
334 | } // namespace protobuf |
335 | } // namespace google |
336 | |
337 | #include <google/protobuf/port_undef.inc> |
338 | |
339 | #endif // GOOGLE_PROTOBUF_GENERATED_MESSAGE_TABLE_DRIVEN_H__ |
340 | |