1 // Protocol Buffers - Google's data interchange format
2 // Copyright 2008 Google Inc. All rights reserved.
3 // https://developers.google.com/protocol-buffers/
4 //
5 // Redistribution and use in source and binary forms, with or without
6 // modification, are permitted provided that the following conditions are
7 // met:
8 //
9 // * Redistributions of source code must retain the above copyright
10 // notice, this list of conditions and the following disclaimer.
11 // * Redistributions in binary form must reproduce the above
12 // copyright notice, this list of conditions and the following disclaimer
13 // in the documentation and/or other materials provided with the
14 // distribution.
15 // * Neither the name of Google Inc. nor the names of its
16 // contributors may be used to endorse or promote products derived from
17 // this software without specific prior written permission.
18 //
19 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
31 #ifndef GOOGLE_PROTOBUF_GENERATED_MESSAGE_TABLE_DRIVEN_H__
32 #define GOOGLE_PROTOBUF_GENERATED_MESSAGE_TABLE_DRIVEN_H__
33
34 #include <google/protobuf/map.h>
35 #include <google/protobuf/map_entry_lite.h>
36 #include <google/protobuf/map_field_lite.h>
37 #include <google/protobuf/message_lite.h>
38 #include <google/protobuf/wire_format_lite.h>
39
40 // We require C++11 and Clang to use constexpr for variables, as GCC 4.8
41 // requires constexpr to be consistent between declarations of variables
42 // unnecessarily (see https://gcc.gnu.org/bugzilla/show_bug.cgi?id=58541).
43 // VS 2017 Update 3 also supports this usage of constexpr.
44 #if defined(__clang__) || (defined(_MSC_VER) && _MSC_VER >= 1911)
45 #define PROTOBUF_CONSTEXPR_VAR constexpr
46 #else // !__clang__
47 #define PROTOBUF_CONSTEXPR_VAR
48 #endif // !_clang
49
50 #ifdef SWIG
51 #error "You cannot SWIG proto headers"
52 #endif
53
54 #include <google/protobuf/port_def.inc>
55
56 namespace google {
57 namespace protobuf {
58 namespace internal {
59
60 // Processing-type masks.
61 static constexpr const unsigned char kOneofMask = 0x40;
62 static constexpr const unsigned char kRepeatedMask = 0x20;
63 // Mask for the raw type: either a WireFormatLite::FieldType or one of the
64 // ProcessingTypes below, without the oneof or repeated flag.
65 static constexpr const unsigned char kTypeMask = 0x1f;
66
67 // Wire type masks.
68 static constexpr const unsigned char kNotPackedMask = 0x10;
69 static constexpr const unsigned char kInvalidMask = 0x20;
70
71 enum ProcessingTypes {
72 TYPE_STRING_CORD = 19,
73 TYPE_STRING_STRING_PIECE = 20,
74 TYPE_BYTES_CORD = 21,
75 TYPE_BYTES_STRING_PIECE = 22,
76 TYPE_STRING_INLINED = 23,
77 TYPE_BYTES_INLINED = 24,
78 TYPE_MAP = 25,
79 };
80
81 static_assert(TYPE_MAP < kRepeatedMask, "Invalid enum");
82
83 struct PROTOBUF_EXPORT FieldMetadata {
84 uint32 offset; // offset of this field in the struct
85 uint32 tag; // field * 8 + wire_type
86 // byte offset * 8 + bit_offset;
87 // if the high bit is set then this is the byte offset of the oneof_case
88 // for this field.
89 uint32 has_offset;
90 uint32 type; // the type of this field.
91 const void* ptr; // auxiliary data
92
93 // From the serializer point of view each fundamental type can occur in
94 // 4 different ways. For simplicity we treat all combinations as a cartesion
95 // product although not all combinations are allowed.
96 enum FieldTypeClass {
97 kPresence,
98 kNoPresence,
99 kRepeated,
100 kPacked,
101 kOneOf,
102 kNumTypeClasses // must be last enum
103 };
104 // C++ protobuf has 20 fundamental types, were we added Cord and StringPiece
105 // and also distinquish the same types if they have different wire format.
106 enum {
107 kCordType = 19,
108 kStringPieceType = 20,
109 kInlinedType = 21,
110 kNumTypes = 21,
111 kSpecial = kNumTypes * kNumTypeClasses,
112 };
113
114 static int CalculateType(int fundamental_type, FieldTypeClass type_class);
115 };
116
117 // TODO(ckennelly): Add a static assertion to ensure that these masks do not
118 // conflict with wiretypes.
119
120 // ParseTableField is kept small to help simplify instructions for computing
121 // offsets, as we will always need this information to parse a field.
122 // Additional data, needed for some types, is stored in
123 // AuxiliaryParseTableField.
124 struct ParseTableField {
125 uint32 offset;
126 // The presence_index ordinarily represents a has_bit index, but for fields
127 // inside a oneof it represents the index in _oneof_case_.
128 uint32 presence_index;
129 unsigned char normal_wiretype;
130 unsigned char packed_wiretype;
131
132 // processing_type is given by:
133 // (FieldDescriptor->type() << 1) | FieldDescriptor->is_packed()
134 unsigned char processing_type;
135
136 unsigned char tag_size;
137 };
138
139 struct ParseTable;
140
141 union AuxiliaryParseTableField {
142 typedef bool (*EnumValidator)(int);
143
144 // Enums
145 struct enum_aux {
146 EnumValidator validator;
147 };
148 enum_aux enums;
149 // Group, messages
150 struct message_aux {
151 // ExplicitlyInitialized<T> -> T requires a reinterpret_cast, which prevents
152 // the tables from being constructed as a constexpr. We use void to avoid
153 // the cast.
154 const void* default_message_void;
default_messageAuxiliaryParseTableField::message_aux155 const MessageLite* default_message() const {
156 return static_cast<const MessageLite*>(default_message_void);
157 }
158 };
159 message_aux messages;
160 // Strings
161 struct string_aux {
162 const void* default_ptr;
163 const char* field_name;
164 };
165 string_aux strings;
166
167 struct map_aux {
168 bool (*parse_map)(io::CodedInputStream*, void*);
169 };
170 map_aux maps;
171
172 AuxiliaryParseTableField() = default;
AuxiliaryParseTableField(AuxiliaryParseTableField::enum_aux e)173 constexpr AuxiliaryParseTableField(AuxiliaryParseTableField::enum_aux e)
174 : enums(e) {}
AuxiliaryParseTableField(AuxiliaryParseTableField::message_aux m)175 constexpr AuxiliaryParseTableField(AuxiliaryParseTableField::message_aux m)
176 : messages(m) {}
AuxiliaryParseTableField(AuxiliaryParseTableField::string_aux s)177 constexpr AuxiliaryParseTableField(AuxiliaryParseTableField::string_aux s)
178 : strings(s) {}
AuxiliaryParseTableField(AuxiliaryParseTableField::map_aux m)179 constexpr AuxiliaryParseTableField(AuxiliaryParseTableField::map_aux m)
180 : maps(m) {}
181 };
182
183 struct ParseTable {
184 const ParseTableField* fields;
185 const AuxiliaryParseTableField* aux;
186 int max_field_number;
187 // TODO(ckennelly): Do something with this padding.
188
189 // TODO(ckennelly): Vet these for sign extension.
190 int64 has_bits_offset;
191 int64 oneof_case_offset;
192 int64 extension_offset;
193 int64 arena_offset;
194
195 // ExplicitlyInitialized<T> -> T requires a reinterpret_cast, which prevents
196 // the tables from being constructed as a constexpr. We use void to avoid
197 // the cast.
198 const void* default_instance_void;
default_instanceParseTable199 const MessageLite* default_instance() const {
200 return static_cast<const MessageLite*>(default_instance_void);
201 }
202
203 bool unknown_field_set;
204 };
205
206 static_assert(sizeof(ParseTableField) <= 16, "ParseTableField is too large");
207 // The tables must be composed of POD components to ensure link-time
208 // initialization.
209 static_assert(std::is_pod<ParseTableField>::value, "");
210 static_assert(std::is_pod<AuxiliaryParseTableField>::value, "");
211 static_assert(std::is_pod<AuxiliaryParseTableField::enum_aux>::value, "");
212 static_assert(std::is_pod<AuxiliaryParseTableField::message_aux>::value, "");
213 static_assert(std::is_pod<AuxiliaryParseTableField::string_aux>::value, "");
214 static_assert(std::is_pod<ParseTable>::value, "");
215
216 // TODO(ckennelly): Consolidate these implementations into a single one, using
217 // dynamic dispatch to the appropriate unknown field handler.
218 bool MergePartialFromCodedStream(MessageLite* msg, const ParseTable& table,
219 io::CodedInputStream* input);
220 bool MergePartialFromCodedStreamLite(MessageLite* msg, const ParseTable& table,
221 io::CodedInputStream* input);
222
223 template <typename Entry>
ParseMap(io::CodedInputStream * input,void * map_field)224 bool ParseMap(io::CodedInputStream* input, void* map_field) {
225 typedef typename MapEntryToMapField<Entry>::MapFieldType MapFieldType;
226 typedef Map<typename Entry::EntryKeyType, typename Entry::EntryValueType>
227 MapType;
228 typedef typename Entry::template Parser<MapFieldType, MapType> ParserType;
229
230 ParserType parser(static_cast<MapFieldType*>(map_field));
231 return WireFormatLite::ReadMessageNoVirtual(input, &parser);
232 }
233
234 struct SerializationTable {
235 int num_fields;
236 const FieldMetadata* field_table;
237 };
238
239 PROTOBUF_EXPORT void SerializeInternal(const uint8* base,
240 const FieldMetadata* table,
241 int32 num_fields,
242 io::CodedOutputStream* output);
243
TableSerialize(const MessageLite & msg,const SerializationTable * table,io::CodedOutputStream * output)244 inline void TableSerialize(const MessageLite& msg,
245 const SerializationTable* table,
246 io::CodedOutputStream* output) {
247 const FieldMetadata* field_table = table->field_table;
248 int num_fields = table->num_fields - 1;
249 const uint8* base = reinterpret_cast<const uint8*>(&msg);
250 // TODO(gerbens) This skips the first test if we could use the fast
251 // array serialization path, we should make this
252 // int cached_size =
253 // *reinterpret_cast<const int32*>(base + field_table->offset);
254 // SerializeWithCachedSize(msg, field_table + 1, num_fields, cached_size, ...)
255 // But we keep conformance with the old way for now.
256 SerializeInternal(base, field_table + 1, num_fields, output);
257 }
258
259 uint8* SerializeInternalToArray(const uint8* base, const FieldMetadata* table,
260 int32 num_fields, bool is_deterministic,
261 uint8* buffer);
262
TableSerializeToArray(const MessageLite & msg,const SerializationTable * table,bool is_deterministic,uint8 * buffer)263 inline uint8* TableSerializeToArray(const MessageLite& msg,
264 const SerializationTable* table,
265 bool is_deterministic, uint8* buffer) {
266 const uint8* base = reinterpret_cast<const uint8*>(&msg);
267 const FieldMetadata* field_table = table->field_table + 1;
268 int num_fields = table->num_fields - 1;
269 return SerializeInternalToArray(base, field_table, num_fields,
270 is_deterministic, buffer);
271 }
272
273 template <typename T>
274 struct CompareHelper {
operatorCompareHelper275 bool operator()(const T& a, const T& b) const { return a < b; }
276 };
277
278 template <>
279 struct CompareHelper<ArenaStringPtr> {
280 bool operator()(const ArenaStringPtr& a, const ArenaStringPtr& b) const {
281 return a.Get() < b.Get();
282 }
283 };
284
285 struct CompareMapKey {
286 template <typename T>
287 bool operator()(const MapEntryHelper<T>& a,
288 const MapEntryHelper<T>& b) const {
289 return Compare(a.key_, b.key_);
290 }
291 template <typename T>
292 bool Compare(const T& a, const T& b) const {
293 return CompareHelper<T>()(a, b);
294 }
295 };
296
297 template <typename MapFieldType, const SerializationTable* table>
298 void MapFieldSerializer(const uint8* base, uint32 offset, uint32 tag,
299 uint32 has_offset, io::CodedOutputStream* output) {
300 typedef MapEntryHelper<typename MapFieldType::EntryTypeTrait> Entry;
301 typedef typename MapFieldType::MapType::const_iterator Iter;
302
303 const MapFieldType& map_field =
304 *reinterpret_cast<const MapFieldType*>(base + offset);
305 const SerializationTable* t =
306 table +
307 has_offset; // has_offset is overloaded for maps to mean table offset
308 if (!output->IsSerializationDeterministic()) {
309 for (Iter it = map_field.GetMap().begin(); it != map_field.GetMap().end();
310 ++it) {
311 Entry map_entry(*it);
312 output->WriteVarint32(tag);
313 output->WriteVarint32(map_entry._cached_size_);
314 SerializeInternal(reinterpret_cast<const uint8*>(&map_entry),
315 t->field_table, t->num_fields, output);
316 }
317 } else {
318 std::vector<Entry> v;
319 for (Iter it = map_field.GetMap().begin(); it != map_field.GetMap().end();
320 ++it) {
321 v.push_back(Entry(*it));
322 }
323 std::sort(v.begin(), v.end(), CompareMapKey());
324 for (int i = 0; i < v.size(); i++) {
325 output->WriteVarint32(tag);
326 output->WriteVarint32(v[i]._cached_size_);
327 SerializeInternal(reinterpret_cast<const uint8*>(&v[i]), t->field_table,
328 t->num_fields, output);
329 }
330 }
331 }
332
333 } // namespace internal
334 } // namespace protobuf
335 } // namespace google
336
337 #include <google/protobuf/port_undef.inc>
338
339 #endif // GOOGLE_PROTOBUF_GENERATED_MESSAGE_TABLE_DRIVEN_H__
340