1 // Protocol Buffers - Google's data interchange format
2 // Copyright 2023 Google LLC. All rights reserved.
3 //
4 // Use of this source code is governed by a BSD-style
5 // license that can be found in the LICENSE file or at
6 // https://developers.google.com/open-source/licenses/bsd
7
8 #include "upb/reflection/internal/enum_def.h"
9
10 #include <stddef.h>
11 #include <stdint.h>
12 #include <string.h>
13
14 #include "upb/base/status.h"
15 #include "upb/base/string_view.h"
16 #include "upb/hash/common.h"
17 #include "upb/hash/int_table.h"
18 #include "upb/hash/str_table.h"
19 #include "upb/mem/arena.h"
20 #include "upb/mini_descriptor/decode.h"
21 #include "upb/mini_descriptor/internal/encode.h"
22 #include "upb/mini_table/enum.h"
23 #include "upb/mini_table/file.h"
24 #include "upb/reflection/def.h"
25 #include "upb/reflection/def_type.h"
26 #include "upb/reflection/internal/def_builder.h"
27 #include "upb/reflection/internal/desc_state.h"
28 #include "upb/reflection/internal/enum_reserved_range.h"
29 #include "upb/reflection/internal/enum_value_def.h"
30 #include "upb/reflection/internal/file_def.h"
31 #include "upb/reflection/internal/strdup2.h"
32
33 // Must be last.
34 #include "upb/port/def.inc"
35
36 struct upb_EnumDef {
37 const UPB_DESC(EnumOptions*) opts;
38 const UPB_DESC(FeatureSet*) resolved_features;
39 const upb_MiniTableEnum* layout; // Only for proto2.
40 const upb_FileDef* file;
41 const upb_MessageDef* containing_type; // Could be merged with "file".
42 const char* full_name;
43 upb_strtable ntoi;
44 upb_inttable iton;
45 const upb_EnumValueDef* values;
46 const upb_EnumReservedRange* res_ranges;
47 const upb_StringView* res_names;
48 int value_count;
49 int res_range_count;
50 int res_name_count;
51 int32_t defaultval;
52 bool is_sorted; // Whether all of the values are defined in ascending order.
53 #if UINTPTR_MAX == 0xffffffff
54 uint32_t padding; // Increase size to a multiple of 8.
55 #endif
56 };
57
_upb_EnumDef_At(const upb_EnumDef * e,int i)58 upb_EnumDef* _upb_EnumDef_At(const upb_EnumDef* e, int i) {
59 return (upb_EnumDef*)&e[i];
60 }
61
_upb_EnumDef_MiniTable(const upb_EnumDef * e)62 const upb_MiniTableEnum* _upb_EnumDef_MiniTable(const upb_EnumDef* e) {
63 return e->layout;
64 }
65
_upb_EnumDef_Insert(upb_EnumDef * e,upb_EnumValueDef * v,upb_Arena * a)66 bool _upb_EnumDef_Insert(upb_EnumDef* e, upb_EnumValueDef* v, upb_Arena* a) {
67 const char* name = upb_EnumValueDef_Name(v);
68 const upb_value val = upb_value_constptr(v);
69 bool ok = upb_strtable_insert(&e->ntoi, name, strlen(name), val, a);
70 if (!ok) return false;
71
72 // Multiple enumerators can have the same number, first one wins.
73 const int number = upb_EnumValueDef_Number(v);
74 if (!upb_inttable_lookup(&e->iton, number, NULL)) {
75 return upb_inttable_insert(&e->iton, number, val, a);
76 }
77 return true;
78 }
79
UPB_DESC(EnumOptions)80 const UPB_DESC(EnumOptions) * upb_EnumDef_Options(const upb_EnumDef* e) {
81 return e->opts;
82 }
83
upb_EnumDef_HasOptions(const upb_EnumDef * e)84 bool upb_EnumDef_HasOptions(const upb_EnumDef* e) {
85 return e->opts != (void*)kUpbDefOptDefault;
86 }
87
UPB_DESC(FeatureSet)88 const UPB_DESC(FeatureSet) *
89 upb_EnumDef_ResolvedFeatures(const upb_EnumDef* e) {
90 return e->resolved_features;
91 }
92
upb_EnumDef_FullName(const upb_EnumDef * e)93 const char* upb_EnumDef_FullName(const upb_EnumDef* e) { return e->full_name; }
94
upb_EnumDef_Name(const upb_EnumDef * e)95 const char* upb_EnumDef_Name(const upb_EnumDef* e) {
96 return _upb_DefBuilder_FullToShort(e->full_name);
97 }
98
upb_EnumDef_File(const upb_EnumDef * e)99 const upb_FileDef* upb_EnumDef_File(const upb_EnumDef* e) { return e->file; }
100
upb_EnumDef_ContainingType(const upb_EnumDef * e)101 const upb_MessageDef* upb_EnumDef_ContainingType(const upb_EnumDef* e) {
102 return e->containing_type;
103 }
104
upb_EnumDef_Default(const upb_EnumDef * e)105 int32_t upb_EnumDef_Default(const upb_EnumDef* e) {
106 UPB_ASSERT(upb_EnumDef_FindValueByNumber(e, e->defaultval));
107 return e->defaultval;
108 }
109
upb_EnumDef_ReservedRangeCount(const upb_EnumDef * e)110 int upb_EnumDef_ReservedRangeCount(const upb_EnumDef* e) {
111 return e->res_range_count;
112 }
113
upb_EnumDef_ReservedRange(const upb_EnumDef * e,int i)114 const upb_EnumReservedRange* upb_EnumDef_ReservedRange(const upb_EnumDef* e,
115 int i) {
116 UPB_ASSERT(0 <= i && i < e->res_range_count);
117 return _upb_EnumReservedRange_At(e->res_ranges, i);
118 }
119
upb_EnumDef_ReservedNameCount(const upb_EnumDef * e)120 int upb_EnumDef_ReservedNameCount(const upb_EnumDef* e) {
121 return e->res_name_count;
122 }
123
upb_EnumDef_ReservedName(const upb_EnumDef * e,int i)124 upb_StringView upb_EnumDef_ReservedName(const upb_EnumDef* e, int i) {
125 UPB_ASSERT(0 <= i && i < e->res_name_count);
126 return e->res_names[i];
127 }
128
upb_EnumDef_ValueCount(const upb_EnumDef * e)129 int upb_EnumDef_ValueCount(const upb_EnumDef* e) { return e->value_count; }
130
upb_EnumDef_FindValueByName(const upb_EnumDef * e,const char * name)131 const upb_EnumValueDef* upb_EnumDef_FindValueByName(const upb_EnumDef* e,
132 const char* name) {
133 return upb_EnumDef_FindValueByNameWithSize(e, name, strlen(name));
134 }
135
upb_EnumDef_FindValueByNameWithSize(const upb_EnumDef * e,const char * name,size_t size)136 const upb_EnumValueDef* upb_EnumDef_FindValueByNameWithSize(
137 const upb_EnumDef* e, const char* name, size_t size) {
138 upb_value v;
139 return upb_strtable_lookup2(&e->ntoi, name, size, &v)
140 ? upb_value_getconstptr(v)
141 : NULL;
142 }
143
upb_EnumDef_FindValueByNumber(const upb_EnumDef * e,int32_t num)144 const upb_EnumValueDef* upb_EnumDef_FindValueByNumber(const upb_EnumDef* e,
145 int32_t num) {
146 upb_value v;
147 return upb_inttable_lookup(&e->iton, num, &v) ? upb_value_getconstptr(v)
148 : NULL;
149 }
150
upb_EnumDef_CheckNumber(const upb_EnumDef * e,int32_t num)151 bool upb_EnumDef_CheckNumber(const upb_EnumDef* e, int32_t num) {
152 // We could use upb_EnumDef_FindValueByNumber(e, num) != NULL, but we expect
153 // this to be faster (especially for small numbers).
154 return upb_MiniTableEnum_CheckValue(e->layout, num);
155 }
156
upb_EnumDef_Value(const upb_EnumDef * e,int i)157 const upb_EnumValueDef* upb_EnumDef_Value(const upb_EnumDef* e, int i) {
158 UPB_ASSERT(0 <= i && i < e->value_count);
159 return _upb_EnumValueDef_At(e->values, i);
160 }
161
upb_EnumDef_IsClosed(const upb_EnumDef * e)162 bool upb_EnumDef_IsClosed(const upb_EnumDef* e) {
163 if (UPB_TREAT_CLOSED_ENUMS_LIKE_OPEN) return false;
164 return upb_EnumDef_IsSpecifiedAsClosed(e);
165 }
166
upb_EnumDef_IsSpecifiedAsClosed(const upb_EnumDef * e)167 bool upb_EnumDef_IsSpecifiedAsClosed(const upb_EnumDef* e) {
168 return UPB_DESC(FeatureSet_enum_type)(e->resolved_features) ==
169 UPB_DESC(FeatureSet_CLOSED);
170 }
171
upb_EnumDef_MiniDescriptorEncode(const upb_EnumDef * e,upb_Arena * a,upb_StringView * out)172 bool upb_EnumDef_MiniDescriptorEncode(const upb_EnumDef* e, upb_Arena* a,
173 upb_StringView* out) {
174 upb_DescState s;
175 _upb_DescState_Init(&s);
176
177 const upb_EnumValueDef** sorted = NULL;
178 if (!e->is_sorted) {
179 sorted = _upb_EnumValueDefs_Sorted(e->values, e->value_count, a);
180 if (!sorted) return false;
181 }
182
183 if (!_upb_DescState_Grow(&s, a)) return false;
184 s.ptr = upb_MtDataEncoder_StartEnum(&s.e, s.ptr);
185
186 // Duplicate values are allowed but we only encode each value once.
187 uint32_t previous = 0;
188
189 for (int i = 0; i < e->value_count; i++) {
190 const uint32_t current =
191 upb_EnumValueDef_Number(sorted ? sorted[i] : upb_EnumDef_Value(e, i));
192 if (i != 0 && previous == current) continue;
193
194 if (!_upb_DescState_Grow(&s, a)) return false;
195 s.ptr = upb_MtDataEncoder_PutEnumValue(&s.e, s.ptr, current);
196 previous = current;
197 }
198
199 if (!_upb_DescState_Grow(&s, a)) return false;
200 s.ptr = upb_MtDataEncoder_EndEnum(&s.e, s.ptr);
201
202 // There will always be room for this '\0' in the encoder buffer because
203 // kUpb_MtDataEncoder_MinSize is overkill for upb_MtDataEncoder_EndEnum().
204 UPB_ASSERT(s.ptr < s.buf + s.bufsize);
205 *s.ptr = '\0';
206
207 out->data = s.buf;
208 out->size = s.ptr - s.buf;
209 return true;
210 }
211
create_enumlayout(upb_DefBuilder * ctx,const upb_EnumDef * e)212 static upb_MiniTableEnum* create_enumlayout(upb_DefBuilder* ctx,
213 const upb_EnumDef* e) {
214 upb_StringView sv;
215 bool ok = upb_EnumDef_MiniDescriptorEncode(e, ctx->tmp_arena, &sv);
216 if (!ok) _upb_DefBuilder_Errf(ctx, "OOM while building enum MiniDescriptor");
217
218 upb_Status status;
219 upb_MiniTableEnum* layout =
220 upb_MiniTableEnum_Build(sv.data, sv.size, ctx->arena, &status);
221 if (!layout)
222 _upb_DefBuilder_Errf(ctx, "Error building enum MiniTable: %s", status.msg);
223 return layout;
224 }
225
_upb_EnumReservedNames_New(upb_DefBuilder * ctx,int n,const upb_StringView * protos)226 static upb_StringView* _upb_EnumReservedNames_New(
227 upb_DefBuilder* ctx, int n, const upb_StringView* protos) {
228 upb_StringView* sv = _upb_DefBuilder_Alloc(ctx, sizeof(upb_StringView) * n);
229 for (int i = 0; i < n; i++) {
230 sv[i].data =
231 upb_strdup2(protos[i].data, protos[i].size, _upb_DefBuilder_Arena(ctx));
232 sv[i].size = protos[i].size;
233 }
234 return sv;
235 }
236
create_enumdef(upb_DefBuilder * ctx,const char * prefix,const UPB_DESC (EnumDescriptorProto)* enum_proto,const UPB_DESC (FeatureSet *)parent_features,upb_EnumDef * e)237 static void create_enumdef(upb_DefBuilder* ctx, const char* prefix,
238 const UPB_DESC(EnumDescriptorProto) * enum_proto,
239 const UPB_DESC(FeatureSet*) parent_features,
240 upb_EnumDef* e) {
241 const UPB_DESC(EnumValueDescriptorProto)* const* values;
242 const UPB_DESC(EnumDescriptorProto_EnumReservedRange)* const* res_ranges;
243 const upb_StringView* res_names;
244 upb_StringView name;
245 size_t n_value, n_res_range, n_res_name;
246
247 UPB_DEF_SET_OPTIONS(e->opts, EnumDescriptorProto, EnumOptions, enum_proto);
248 e->resolved_features = _upb_DefBuilder_ResolveFeatures(
249 ctx, parent_features, UPB_DESC(EnumOptions_features)(e->opts));
250
251 // Must happen before _upb_DefBuilder_Add()
252 e->file = _upb_DefBuilder_File(ctx);
253
254 name = UPB_DESC(EnumDescriptorProto_name)(enum_proto);
255
256 e->full_name = _upb_DefBuilder_MakeFullName(ctx, prefix, name);
257 _upb_DefBuilder_Add(ctx, e->full_name,
258 _upb_DefType_Pack(e, UPB_DEFTYPE_ENUM));
259
260 values = UPB_DESC(EnumDescriptorProto_value)(enum_proto, &n_value);
261
262 bool ok = upb_strtable_init(&e->ntoi, n_value, ctx->arena);
263 if (!ok) _upb_DefBuilder_OomErr(ctx);
264
265 ok = upb_inttable_init(&e->iton, ctx->arena);
266 if (!ok) _upb_DefBuilder_OomErr(ctx);
267
268 e->defaultval = 0;
269 e->value_count = n_value;
270 e->values = _upb_EnumValueDefs_New(ctx, prefix, n_value, values,
271 e->resolved_features, e, &e->is_sorted);
272
273 if (n_value == 0) {
274 _upb_DefBuilder_Errf(ctx, "enums must contain at least one value (%s)",
275 e->full_name);
276 }
277
278 res_ranges =
279 UPB_DESC(EnumDescriptorProto_reserved_range)(enum_proto, &n_res_range);
280 e->res_range_count = n_res_range;
281 e->res_ranges = _upb_EnumReservedRanges_New(ctx, n_res_range, res_ranges, e);
282
283 res_names =
284 UPB_DESC(EnumDescriptorProto_reserved_name)(enum_proto, &n_res_name);
285 e->res_name_count = n_res_name;
286 e->res_names = _upb_EnumReservedNames_New(ctx, n_res_name, res_names);
287
288 upb_inttable_compact(&e->iton, ctx->arena);
289
290 if (upb_EnumDef_IsClosed(e)) {
291 if (ctx->layout) {
292 e->layout = upb_MiniTableFile_Enum(ctx->layout, ctx->enum_count++);
293 } else {
294 e->layout = create_enumlayout(ctx, e);
295 }
296 } else {
297 e->layout = NULL;
298 }
299 }
300
_upb_EnumDefs_New(upb_DefBuilder * ctx,int n,const UPB_DESC (EnumDescriptorProto *)const * protos,const UPB_DESC (FeatureSet *)parent_features,const upb_MessageDef * containing_type)301 upb_EnumDef* _upb_EnumDefs_New(upb_DefBuilder* ctx, int n,
302 const UPB_DESC(EnumDescriptorProto*)
303 const* protos,
304 const UPB_DESC(FeatureSet*) parent_features,
305 const upb_MessageDef* containing_type) {
306 _upb_DefType_CheckPadding(sizeof(upb_EnumDef));
307
308 // If a containing type is defined then get the full name from that.
309 // Otherwise use the package name from the file def.
310 const char* name = containing_type ? upb_MessageDef_FullName(containing_type)
311 : _upb_FileDef_RawPackage(ctx->file);
312
313 upb_EnumDef* e = _upb_DefBuilder_Alloc(ctx, sizeof(upb_EnumDef) * n);
314 for (int i = 0; i < n; i++) {
315 create_enumdef(ctx, name, protos[i], parent_features, &e[i]);
316 e[i].containing_type = containing_type;
317 }
318 return e;
319 }
320