• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Protocol Buffers - Google's data interchange format
2 // Copyright 2008 Google Inc.  All rights reserved.
3 // https://developers.google.com/protocol-buffers/
4 //
5 // Redistribution and use in source and binary forms, with or without
6 // modification, are permitted provided that the following conditions are
7 // met:
8 //
9 //     * Redistributions of source code must retain the above copyright
10 // notice, this list of conditions and the following disclaimer.
11 //     * Redistributions in binary form must reproduce the above
12 // copyright notice, this list of conditions and the following disclaimer
13 // in the documentation and/or other materials provided with the
14 // distribution.
15 //     * Neither the name of Google Inc. nor the names of its
16 // contributors may be used to endorse or promote products derived from
17 // this software without specific prior written permission.
18 //
19 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30 
31 #ifndef GOOGLE_PROTOBUF_ARENASTRING_H__
32 #define GOOGLE_PROTOBUF_ARENASTRING_H__
33 
34 #include <algorithm>
35 #include <string>
36 #include <type_traits>
37 #include <utility>
38 
39 #include <google/protobuf/stubs/logging.h>
40 #include <google/protobuf/stubs/common.h>
41 #include <google/protobuf/arena.h>
42 #include <google/protobuf/port.h>
43 #include <google/protobuf/explicitly_constructed.h>
44 
45 // must be last:
46 #include <google/protobuf/port_def.inc>
47 
48 #ifdef SWIG
49 #error "You cannot SWIG proto headers"
50 #endif
51 
52 
53 namespace google {
54 namespace protobuf {
55 namespace internal {
56 class EpsCopyInputStream;
57 
58 class SwapFieldHelper;
59 
60 // Declared in message_lite.h
61 PROTOBUF_EXPORT extern ExplicitlyConstructedArenaString
62     fixed_address_empty_string;
63 
64 // Lazy string instance to support string fields with non-empty default.
65 // These are initialized on the first call to .get().
66 class PROTOBUF_EXPORT LazyString {
67  public:
68   // We explicitly make LazyString an aggregate so that MSVC can do constant
69   // initialization on it without marking it `constexpr`.
70   // We do not want to use `constexpr` because it makes it harder to have extern
71   // storage for it and causes library bloat.
72   struct InitValue {
73     const char* ptr;
74     size_t size;
75   };
76   // We keep a union of the initialization value and the std::string to save on
77   // space. We don't need the string array after Init() is done.
78   union {
79     mutable InitValue init_value_;
80     alignas(std::string) mutable char string_buf_[sizeof(std::string)];
81   };
82   mutable std::atomic<const std::string*> inited_;
83 
get()84   const std::string& get() const {
85     // This check generates less code than a call-once invocation.
86     auto* res = inited_.load(std::memory_order_acquire);
87     if (PROTOBUF_PREDICT_FALSE(res == nullptr)) return Init();
88     return *res;
89   }
90 
91  private:
92   // Initialize the string in `string_buf_`, update `inited_` and return it.
93   // We return it here to avoid having to read it again in the inlined code.
94   const std::string& Init() const;
95 };
96 
97 class TaggedStringPtr {
98  public:
99   // Bit flags qualifying string properties. We can use 2 bits as
100   // ptr_ is guaranteed and enforced to be aligned on 4 byte boundaries.
101   enum Flags {
102     kArenaBit = 0x1,      // ptr is arena allocated
103     kMutableBit = 0x2,    // ptr contents are fully mutable
104     kMask = 0x3           // Bit mask
105   };
106 
107   // Composed logical types
108   enum Type {
109     // Default strings are immutable and never owned.
110     kDefault = 0,
111 
112     // Allocated strings are mutable and (as the name implies) owned.
113     // A heap allocated string must be deleted.
114     kAllocated = kMutableBit,
115 
116     // Mutable arena strings are strings where the string instance is owned
117     // by the arena, but the string contents itself are owned by the string
118     // instance. Mutable arena string instances need to be destroyed which is
119     // typically done through a cleanup action added to the arena owning it.
120     kMutableArena = kArenaBit | kMutableBit,
121 
122     // Fixed size arena strings are strings where both the string instance and
123     // the string contents are fully owned by the arena. Fixed size arena
124     // strings are a platform and c++ library specific customization. Fixed
125     // size arena strings are immutable, with the exception of custom internal
126     // updates to the content that fit inside the existing capacity.
127     // Fixed size arena strings must never be deleted or destroyed.
128     kFixedSizeArena = kArenaBit,
129   };
130 
131   TaggedStringPtr() = default;
TaggedStringPtr(ExplicitlyConstructedArenaString * ptr)132   explicit constexpr TaggedStringPtr(ExplicitlyConstructedArenaString* ptr)
133       : ptr_(ptr) {}
134 
135   // Sets the value to `p`, tagging the value as being a 'default' value.
136   // See documentation for kDefault for more info.
SetDefault(const std::string * p)137   inline const std::string* SetDefault(const std::string* p) {
138     return TagAs(kDefault, const_cast<std::string*>(p));
139   }
140 
141   // Sets the value to `p`, tagging the value as a heap allocated value.
142   // Allocated strings are mutable and (as the name implies) owned.
143   // `p` must not be null
SetAllocated(std::string * p)144   inline std::string* SetAllocated(std::string* p) {
145     return TagAs(kAllocated, p);
146   }
147 
148   // Sets the value to `p`, tagging the value as a fixed size arena string.
149   // See documentation for kFixedSizeArena for more info.
150   // `p` must not be null
SetFixedSizeArena(std::string * p)151   inline std::string* SetFixedSizeArena(std::string* p) {
152     return TagAs(kFixedSizeArena, p);
153   }
154 
155   // Sets the value to `p`, tagging the value as a mutable arena string.
156   // See documentation for kMutableArena for more info.
157   // `p` must not be null
SetMutableArena(std::string * p)158   inline std::string* SetMutableArena(std::string* p) {
159     return TagAs(kMutableArena, p);
160   }
161 
162   // Returns true if the contents of the current string are fully mutable.
IsMutable()163   inline bool IsMutable() const { return as_int() & kMutableBit; }
164 
165   // Returns true if the current string is an immutable default value.
IsDefault()166   inline bool IsDefault() const { return (as_int() & kMask) == kDefault; }
167 
168   // If the current string is a heap-allocated mutable value, returns a pointer
169   // to it.  Returns nullptr otherwise.
GetIfAllocated()170   inline std::string *GetIfAllocated() const {
171     auto allocated = as_int() ^ kAllocated;
172     if (allocated & kMask) return nullptr;
173 
174     auto ptr = reinterpret_cast<std::string*>(allocated);
175     PROTOBUF_ASSUME(ptr != nullptr);
176     return ptr;
177   }
178 
179   // Returns true if the current string is an arena allocated value.
180   // This means it's either a mutable or fixed size arena string.
IsArena()181   inline bool IsArena() const { return as_int() & kArenaBit; }
182 
183   // Returns true if the current string is a fixed size arena allocated value.
IsFixedSizeArena()184   inline bool IsFixedSizeArena() const {
185     return (as_int() & kMask) == kFixedSizeArena;
186   }
187 
188   // Returns the contained string pointer.
Get()189   inline std::string* Get() const {
190     return reinterpret_cast<std::string*>(as_int() & ~kMask);
191   }
192 
193   // Returns true if the contained pointer is null, indicating some error.
194   // The Null value is only used during parsing for temporary values.
195   // A persisted ArenaStringPtr value is never null.
IsNull()196   inline bool IsNull() { return ptr_ == nullptr; }
197 
198  private:
assert_aligned(const void * p)199   static inline void assert_aligned(const void* p) {
200     GOOGLE_DCHECK_EQ(reinterpret_cast<uintptr_t>(p) & kMask, 0UL);
201   }
202 
TagAs(Type type,std::string * p)203   inline std::string* TagAs(Type type, std::string* p) {
204     GOOGLE_DCHECK(p != nullptr);
205     assert_aligned(p);
206     ptr_ = reinterpret_cast<void*>(reinterpret_cast<uintptr_t>(p) | type);
207     return p;
208   }
209 
as_int()210   uintptr_t as_int() const { return reinterpret_cast<uintptr_t>(ptr_); }
211   void* ptr_;
212 };
213 
214 static_assert(std::is_trivial<TaggedStringPtr>::value,
215               "TaggedStringPtr must be trivial");
216 
217 // This class encapsulates a pointer to a std::string with or without arena
218 // owned contents, tagged by the bottom bits of the string pointer. It is a
219 // high-level wrapper that almost directly corresponds to the interface required
220 // by string fields in generated code. It replaces the old std::string* pointer
221 // in such cases.
222 //
223 // The string pointer is tagged to be either a default, externally owned value,
224 // a mutable heap allocated value, or an arena allocated value. The object uses
225 // a single global instance of an empty string that is used as the initial
226 // default value. Fields that have empty default values directly use this global
227 // default. Fields that have non empty default values are supported through
228 // lazily initialized default values managed by the LazyString class.
229 //
230 // Generated code and reflection code both ensure that ptr_ is never null.
231 // Because ArenaStringPtr is used in oneof unions, its constructor is a NOP and
232 // the field is always manually initialized via method calls.
233 //
234 // See TaggedStringPtr for more information about the types of string values
235 // being held, and the mutable and ownership invariants for each type.
236 struct PROTOBUF_EXPORT ArenaStringPtr {
237   ArenaStringPtr() = default;
ArenaStringPtrArenaStringPtr238   constexpr ArenaStringPtr(ExplicitlyConstructedArenaString* default_value,
239                            ConstantInitialized)
240       : tagged_ptr_(default_value) {}
241 
242   // Called from generated code / reflection runtime only. Resets value to point
243   // to a default string pointer, with the semantics that this ArenaStringPtr
244   // does not own the pointed-to memory. Disregards initial value of ptr_ (so
245   // this is the *ONLY* safe method to call after construction or when
246   // reinitializing after becoming the active field in a oneof union).
247   inline void InitDefault();
248 
249   // Similar to `InitDefault` except that it allows the default value to be
250   // initialized to an externally owned string. This method is called from
251   // parsing code. `str` must not be null and outlive this instance.
252   inline void InitExternal(const std::string* str);
253 
254   // Called from generated code / reflection runtime only. Resets the value of
255   // this instances to the heap allocated value in `str`. `str` must not be
256   // null. Invokes `arena->Own(str)` to transfer ownership into the arena if
257   // `arena` is not null, else, `str` will be owned by ArenaStringPtr. This
258   // function should only be used to initialize a ArenaStringPtr or on an
259   // instance known to not carry any heap allocated value.
260   inline void InitAllocated(std::string* str, Arena* arena);
261 
262   void Set(ConstStringParam value, Arena* arena);
263   void Set(std::string&& value, Arena* arena);
264   void Set(const char* s, Arena* arena);
265   void Set(const char* s, size_t n, Arena* arena);
266 
267   void SetBytes(ConstStringParam value, Arena* arena);
268   void SetBytes(std::string&& value, Arena* arena);
269   void SetBytes(const char* s, Arena* arena);
270   void SetBytes(const void* p, size_t n, Arena* arena);
271 
272   template <typename RefWrappedType>
SetArenaStringPtr273   void Set(std::reference_wrapper<RefWrappedType> const_string_ref,
274            ::google::protobuf::Arena* arena) {
275     Set(const_string_ref.get(), arena);
276   }
277 
278   // Returns a mutable std::string reference.
279   // The version accepting a `LazyString` value is used in the generated code to
280   // initialize mutable copies for fields with a non-empty default where the
281   // default value is lazily initialized.
282   std::string* Mutable(Arena* arena);
283   std::string* Mutable(const LazyString& default_value, Arena* arena);
284 
285   // Gets a mutable pointer with unspecified contents.
286   // This function is identical to Mutable(), except it is optimized for the
287   // case where the caller is not interested in the current contents. For
288   // example, if the current field is not mutable, it will re-initialize the
289   // value with an empty string rather than a (non-empty) default value.
290   // Likewise, if the current value is a fixed size arena string with contents,
291   // it will be initialized into an empty mutable arena string.
292   std::string* MutableNoCopy(Arena* arena);
293 
294   // Basic accessors.
GetArenaStringPtr295   PROTOBUF_NDEBUG_INLINE const std::string& Get() const {
296     // Unconditionally mask away the tag.
297     return *tagged_ptr_.Get();
298   }
299 
300   // Returns a pointer to the stored contents for this instance.
301   // This method is for internal debugging and tracking purposes only.
UnsafeGetPointerArenaStringPtr302   PROTOBUF_NDEBUG_INLINE const std::string* UnsafeGetPointer() const
303       PROTOBUF_RETURNS_NONNULL {
304     return tagged_ptr_.Get();
305   }
306 
307   // Release returns a std::string* instance that is heap-allocated and is not
308   // Own()'d by any arena. If the field is not set, this returns nullptr. The
309   // caller retains ownership. Clears this field back to the default state.
310   // Used to implement release_<field>() methods on generated classes.
311   PROTOBUF_NODISCARD std::string* Release();
312 
313   // Takes a std::string that is heap-allocated, and takes ownership. The
314   // std::string's destructor is registered with the arena. Used to implement
315   // set_allocated_<field> in generated classes.
316   void SetAllocated(std::string* value, Arena* arena);
317 
318   // Frees storage (if not on an arena).
319   void Destroy();
320 
321   // Clears content, but keeps allocated std::string, to avoid the overhead of
322   // heap operations. After this returns, the content (as seen by the user) will
323   // always be the empty std::string. Assumes that |default_value| is an empty
324   // std::string.
325   void ClearToEmpty();
326 
327   // Clears content, assuming that the current value is not the empty
328   // string default.
329   void ClearNonDefaultToEmpty();
330 
331   // Clears content, but keeps allocated std::string if arena != nullptr, to
332   // avoid the overhead of heap operations. After this returns, the content
333   // (as seen by the user) will always be equal to |default_value|.
334   void ClearToDefault(const LazyString& default_value, ::google::protobuf::Arena* arena);
335 
336   // Swaps internal pointers. Arena-safety semantics: this is guarded by the
337   // logic in Swap()/UnsafeArenaSwap() at the message level, so this method is
338   // 'unsafe' if called directly.
339   inline PROTOBUF_NDEBUG_INLINE static void InternalSwap(ArenaStringPtr* rhs,
340                                                          Arena* rhs_arena,
341                                                          ArenaStringPtr* lhs,
342                                                          Arena* lhs_arena);
343 
344   // Internal setter used only at parse time to directly set a donated string
345   // value.
UnsafeSetTaggedPointerArenaStringPtr346   void UnsafeSetTaggedPointer(TaggedStringPtr value) { tagged_ptr_ = value; }
347   // Generated code only! An optimization, in certain cases the generated
348   // code is certain we can obtain a std::string with no default checks and
349   // tag tests.
350   std::string* UnsafeMutablePointer() PROTOBUF_RETURNS_NONNULL;
351 
352   // Returns true if this instances holds an immutable default value.
IsDefaultArenaStringPtr353   inline bool IsDefault() const { return tagged_ptr_.IsDefault(); }
354 
355  private:
356   template <typename... Args>
NewStringArenaStringPtr357   inline std::string* NewString(Arena* arena, Args&&... args) {
358     if (arena == nullptr) {
359       auto* s = new std::string(std::forward<Args>(args)...);
360       return tagged_ptr_.SetAllocated(s);
361     } else {
362       auto* s = Arena::Create<std::string>(arena, std::forward<Args>(args)...);
363       return tagged_ptr_.SetMutableArena(s);
364     }
365   }
366 
367   TaggedStringPtr tagged_ptr_;
368 
IsFixedSizeArenaArenaStringPtr369   bool IsFixedSizeArena() const { return false; }
370 
371   // Swaps tagged pointer without debug hardening. This is to allow python
372   // protobuf to maintain pointer stability even in DEBUG builds.
UnsafeShallowSwapArenaStringPtr373   inline PROTOBUF_NDEBUG_INLINE static void UnsafeShallowSwap(
374       ArenaStringPtr* rhs, ArenaStringPtr* lhs) {
375     std::swap(lhs->tagged_ptr_, rhs->tagged_ptr_);
376   }
377 
378   friend class ::google::protobuf::internal::SwapFieldHelper;
379   friend class TcParser;
380 
381   // Slow paths.
382 
383   // MutableSlow requires that !IsString() || IsDefault
384   // Variadic to support 0 args for empty default and 1 arg for LazyString.
385   template <typename... Lazy>
386   std::string* MutableSlow(::google::protobuf::Arena* arena, const Lazy&... lazy_default);
387 
388   friend class EpsCopyInputStream;
389 };
390 
InitDefault()391 inline void ArenaStringPtr::InitDefault() {
392   tagged_ptr_ = TaggedStringPtr(&fixed_address_empty_string);
393 }
394 
InitExternal(const std::string * str)395 inline void ArenaStringPtr::InitExternal(const std::string* str) {
396   tagged_ptr_.SetDefault(str);
397 }
398 
InitAllocated(std::string * str,Arena * arena)399 inline void ArenaStringPtr::InitAllocated(std::string* str, Arena* arena) {
400   if (arena != nullptr) {
401     tagged_ptr_.SetMutableArena(str);
402     arena->Own(str);
403   } else {
404     tagged_ptr_.SetAllocated(str);
405   }
406 }
407 
Set(const char * s,Arena * arena)408 inline void ArenaStringPtr::Set(const char* s, Arena* arena) {
409   Set(ConstStringParam{s}, arena);
410 }
411 
Set(const char * s,size_t n,Arena * arena)412 inline void ArenaStringPtr::Set(const char* s, size_t n, Arena* arena) {
413   Set(ConstStringParam{s, n}, arena);
414 }
415 
SetBytes(ConstStringParam value,Arena * arena)416 inline void ArenaStringPtr::SetBytes(ConstStringParam value, Arena* arena) {
417   Set(value, arena);
418 }
419 
SetBytes(std::string && value,Arena * arena)420 inline void ArenaStringPtr::SetBytes(std::string&& value, Arena* arena) {
421   Set(std::move(value), arena);
422 }
423 
SetBytes(const char * s,Arena * arena)424 inline void ArenaStringPtr::SetBytes(const char* s, Arena* arena) {
425   Set(s, arena);
426 }
427 
SetBytes(const void * p,size_t n,Arena * arena)428 inline void ArenaStringPtr::SetBytes(const void* p, size_t n, Arena* arena) {
429   Set(ConstStringParam{static_cast<const char*>(p), n}, arena);
430 }
431 
432 // Make sure rhs_arena allocated rhs, and lhs_arena allocated lhs.
InternalSwap(ArenaStringPtr * rhs,Arena * rhs_arena,ArenaStringPtr * lhs,Arena * lhs_arena)433 inline PROTOBUF_NDEBUG_INLINE void ArenaStringPtr::InternalSwap(  //
434     ArenaStringPtr* rhs, Arena* rhs_arena,                        //
435     ArenaStringPtr* lhs, Arena* lhs_arena) {
436   // Silence unused variable warnings in release buildls.
437   (void)rhs_arena;
438   (void)lhs_arena;
439   std::swap(lhs->tagged_ptr_, rhs->tagged_ptr_);
440 #ifdef PROTOBUF_FORCE_COPY_IN_SWAP
441   auto force_realloc = [](ArenaStringPtr* p, Arena* arena) {
442     if (p->IsDefault()) return;
443     std::string* old_value = p->tagged_ptr_.Get();
444     std::string* new_value =
445         p->IsFixedSizeArena()
446             ? Arena::Create<std::string>(arena, *old_value)
447             : Arena::Create<std::string>(arena, std::move(*old_value));
448     if (arena == nullptr) {
449       delete old_value;
450       p->tagged_ptr_.SetAllocated(new_value);
451     } else {
452       p->tagged_ptr_.SetMutableArena(new_value);
453     }
454   };
455   // Because, at this point, tagged_ptr_ has been swapped, arena should also be
456   // swapped.
457   force_realloc(lhs, rhs_arena);
458   force_realloc(rhs, lhs_arena);
459 #endif  // PROTOBUF_FORCE_COPY_IN_SWAP
460 }
461 
ClearNonDefaultToEmpty()462 inline void ArenaStringPtr::ClearNonDefaultToEmpty() {
463   // Unconditionally mask away the tag.
464   tagged_ptr_.Get()->clear();
465 }
466 
UnsafeMutablePointer()467 inline std::string* ArenaStringPtr::UnsafeMutablePointer() {
468   GOOGLE_DCHECK(tagged_ptr_.IsMutable());
469   GOOGLE_DCHECK(tagged_ptr_.Get() != nullptr);
470   return tagged_ptr_.Get();
471 }
472 
473 
474 }  // namespace internal
475 }  // namespace protobuf
476 }  // namespace google
477 
478 #include <google/protobuf/port_undef.inc>
479 
480 #endif  // GOOGLE_PROTOBUF_ARENASTRING_H__
481