// Copyright 2016 the V8 project authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "src/snapshot/serializer.h"

#include "src/codegen/assembler-inl.h"
#include "src/common/globals.h"
#include "src/heap/heap-inl.h"  // For Space::identity().
#include "src/heap/memory-chunk-inl.h"
#include "src/heap/read-only-heap.h"
#include "src/interpreter/interpreter.h"
#include "src/objects/code.h"
#include "src/objects/js-array-buffer-inl.h"
#include "src/objects/js-array-inl.h"
#include "src/objects/map.h"
#include "src/objects/objects-body-descriptors-inl.h"
#include "src/objects/slots-inl.h"
#include "src/objects/smi.h"
#include "src/snapshot/serializer-deserializer.h"

namespace v8 {
namespace internal {

Serializer::Serializer(Isolate* isolate, Snapshot::SerializerFlags flags)
    : isolate_(isolate),
      hot_objects_(isolate->heap()),
      reference_map_(isolate),
      external_reference_encoder_(isolate),
      root_index_map_(isolate),
      deferred_objects_(isolate->heap()),
      forward_refs_per_pending_object_(isolate->heap()),
      flags_(flags)
#ifdef DEBUG
      ,
      back_refs_(isolate->heap()),
      stack_(isolate->heap())
#endif
{
#ifdef OBJECT_PRINT
  if (FLAG_serialization_statistics) {
    for (int space = 0; space < kNumberOfSnapshotSpaces; ++space) {
      // Value-initialized to 0.
      instance_type_count_[space] = std::make_unique<int[]>(kInstanceTypes);
      instance_type_size_[space] = std::make_unique<size_t[]>(kInstanceTypes);
    }
  }
#endif  // OBJECT_PRINT
}

void Serializer::CountAllocation(Map map, int size, SnapshotSpace space) {
  DCHECK(FLAG_serialization_statistics);

  const int space_number = static_cast<int>(space);
  allocation_size_[space_number] += size;
#ifdef OBJECT_PRINT
  int instance_type = map.instance_type();
  instance_type_count_[space_number][instance_type]++;
  instance_type_size_[space_number][instance_type] += size;
#endif  // OBJECT_PRINT
}

int Serializer::TotalAllocationSize() const {
  int sum = 0;
  for (int space = 0; space < kNumberOfSnapshotSpaces; space++) {
    sum += allocation_size_[space];
  }
  return sum;
}

void Serializer::OutputStatistics(const char* name) {
  if (!FLAG_serialization_statistics) return;

  PrintF("%s:\n", name);

  PrintF("  Spaces (bytes):\n");

  for (int space = 0; space < kNumberOfSnapshotSpaces; space++) {
    PrintF("%16s",
           BaseSpace::GetSpaceName(static_cast<AllocationSpace>(space)));
  }
  PrintF("\n");

  for (int space = 0; space < kNumberOfSnapshotSpaces; space++) {
    PrintF("%16zu", allocation_size_[space]);
  }

#ifdef OBJECT_PRINT
  PrintF("  Instance types (count and bytes):\n");
#define PRINT_INSTANCE_TYPE(Name)                                          \
  for (int space = 0; space < kNumberOfSnapshotSpaces; ++space) {          \
    if (instance_type_count_[space][Name]) {                               \
      PrintF("%10d %10zu %-10s %s\n", instance_type_count_[space][Name],   \
             instance_type_size_[space][Name],                             \
             BaseSpace::GetSpaceName(static_cast<AllocationSpace>(space)), \
             #Name);                                                       \
    }                                                                      \
  }
  INSTANCE_TYPE_LIST(PRINT_INSTANCE_TYPE)
#undef PRINT_INSTANCE_TYPE

  PrintF("\n");
#endif  // OBJECT_PRINT
}
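
// Objects that could not be serialized at their first visit (see
// ObjectSerializer::Serialize) sit in deferred_objects_ and are emitted
// here, after the walk that queued them. The trailing kSynchronize byte
// marks the end of the deferred section for the deserializer.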
void Serializer::SerializeDeferredObjects() {
  if (FLAG_trace_serializer) {
    PrintF("Serializing deferred objects\n");
  }
  WHILE_WITH_HANDLE_SCOPE(isolate(), !deferred_objects_.empty(), {
    Handle<HeapObject> obj = handle(deferred_objects_.Pop(), isolate());

    ObjectSerializer obj_serializer(this, obj, &sink_);
    obj_serializer.SerializeDeferred();
  });
  sink_.Put(kSynchronize, "Finished with deferred objects");
}

void Serializer::SerializeObject(Handle<HeapObject> obj) {
  // ThinStrings are just an indirection to an internalized string, so elide
  // the indirection and serialize the actual string directly.
  if (obj->IsThinString(isolate())) {
    obj = handle(ThinString::cast(*obj).actual(isolate()), isolate());
  }
  SerializeObjectImpl(obj);
}

bool Serializer::MustBeDeferred(HeapObject object) { return false; }

void Serializer::VisitRootPointers(Root root, const char* description,
                                   FullObjectSlot start, FullObjectSlot end) {
  for (FullObjectSlot current = start; current < end; ++current) {
    SerializeRootObject(current);
  }
}

void Serializer::SerializeRootObject(FullObjectSlot slot) {
  Object o = *slot;
  if (o.IsSmi()) {
    PutSmiRoot(slot);
  } else {
    SerializeObject(Handle<HeapObject>(slot.location()));
  }
}

#ifdef DEBUG
void Serializer::PrintStack() { PrintStack(std::cout); }

void Serializer::PrintStack(std::ostream& out) {
  for (const auto o : stack_) {
    o->Print(out);
    out << "\n";
  }
}
#endif  // DEBUG

bool Serializer::SerializeRoot(Handle<HeapObject> obj) {
  RootIndex root_index;
  // Derived serializers are responsible for determining if the root has
  // actually been serialized before calling this.
  if (root_index_map()->Lookup(*obj, &root_index)) {
    PutRoot(root_index);
    return true;
  }
  return false;
}

bool Serializer::SerializeHotObject(Handle<HeapObject> obj) {
  // Encode a reference to a hot object by its index in the working set.
  int index = hot_objects_.Find(*obj);
  if (index == HotObjectsList::kNotFound) return false;
  DCHECK(index >= 0 && index < kHotObjectCount);
  if (FLAG_trace_serializer) {
    PrintF(" Encoding hot object %d:", index);
    obj->ShortPrint();
    PrintF("\n");
  }
  sink_.Put(HotObject::Encode(index), "HotObject");
  return true;
}

bool Serializer::SerializeBackReference(Handle<HeapObject> obj) {
  const SerializerReference* reference = reference_map_.LookupReference(obj);
  if (reference == nullptr) return false;
  // Encode the location of an already deserialized object in order to write
  // its location into a later object. We can encode the location as an
  // offset from the start of the deserialized objects or as an offset
  // backwards from the current allocation pointer.
  if (reference->is_attached_reference()) {
    if (FLAG_trace_serializer) {
      PrintF(" Encoding attached reference %d\n",
             reference->attached_reference_index());
    }
    PutAttachedReference(*reference);
  } else {
    DCHECK(reference->is_back_reference());
    if (FLAG_trace_serializer) {
      PrintF(" Encoding back reference to: ");
      obj->ShortPrint();
      PrintF("\n");
    }
    sink_.Put(kBackref, "Backref");
    PutBackReference(obj, *reference);
  }
  return true;
}

bool Serializer::SerializePendingObject(Handle<HeapObject> obj) {
  PendingObjectReferences* refs_to_object =
      forward_refs_per_pending_object_.Find(obj);
  if (refs_to_object == nullptr) {
    return false;
  }

  PutPendingForwardReference(*refs_to_object);
  return true;
}

bool Serializer::ObjectIsBytecodeHandler(Handle<HeapObject> obj) const {
  if (!obj->IsCode()) return false;
  return (Code::cast(*obj).kind() == CodeKind::BYTECODE_HANDLER);
}
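
// Roots are encoded in one of two ways: the first kRootArrayConstantsCount
// roots get dedicated single-byte opcodes (see the STATIC_ASSERT below),
// while all other roots are written as kRootArray plus a varint index and
// are also added to the hot-objects working set.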
void Serializer::PutRoot(RootIndex root) {
  int root_index = static_cast<int>(root);
  Handle<HeapObject> object =
      Handle<HeapObject>::cast(isolate()->root_handle(root));
  if (FLAG_trace_serializer) {
    PrintF(" Encoding root %d:", root_index);
    object->ShortPrint();
    PrintF("\n");
  }

  // Assert that the first 32 root array items are a conscious choice. They
  // are chosen so that the most common ones can be encoded more efficiently.
  STATIC_ASSERT(static_cast<int>(RootIndex::kArgumentsMarker) ==
                kRootArrayConstantsCount - 1);

  // TODO(ulan): Check that it works with young large objects.
  if (root_index < kRootArrayConstantsCount &&
      !Heap::InYoungGeneration(*object)) {
    sink_.Put(RootArrayConstant::Encode(root), "RootConstant");
  } else {
    sink_.Put(kRootArray, "RootSerialization");
    sink_.PutInt(root_index, "root_index");
    hot_objects_.Add(*object);
  }
}

void Serializer::PutSmiRoot(FullObjectSlot slot) {
  // Serializing a smi root in compressed pointer builds will serialize the
  // full object slot (of kSystemPointerSize) to avoid complications during
  // deserialization (endianness or smi sequences).
  STATIC_ASSERT(decltype(slot)::kSlotDataSize == sizeof(Address));
  STATIC_ASSERT(decltype(slot)::kSlotDataSize == kSystemPointerSize);
  static constexpr int bytes_to_output = decltype(slot)::kSlotDataSize;
  static constexpr int size_in_tagged = bytes_to_output >> kTaggedSizeLog2;
  sink_.Put(FixedRawDataWithSize::Encode(size_in_tagged), "Smi");

  Address raw_value = Smi::cast(*slot).ptr();
  const byte* raw_value_as_bytes = reinterpret_cast<const byte*>(&raw_value);
  sink_.PutRaw(raw_value_as_bytes, bytes_to_output, "Bytes");
}

void Serializer::PutBackReference(Handle<HeapObject> object,
                                  SerializerReference reference) {
  DCHECK_EQ(*object, *back_refs_[reference.back_ref_index()]);
  sink_.PutInt(reference.back_ref_index(), "BackRefIndex");
  hot_objects_.Add(*object);
}

void Serializer::PutAttachedReference(SerializerReference reference) {
  DCHECK(reference.is_attached_reference());
  sink_.Put(kAttachedReference, "AttachedRef");
  sink_.PutInt(reference.attached_reference_index(), "AttachedRefIndex");
}

void Serializer::PutRepeat(int repeat_count) {
  if (repeat_count <= kLastEncodableFixedRepeatCount) {
    sink_.Put(FixedRepeatWithCount::Encode(repeat_count), "FixedRepeat");
  } else {
    sink_.Put(kVariableRepeat, "VariableRepeat");
    sink_.PutInt(VariableRepeatCount::Encode(repeat_count), "repeat count");
  }
}
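
// Forward references let the serializer emit a slot before the object it
// points to has been allocated in the stream. The resulting byte sequence
// is, schematically:
//
//   kRegisterPendingForwardRef       <- at each slot referring to a
//                                       pending object
//   ... the pending object itself ...
//   kResolvePendingForwardRef <id>   <- once per registered slot, after
//                                       the object has been emitted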
void Serializer::PutPendingForwardReference(PendingObjectReferences& refs) {
  sink_.Put(kRegisterPendingForwardRef, "RegisterPendingForwardRef");
  unresolved_forward_refs_++;
  // Register the current slot with the pending object.
  int forward_ref_id = next_forward_ref_id_++;
  if (refs == nullptr) {
    // The IdentityMap holding the pending object reference vectors does not
    // support non-trivial types; in particular it doesn't support destructors
    // on values. So, we manually allocate a vector with new, and delete it
    // when resolving the pending object.
    refs = new std::vector<int>();
  }
  refs->push_back(forward_ref_id);
}

void Serializer::ResolvePendingForwardReference(int forward_reference_id) {
  sink_.Put(kResolvePendingForwardRef, "ResolvePendingForwardRef");
  sink_.PutInt(forward_reference_id, "with this index");
  unresolved_forward_refs_--;

  // If there are no more unresolved forward refs, reset the forward ref id
  // to zero so that future forward refs compress better.
  if (unresolved_forward_refs_ == 0) {
    next_forward_ref_id_ = 0;
  }
}

void Serializer::RegisterObjectIsPending(Handle<HeapObject> obj) {
  if (*obj == ReadOnlyRoots(isolate()).not_mapped_symbol()) return;

  // Add the given object to the pending objects -> forward refs map.
  auto find_result = forward_refs_per_pending_object_.FindOrInsert(obj);
  USE(find_result);

  // If the above emplace didn't actually add the object, then the object must
  // already have been registered pending by deferring. It might not be in the
  // deferred objects queue though, since it may be the very object we just
  // popped off that queue, so just check that it can be deferred.
  DCHECK_IMPLIES(find_result.already_exists, *find_result.entry != nullptr);
  DCHECK_IMPLIES(find_result.already_exists, CanBeDeferred(*obj));
}

void Serializer::ResolvePendingObject(Handle<HeapObject> obj) {
  if (*obj == ReadOnlyRoots(isolate()).not_mapped_symbol()) return;

  std::vector<int>* refs;
  CHECK(forward_refs_per_pending_object_.Delete(obj, &refs));
  if (refs) {
    for (int index : *refs) {
      ResolvePendingForwardReference(index);
    }
    // See PutPendingForwardReference -- we have to manually manage the memory
    // of non-trivial IdentityMap values.
    delete refs;
  }
}

void Serializer::Pad(int padding_offset) {
  // The non-branching GetInt will read up to 3 bytes too far, so we need
  // to pad the snapshot to make sure we don't read over the end.
  for (unsigned i = 0; i < sizeof(int32_t) - 1; i++) {
    sink_.Put(kNop, "Padding");
  }
  // Pad up to pointer size for checksum.
  while (!IsAligned(sink_.Position() + padding_offset, kPointerAlignment)) {
    sink_.Put(kNop, "Padding");
  }
}

void Serializer::InitializeCodeAddressMap() {
  isolate_->InitializeLoggingAndCounters();
  code_address_map_ = std::make_unique<CodeAddressMap>(isolate_);
}

Code Serializer::CopyCode(Code code) {
  code_buffer_.clear();  // Clear buffer without deleting backing store.
  int size = code.CodeSize();
  code_buffer_.insert(code_buffer_.end(),
                      reinterpret_cast<byte*>(code.address()),
                      reinterpret_cast<byte*>(code.address() + size));
  // When pointer compression is enabled the checked cast will try to
  // decompress map field of off-heap Code object.
  return Code::unchecked_cast(HeapObject::FromAddress(
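      reinterpret_cast<Address>(&code_buffer_.front())));
}

// The prologue writes everything the deserializer needs before the object
// body: the NewObject opcode with its snapshot space, the object size, and
// the map (serialized first so allocation can use it). It also moves the
// object from "pending" to "allocated" and records a back reference for it.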
void Serializer::ObjectSerializer::SerializePrologue(SnapshotSpace space,
                                                     int size, Map map) {
  if (serializer_->code_address_map_) {
    const char* code_name =
        serializer_->code_address_map_->Lookup(object_->address());
    LOG(serializer_->isolate_,
        CodeNameEvent(object_->address(), sink_->Position(), code_name));
  }

  if (map == *object_) {
    DCHECK_EQ(*object_, ReadOnlyRoots(isolate()).meta_map());
    DCHECK_EQ(space, SnapshotSpace::kReadOnlyHeap);
    sink_->Put(kNewMetaMap, "NewMetaMap");

    DCHECK_EQ(size, Map::kSize);
  } else {
    sink_->Put(NewObject::Encode(space), "NewObject");

    // TODO(leszeks): Skip this when the map has a fixed size.
    sink_->PutInt(size >> kObjectAlignmentBits, "ObjectSizeInWords");

    // Until the space for the object is allocated, it is considered
    // "pending".
    serializer_->RegisterObjectIsPending(object_);

    // Serialize map (first word of the object) before anything else, so that
    // the deserializer can access it when allocating. Make sure that the map
    // isn't a pending object.
    DCHECK_NULL(serializer_->forward_refs_per_pending_object_.Find(map));
    DCHECK(map.IsMap());
    serializer_->SerializeObject(handle(map, isolate()));

    // Make sure the map serialization didn't accidentally recursively
    // serialize this object.
    DCHECK_IMPLIES(
        *object_ != ReadOnlyRoots(isolate()).not_mapped_symbol(),
        serializer_->reference_map()->LookupReference(object_) == nullptr);

    // Now that the object is allocated, we can resolve pending references
    // to it.
    serializer_->ResolvePendingObject(object_);
  }

  if (FLAG_serialization_statistics) {
    serializer_->CountAllocation(object_->map(), size, space);
  }

  // Mark this object as already serialized, and add it to the reference map
  // so that it can be accessed by backreference by future objects.
  serializer_->num_back_refs_++;
#ifdef DEBUG
  serializer_->back_refs_.Push(*object_);
  DCHECK_EQ(serializer_->back_refs_.size(), serializer_->num_back_refs_);
#endif
  if (*object_ != ReadOnlyRoots(isolate()).not_mapped_symbol()) {
    // Only add the object to the map if it's not not_mapped_symbol, else
    // the reference IdentityMap has issues. We don't expect to have back
    // references to the not_mapped_symbol anyway, so it's fine.
    SerializerReference back_reference =
        SerializerReference::BackReference(serializer_->num_back_refs_ - 1);
    serializer_->reference_map()->Add(*object_, back_reference);
    DCHECK_EQ(*object_,
              *serializer_->back_refs_[back_reference.back_ref_index()]);
    DCHECK_EQ(back_reference.back_ref_index(),
              serializer_->reference_map()
                  ->LookupReference(object_)
                  ->back_ref_index());
  }
}

uint32_t Serializer::ObjectSerializer::SerializeBackingStore(
    void* backing_store, int32_t byte_length) {
  const SerializerReference* reference_ptr =
      serializer_->reference_map()->LookupBackingStore(backing_store);

  // Serialize the off-heap backing store.
  if (!reference_ptr) {
    sink_->Put(kOffHeapBackingStore, "Off-heap backing store");
    sink_->PutInt(byte_length, "length");
    sink_->PutRaw(static_cast<byte*>(backing_store), byte_length,
                  "BackingStore");
    DCHECK_NE(0, serializer_->seen_backing_stores_index_);
    SerializerReference reference =
        SerializerReference::OffHeapBackingStoreReference(
            serializer_->seen_backing_stores_index_++);
    // Mark this backing store as already serialized.
    serializer_->reference_map()->AddBackingStore(backing_store, reference);
    return reference.off_heap_backing_store_index();
  } else {
    return reference_ptr->off_heap_backing_store_index();
  }
}
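
// Typed arrays either live on-heap (no external backing store) or point
// into an off-heap backing store shared with their JSArrayBuffer. In the
// off-heap case the raw data pointer cannot go into the snapshot, so it is
// replaced by a backing-store reference that the deserializer translates
// back into a pointer.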
void Serializer::ObjectSerializer::SerializeJSTypedArray() {
  Handle<JSTypedArray> typed_array = Handle<JSTypedArray>::cast(object_);
  if (typed_array->is_on_heap()) {
    typed_array->RemoveExternalPointerCompensationForSerialization(isolate());
  } else {
    if (!typed_array->WasDetached()) {
      // Explicitly serialize the backing store now.
      JSArrayBuffer buffer = JSArrayBuffer::cast(typed_array->buffer());
      // We cannot store byte_length larger than int32 range in the snapshot.
      CHECK_LE(buffer.byte_length(), std::numeric_limits<int32_t>::max());
      int32_t byte_length = static_cast<int32_t>(buffer.byte_length());
      size_t byte_offset = typed_array->byte_offset();

      // We need to calculate the backing store from the data pointer
      // because the ArrayBuffer may already have been serialized.
      void* backing_store = reinterpret_cast<void*>(
          reinterpret_cast<Address>(typed_array->DataPtr()) - byte_offset);

      uint32_t ref = SerializeBackingStore(backing_store, byte_length);
      typed_array->SetExternalBackingStoreRefForSerialization(ref);
    } else {
      typed_array->SetExternalBackingStoreRefForSerialization(0);
    }
  }
  SerializeObject();
}
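
// As with typed arrays, the buffer's backing-store pointer is swapped for a
// snapshot reference around the actual serialization and restored
// afterwards, and the extension is cleared so the output is deterministic.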
void Serializer::ObjectSerializer::SerializeJSArrayBuffer() {
  Handle<JSArrayBuffer> buffer = Handle<JSArrayBuffer>::cast(object_);
  void* backing_store = buffer->backing_store();
  // We cannot store byte_length larger than int32 range in the snapshot.
  CHECK_LE(buffer->byte_length(), std::numeric_limits<int32_t>::max());
  int32_t byte_length = static_cast<int32_t>(buffer->byte_length());
  ArrayBufferExtension* extension = buffer->extension();

  // The embedder-allocated backing store only exists for the off-heap case.
#ifdef V8_HEAP_SANDBOX
  uint32_t external_pointer_entry =
      buffer->GetBackingStoreRefForDeserialization();
#endif
  if (backing_store != nullptr) {
    uint32_t ref = SerializeBackingStore(backing_store, byte_length);
    buffer->SetBackingStoreRefForSerialization(ref);

    // Ensure deterministic output by setting extension to null during
    // serialization.
    buffer->set_extension(nullptr);
  } else {
    buffer->SetBackingStoreRefForSerialization(kNullRefSentinel);
  }

  SerializeObject();

#ifdef V8_HEAP_SANDBOX
  buffer->SetBackingStoreRefForSerialization(external_pointer_entry);
#else
  buffer->set_backing_store(isolate(), backing_store);
#endif
  buffer->set_extension(extension);
}

void Serializer::ObjectSerializer::SerializeExternalString() {
  // For external strings with known resources, we replace the resource field
  // with the encoded external reference, which we restore upon
  // deserialization. For the rest we serialize them to look like ordinary
  // sequential strings.
  Handle<ExternalString> string = Handle<ExternalString>::cast(object_);
  Address resource = string->resource_as_address();
  ExternalReferenceEncoder::Value reference;
  if (serializer_->external_reference_encoder_.TryEncode(resource).To(
          &reference)) {
    DCHECK(reference.is_from_api());
#ifdef V8_HEAP_SANDBOX
    uint32_t external_pointer_entry =
        string->GetResourceRefForDeserialization();
#endif
    string->SetResourceRefForSerialization(reference.index());
    SerializeObject();
#ifdef V8_HEAP_SANDBOX
    string->SetResourceRefForSerialization(external_pointer_entry);
#else
    string->set_address_as_resource(isolate(), resource);
#endif
  } else {
    SerializeExternalStringAsSequentialString();
  }
}
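
// The emitted bytes mimic the layout of a sequential string:
//   map (via SerializePrologue) | remaining header fields | characters |
//   zero padding up to the rounded-up allocation size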
void Serializer::ObjectSerializer::SerializeExternalStringAsSequentialString() {
  // Instead of serializing this as an external string, we serialize
  // an imaginary sequential string with the same content.
  ReadOnlyRoots roots(isolate());
  DCHECK(object_->IsExternalString());
  Handle<ExternalString> string = Handle<ExternalString>::cast(object_);
  int length = string->length();
  Map map;
  int content_size;
  int allocation_size;
  const byte* resource;
  // Find the map and size for the imaginary sequential string.
  bool internalized = object_->IsInternalizedString();
  if (object_->IsExternalOneByteString()) {
    map = internalized ? roots.one_byte_internalized_string_map()
                       : roots.one_byte_string_map();
    allocation_size = SeqOneByteString::SizeFor(length);
    content_size = length * kCharSize;
    resource = reinterpret_cast<const byte*>(
        Handle<ExternalOneByteString>::cast(string)->resource()->data());
  } else {
    map = internalized ? roots.internalized_string_map() : roots.string_map();
    allocation_size = SeqTwoByteString::SizeFor(length);
    content_size = length * kShortSize;
    resource = reinterpret_cast<const byte*>(
        Handle<ExternalTwoByteString>::cast(string)->resource()->data());
  }

  SnapshotSpace space = SnapshotSpace::kOld;
  SerializePrologue(space, allocation_size, map);

  // Output the rest of the imaginary string.
  int bytes_to_output = allocation_size - HeapObject::kHeaderSize;
  DCHECK(IsAligned(bytes_to_output, kTaggedSize));
  int slots_to_output = bytes_to_output >> kTaggedSizeLog2;

  // Output raw data header. Do not bother with common raw length cases here.
  sink_->Put(kVariableRawData, "RawDataForString");
  sink_->PutInt(slots_to_output, "length");

  // Serialize string header (except for map).
  byte* string_start = reinterpret_cast<byte*>(string->address());
  for (int i = HeapObject::kHeaderSize; i < SeqString::kHeaderSize; i++) {
    sink_->Put(string_start[i], "StringHeader");
  }

  // Serialize string content.
  sink_->PutRaw(resource, content_size, "StringContent");

  // Since the allocation size is rounded up to object alignment, there
  // may be left-over bytes that need to be padded.
  int padding_size = allocation_size - SeqString::kHeaderSize - content_size;
  DCHECK(0 <= padding_size && padding_size < kObjectAlignment);
  for (int i = 0; i < padding_size; i++)
    sink_->Put(static_cast<byte>(0), "StringPadding");
}

// Clear and later restore the next link in the weak cell or allocation site.
// TODO(all): replace this with proper iteration of weak slots in serializer.
class UnlinkWeakNextScope {
 public:
  explicit UnlinkWeakNextScope(Heap* heap, Handle<HeapObject> object) {
    if (object->IsAllocationSite() &&
        Handle<AllocationSite>::cast(object)->HasWeakNext()) {
      object_ = object;
      next_ =
          handle(AllocationSite::cast(*object).weak_next(), heap->isolate());
      Handle<AllocationSite>::cast(object)->set_weak_next(
          ReadOnlyRoots(heap).undefined_value());
    }
  }

  ~UnlinkWeakNextScope() {
    if (!object_.is_null()) {
      Handle<AllocationSite>::cast(object_)->set_weak_next(
          *next_, UPDATE_WEAK_WRITE_BARRIER);
    }
  }

 private:
  Handle<HeapObject> object_;
  Handle<Object> next_;
  DISALLOW_HEAP_ALLOCATION(no_gc_)
};

void Serializer::ObjectSerializer::Serialize() {
  RecursionScope recursion(serializer_);

  // Defer objects as "pending" if they cannot be serialized now, or if we
  // exceed a certain recursion depth. Some objects cannot be deferred.
  if ((recursion.ExceedsMaximum() && CanBeDeferred(*object_)) ||
      serializer_->MustBeDeferred(*object_)) {
    DCHECK(CanBeDeferred(*object_));
    if (FLAG_trace_serializer) {
      PrintF(" Deferring heap object: ");
      object_->ShortPrint();
      PrintF("\n");
    }
    // Deferred objects are considered "pending".
    serializer_->RegisterObjectIsPending(object_);
    serializer_->PutPendingForwardReference(
        *serializer_->forward_refs_per_pending_object_.Find(object_));
    serializer_->QueueDeferredObject(object_);
    return;
  }

  if (FLAG_trace_serializer) {
    PrintF(" Encoding heap object: ");
    object_->ShortPrint();
    PrintF("\n");
  }

  if (object_->IsExternalString()) {
    SerializeExternalString();
    return;
  } else if (!ReadOnlyHeap::Contains(*object_)) {
    // Only clear padding for strings outside the read-only heap. Strings in
    // the read-only heap should have had their padding cleared elsewhere.
    if (object_->IsSeqOneByteString()) {
      // Clear padding bytes at the end. Done here to avoid having to do this
      // at allocation sites in generated code.
      Handle<SeqOneByteString>::cast(object_)->clear_padding();
    } else if (object_->IsSeqTwoByteString()) {
      Handle<SeqTwoByteString>::cast(object_)->clear_padding();
    }
  }

  if (object_->IsJSTypedArray()) {
    SerializeJSTypedArray();
    return;
  } else if (object_->IsJSArrayBuffer()) {
    SerializeJSArrayBuffer();
    return;
  }

  // We don't expect fillers.
  DCHECK(!object_->IsFreeSpaceOrFiller());

  if (object_->IsScript()) {
    // Clear cached line ends.
    Oddball undefined = ReadOnlyRoots(isolate()).undefined_value();
    Handle<Script>