1 /* 2 * Copyright (C) 2017 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 #ifndef ART_LIBDEXFILE_DEX_COMPACT_DEX_FILE_H_ 18 #define ART_LIBDEXFILE_DEX_COMPACT_DEX_FILE_H_ 19 20 #include <memory> 21 22 #include "base/casts.h" 23 #include "dex/compact_offset_table.h" 24 #include "dex_file.h" 25 26 namespace art { 27 28 // CompactDex is a currently ART internal dex file format that aims to reduce storage/RAM usage. 29 class CompactDexFile : public DexFile { 30 public: 31 static constexpr uint8_t kDexMagic[kDexMagicSize] = { 'c', 'd', 'e', 'x' }; 32 // Last change: remove code item deduping. 33 static constexpr uint8_t kDexMagicVersion[] = {'0', '0', '1', '\0'}; 34 35 enum class FeatureFlags : uint32_t { 36 kDefaultMethods = 0x1, 37 }; 38 39 class Header : public DexFile::Header { 40 public: At(const void * at)41 static const Header* At(const void* at) { 42 return reinterpret_cast<const Header*>(at); 43 } 44 GetFeatureFlags()45 uint32_t GetFeatureFlags() const { 46 return feature_flags_; 47 } 48 GetDataOffset()49 uint32_t GetDataOffset() const { 50 return data_off_; 51 } 52 GetDataSize()53 uint32_t GetDataSize() const { 54 return data_size_; 55 } 56 57 // Range of the shared data section owned by the dex file. Owned in this context refers to data 58 // for this DEX that was not deduplicated to another DEX. OwnedDataBegin()59 uint32_t OwnedDataBegin() const { 60 return owned_data_begin_; 61 } 62 OwnedDataEnd()63 uint32_t OwnedDataEnd() const { 64 return owned_data_end_; 65 } 66 67 private: 68 uint32_t feature_flags_ = 0u; 69 70 // Position in the compact dex file for the debug info table data starts. 71 uint32_t debug_info_offsets_pos_ = 0u; 72 73 // Offset into the debug info table data where the lookup table is. 74 uint32_t debug_info_offsets_table_offset_ = 0u; 75 76 // Base offset of where debug info starts in the dex file. 77 uint32_t debug_info_base_ = 0u; 78 79 // Range of the shared data section owned by the dex file. 80 uint32_t owned_data_begin_ = 0u; 81 uint32_t owned_data_end_ = 0u; 82 83 friend class CompactDexFile; 84 friend class CompactDexWriter; 85 }; 86 87 // Like the standard code item except without a debug info offset. Each code item may have a 88 // preheader to encode large methods. In 99% of cases, the preheader is not used. This enables 89 // smaller size with a good fast path case in the accessors. 90 struct CodeItem : public dex::CodeItem { 91 static constexpr size_t kAlignment = sizeof(uint16_t); 92 // Max preheader size in uint16_ts. 93 static constexpr size_t kMaxPreHeaderSize = 6; 94 FieldsOffsetCodeItem95 static constexpr size_t FieldsOffset() { 96 return OFFSETOF_MEMBER(CodeItem, fields_); 97 } 98 InsnsCountAndFlagsOffsetCodeItem99 static constexpr size_t InsnsCountAndFlagsOffset() { 100 return OFFSETOF_MEMBER(CodeItem, insns_count_and_flags_); 101 } 102 InsnsOffsetCodeItem103 static constexpr size_t InsnsOffset() { 104 return OFFSETOF_MEMBER(CodeItem, insns_); 105 } 106 107 static constexpr size_t kRegistersSizeShift = 12; 108 static constexpr size_t kInsSizeShift = 8; 109 static constexpr size_t kOutsSizeShift = 4; 110 static constexpr size_t kTriesSizeSizeShift = 0; 111 static constexpr uint16_t kBitPreHeaderRegistersSize = 0; 112 static constexpr uint16_t kBitPreHeaderInsSize = 1; 113 static constexpr uint16_t kBitPreHeaderOutsSize = 2; 114 static constexpr uint16_t kBitPreHeaderTriesSize = 3; 115 static constexpr uint16_t kBitPreHeaderInsnsSize = 4; 116 static constexpr uint16_t kFlagPreHeaderRegistersSize = 0x1 << kBitPreHeaderRegistersSize; 117 static constexpr uint16_t kFlagPreHeaderInsSize = 0x1 << kBitPreHeaderInsSize; 118 static constexpr uint16_t kFlagPreHeaderOutsSize = 0x1 << kBitPreHeaderOutsSize; 119 static constexpr uint16_t kFlagPreHeaderTriesSize = 0x1 << kBitPreHeaderTriesSize; 120 static constexpr uint16_t kFlagPreHeaderInsnsSize = 0x1 << kBitPreHeaderInsnsSize; 121 static constexpr size_t kInsnsSizeShift = 5; 122 static constexpr size_t kInsnsSizeBits = sizeof(uint16_t) * kBitsPerByte - kInsnsSizeShift; 123 124 private: 125 CodeItem() = default; 126 127 // Combined preheader flags for fast testing if we need to go slow path. 128 static constexpr uint16_t kFlagPreHeaderCombined = 129 kFlagPreHeaderRegistersSize | 130 kFlagPreHeaderInsSize | 131 kFlagPreHeaderOutsSize | 132 kFlagPreHeaderTriesSize | 133 kFlagPreHeaderInsnsSize; 134 135 // Create a code item and associated preheader if required based on field values. 136 // Returns the start of the preheader. The preheader buffer must be at least as large as 137 // kMaxPreHeaderSize; CreateCodeItem138 uint16_t* Create(uint16_t registers_size, 139 uint16_t ins_size, 140 uint16_t outs_size, 141 uint16_t tries_size, 142 uint32_t insns_size_in_code_units, 143 uint16_t* out_preheader) { 144 // Dex verification ensures that registers size > ins_size, so we can subtract the registers 145 // size accordingly to reduce how often we need to use the preheader. 146 DCHECK_GE(registers_size, ins_size); 147 registers_size -= ins_size; 148 fields_ = (registers_size & 0xF) << kRegistersSizeShift; 149 fields_ |= (ins_size & 0xF) << kInsSizeShift; 150 fields_ |= (outs_size & 0xF) << kOutsSizeShift; 151 fields_ |= (tries_size & 0xF) << kTriesSizeSizeShift; 152 registers_size &= ~0xF; 153 ins_size &= ~0xF; 154 outs_size &= ~0xF; 155 tries_size &= ~0xF; 156 insns_count_and_flags_ = 0; 157 const size_t masked_count = insns_size_in_code_units & ((1 << kInsnsSizeBits) - 1); 158 insns_count_and_flags_ |= masked_count << kInsnsSizeShift; 159 insns_size_in_code_units -= masked_count; 160 161 // Since the preheader case is rare (1% of code items), use a suboptimally large but fast 162 // decoding format. 163 if (insns_size_in_code_units != 0) { 164 insns_count_and_flags_ |= kFlagPreHeaderInsnsSize; 165 --out_preheader; 166 *out_preheader = static_cast<uint16_t>(insns_size_in_code_units); 167 --out_preheader; 168 *out_preheader = static_cast<uint16_t>(insns_size_in_code_units >> 16); 169 } 170 auto preheader_encode = [&](uint16_t size, uint16_t flag) { 171 if (size != 0) { 172 insns_count_and_flags_ |= flag; 173 --out_preheader; 174 *out_preheader = size; 175 } 176 }; 177 preheader_encode(registers_size, kFlagPreHeaderRegistersSize); 178 preheader_encode(ins_size, kFlagPreHeaderInsSize); 179 preheader_encode(outs_size, kFlagPreHeaderOutsSize); 180 preheader_encode(tries_size, kFlagPreHeaderTriesSize); 181 return out_preheader; 182 } 183 HasPreHeaderCodeItem184 ALWAYS_INLINE bool HasPreHeader(uint16_t flag) const { 185 return (insns_count_and_flags_ & flag) != 0; 186 } 187 188 // Return true if the code item has any preheaders. HasAnyPreHeaderCodeItem189 ALWAYS_INLINE static bool HasAnyPreHeader(uint16_t insns_count_and_flags) { 190 return (insns_count_and_flags & kFlagPreHeaderCombined) != 0; 191 } 192 GetPreHeaderCodeItem193 ALWAYS_INLINE uint16_t* GetPreHeader() { 194 return reinterpret_cast<uint16_t*>(this); 195 } 196 GetPreHeaderCodeItem197 ALWAYS_INLINE const uint16_t* GetPreHeader() const { 198 return reinterpret_cast<const uint16_t*>(this); 199 } 200 201 // Decode fields and read the preheader if necessary. If kDecodeOnlyInstructionCount is 202 // specified then only the instruction count is decoded. 203 template <bool kDecodeOnlyInstructionCount> DecodeFieldsCodeItem204 ALWAYS_INLINE void DecodeFields(uint32_t* insns_count, 205 uint16_t* registers_size, 206 uint16_t* ins_size, 207 uint16_t* outs_size, 208 uint16_t* tries_size) const { 209 *insns_count = insns_count_and_flags_ >> kInsnsSizeShift; 210 if (!kDecodeOnlyInstructionCount) { 211 const uint16_t fields = fields_; 212 *registers_size = (fields >> kRegistersSizeShift) & 0xF; 213 *ins_size = (fields >> kInsSizeShift) & 0xF; 214 *outs_size = (fields >> kOutsSizeShift) & 0xF; 215 *tries_size = (fields >> kTriesSizeSizeShift) & 0xF; 216 } 217 if (UNLIKELY(HasAnyPreHeader(insns_count_and_flags_))) { 218 const uint16_t* preheader = GetPreHeader(); 219 if (HasPreHeader(kFlagPreHeaderInsnsSize)) { 220 --preheader; 221 *insns_count += static_cast<uint32_t>(*preheader); 222 --preheader; 223 *insns_count += static_cast<uint32_t>(*preheader) << 16; 224 } 225 if (!kDecodeOnlyInstructionCount) { 226 if (HasPreHeader(kFlagPreHeaderRegistersSize)) { 227 --preheader; 228 *registers_size += preheader[0]; 229 } 230 if (HasPreHeader(kFlagPreHeaderInsSize)) { 231 --preheader; 232 *ins_size += preheader[0]; 233 } 234 if (HasPreHeader(kFlagPreHeaderOutsSize)) { 235 --preheader; 236 *outs_size += preheader[0]; 237 } 238 if (HasPreHeader(kFlagPreHeaderTriesSize)) { 239 --preheader; 240 *tries_size += preheader[0]; 241 } 242 } 243 } 244 if (!kDecodeOnlyInstructionCount) { 245 *registers_size += *ins_size; 246 } 247 } 248 249 // Packed code item data, 4 bits each: [registers_size, ins_size, outs_size, tries_size] 250 uint16_t fields_; 251 252 // 5 bits for if either of the fields required preheader extension, 11 bits for the number of 253 // instruction code units. 254 uint16_t insns_count_and_flags_; 255 256 uint16_t insns_[1]; // actual array of bytecode. 257 258 ART_FRIEND_TEST(CodeItemAccessorsTest, TestDexInstructionsAccessor); 259 ART_FRIEND_TEST(CompactDexFileTest, CodeItemFields); 260 friend class CodeItemDataAccessor; 261 friend class CodeItemDebugInfoAccessor; 262 friend class CodeItemInstructionAccessor; 263 friend class CompactDexFile; 264 friend class CompactDexWriter; 265 DISALLOW_COPY_AND_ASSIGN(CodeItem); 266 }; 267 268 // Write the compact dex specific magic. 269 static void WriteMagic(uint8_t* magic); 270 271 // Write the current version, note that the input is the address of the magic. 272 static void WriteCurrentVersion(uint8_t* magic); 273 274 // Returns true if the byte string points to the magic value. 275 static bool IsMagicValid(const uint8_t* magic); IsMagicValid(DexFile::Magic magic)276 static bool IsMagicValid(DexFile::Magic magic) { return IsMagicValid(magic.data()); } 277 bool IsMagicValid() const override; 278 279 // Returns true if the byte string after the magic is the correct value. 280 static bool IsVersionValid(const uint8_t* magic); 281 bool IsVersionValid() const override; 282 283 // TODO This is completely a guess. We really need to do better. b/72402467 284 // We ask for 64 megabytes which should be big enough for any realistic dex file. GetDequickenedSize()285 size_t GetDequickenedSize() const override { 286 return 64 * MB; 287 } 288 GetHeader()289 const Header& GetHeader() const { 290 return down_cast<const Header&>(DexFile::GetHeader()); 291 } 292 293 bool SupportsDefaultMethods() const override; 294 295 uint32_t GetCodeItemSize(const dex::CodeItem& item) const override; 296 GetDebugInfoOffset(uint32_t dex_method_index)297 uint32_t GetDebugInfoOffset(uint32_t dex_method_index) const { 298 return debug_info_offsets_.GetOffset(dex_method_index); 299 } 300 301 static uint32_t CalculateChecksum(const uint8_t* base_begin, 302 size_t base_size, 303 const uint8_t* data_begin, 304 size_t data_size); 305 uint32_t CalculateChecksum() const override; 306 307 private: 308 CompactDexFile(const uint8_t* base, 309 const std::string& location, 310 uint32_t location_checksum, 311 const OatDexFile* oat_dex_file, 312 // Shared since several dex files may be stored in the same logical container. 313 std::shared_ptr<DexFileContainer> container); 314 315 CompactOffsetTable::Accessor debug_info_offsets_; 316 317 friend class DexFile; 318 friend class DexFileLoader; 319 DISALLOW_COPY_AND_ASSIGN(CompactDexFile); 320 }; 321 322 } // namespace art 323 324 #endif // ART_LIBDEXFILE_DEX_COMPACT_DEX_FILE_H_ 325