1 /*
2 * Copyright (C) 2016 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 *
16 * Implementation file of the dexlayout utility.
17 *
18 * This is a tool to read dex files into an internal representation,
19 * reorganize the representation, and emit dex files with a better
20 * file layout.
21 */
22
23 #include "dex_ir.h"
24 #include "dex_instruction-inl.h"
25 #include "dex_ir_builder.h"
26
27 namespace art {
28 namespace dex_ir {
29
ReadVarWidth(const uint8_t ** data,uint8_t length,bool sign_extend)30 static uint64_t ReadVarWidth(const uint8_t** data, uint8_t length, bool sign_extend) {
31 uint64_t value = 0;
32 for (uint32_t i = 0; i <= length; i++) {
33 value |= static_cast<uint64_t>(*(*data)++) << (i * 8);
34 }
35 if (sign_extend) {
36 int shift = (7 - length) * 8;
37 return (static_cast<int64_t>(value) << shift) >> shift;
38 }
39 return value;
40 }
41
GetPositionsCb(void * context,const DexFile::PositionInfo & entry)42 static bool GetPositionsCb(void* context, const DexFile::PositionInfo& entry) {
43 DebugInfoItem* debug_info = reinterpret_cast<DebugInfoItem*>(context);
44 PositionInfoVector& positions = debug_info->GetPositionInfo();
45 positions.push_back(std::unique_ptr<PositionInfo>(new PositionInfo(entry.address_, entry.line_)));
46 return false;
47 }
48
GetLocalsCb(void * context,const DexFile::LocalInfo & entry)49 static void GetLocalsCb(void* context, const DexFile::LocalInfo& entry) {
50 DebugInfoItem* debug_info = reinterpret_cast<DebugInfoItem*>(context);
51 LocalInfoVector& locals = debug_info->GetLocalInfo();
52 const char* name = entry.name_ != nullptr ? entry.name_ : "(null)";
53 const char* descriptor = entry.descriptor_ != nullptr ? entry.descriptor_ : "";
54 const char* signature = entry.signature_ != nullptr ? entry.signature_ : "";
55 locals.push_back(std::unique_ptr<LocalInfo>(
56 new LocalInfo(name, descriptor, signature, entry.start_address_, entry.end_address_,
57 entry.reg_)));
58 }
59
GetDebugInfoStreamSize(const uint8_t * debug_info_stream)60 static uint32_t GetDebugInfoStreamSize(const uint8_t* debug_info_stream) {
61 const uint8_t* stream = debug_info_stream;
62 DecodeUnsignedLeb128(&stream); // line_start
63 uint32_t parameters_size = DecodeUnsignedLeb128(&stream);
64 for (uint32_t i = 0; i < parameters_size; ++i) {
65 DecodeUnsignedLeb128P1(&stream); // Parameter name.
66 }
67
68 for (;;) {
69 uint8_t opcode = *stream++;
70 switch (opcode) {
71 case DexFile::DBG_END_SEQUENCE:
72 return stream - debug_info_stream; // end of stream.
73 case DexFile::DBG_ADVANCE_PC:
74 DecodeUnsignedLeb128(&stream); // addr_diff
75 break;
76 case DexFile::DBG_ADVANCE_LINE:
77 DecodeSignedLeb128(&stream); // line_diff
78 break;
79 case DexFile::DBG_START_LOCAL:
80 DecodeUnsignedLeb128(&stream); // register_num
81 DecodeUnsignedLeb128P1(&stream); // name_idx
82 DecodeUnsignedLeb128P1(&stream); // type_idx
83 break;
84 case DexFile::DBG_START_LOCAL_EXTENDED:
85 DecodeUnsignedLeb128(&stream); // register_num
86 DecodeUnsignedLeb128P1(&stream); // name_idx
87 DecodeUnsignedLeb128P1(&stream); // type_idx
88 DecodeUnsignedLeb128P1(&stream); // sig_idx
89 break;
90 case DexFile::DBG_END_LOCAL:
91 case DexFile::DBG_RESTART_LOCAL:
92 DecodeUnsignedLeb128(&stream); // register_num
93 break;
94 case DexFile::DBG_SET_PROLOGUE_END:
95 case DexFile::DBG_SET_EPILOGUE_BEGIN:
96 break;
97 case DexFile::DBG_SET_FILE: {
98 DecodeUnsignedLeb128P1(&stream); // name_idx
99 break;
100 }
101 default: {
102 break;
103 }
104 }
105 }
106 }
107
GetIdFromInstruction(Collections & collections,const Instruction * dec_insn,std::vector<TypeId * > * type_ids,std::vector<StringId * > * string_ids,std::vector<MethodId * > * method_ids,std::vector<FieldId * > * field_ids)108 static bool GetIdFromInstruction(Collections& collections,
109 const Instruction* dec_insn,
110 std::vector<TypeId*>* type_ids,
111 std::vector<StringId*>* string_ids,
112 std::vector<MethodId*>* method_ids,
113 std::vector<FieldId*>* field_ids) {
114 // Determine index and width of the string.
115 uint32_t index = 0;
116 switch (Instruction::FormatOf(dec_insn->Opcode())) {
117 // SOME NOT SUPPORTED:
118 // case Instruction::k20bc:
119 case Instruction::k21c:
120 case Instruction::k35c:
121 // case Instruction::k35ms:
122 case Instruction::k3rc:
123 // case Instruction::k3rms:
124 // case Instruction::k35mi:
125 // case Instruction::k3rmi:
126 case Instruction::k45cc:
127 case Instruction::k4rcc:
128 index = dec_insn->VRegB();
129 break;
130 case Instruction::k31c:
131 index = dec_insn->VRegB();
132 break;
133 case Instruction::k22c:
134 // case Instruction::k22cs:
135 index = dec_insn->VRegC();
136 break;
137 default:
138 break;
139 } // switch
140
141 // Determine index type, and add reference to the appropriate collection.
142 switch (Instruction::IndexTypeOf(dec_insn->Opcode())) {
143 case Instruction::kIndexTypeRef:
144 if (index < collections.TypeIdsSize()) {
145 type_ids->push_back(collections.GetTypeId(index));
146 return true;
147 }
148 break;
149 case Instruction::kIndexStringRef:
150 if (index < collections.StringIdsSize()) {
151 string_ids->push_back(collections.GetStringId(index));
152 return true;
153 }
154 break;
155 case Instruction::kIndexMethodRef:
156 case Instruction::kIndexMethodAndProtoRef:
157 if (index < collections.MethodIdsSize()) {
158 method_ids->push_back(collections.GetMethodId(index));
159 return true;
160 }
161 break;
162 case Instruction::kIndexFieldRef:
163 if (index < collections.FieldIdsSize()) {
164 field_ids->push_back(collections.GetFieldId(index));
165 return true;
166 }
167 break;
168 case Instruction::kIndexUnknown:
169 case Instruction::kIndexNone:
170 case Instruction::kIndexVtableOffset:
171 case Instruction::kIndexFieldOffset:
172 default:
173 break;
174 } // switch
175 return false;
176 }
177
178 /*
179 * Get all the types, strings, methods, and fields referred to from bytecode.
180 */
GetIdsFromByteCode(Collections & collections,const CodeItem * code,std::vector<TypeId * > * type_ids,std::vector<StringId * > * string_ids,std::vector<MethodId * > * method_ids,std::vector<FieldId * > * field_ids)181 static bool GetIdsFromByteCode(Collections& collections,
182 const CodeItem* code,
183 std::vector<TypeId*>* type_ids,
184 std::vector<StringId*>* string_ids,
185 std::vector<MethodId*>* method_ids,
186 std::vector<FieldId*>* field_ids) {
187 bool has_id = false;
188 // Iterate over all instructions.
189 const uint16_t* insns = code->Insns();
190 for (uint32_t insn_idx = 0; insn_idx < code->InsnsSize();) {
191 const Instruction* instruction = Instruction::At(&insns[insn_idx]);
192 const uint32_t insn_width = instruction->SizeInCodeUnits();
193 if (insn_width == 0) {
194 break;
195 }
196 has_id |= GetIdFromInstruction(collections,
197 instruction,
198 type_ids,
199 string_ids,
200 method_ids,
201 field_ids);
202 insn_idx += insn_width;
203 } // for
204 return has_id;
205 }
206
ReadEncodedValue(const uint8_t ** data)207 EncodedValue* Collections::ReadEncodedValue(const uint8_t** data) {
208 const uint8_t encoded_value = *(*data)++;
209 const uint8_t type = encoded_value & 0x1f;
210 EncodedValue* item = new EncodedValue(type);
211 ReadEncodedValue(data, type, encoded_value >> 5, item);
212 return item;
213 }
214
ReadEncodedValue(const uint8_t ** data,uint8_t type,uint8_t length)215 EncodedValue* Collections::ReadEncodedValue(const uint8_t** data, uint8_t type, uint8_t length) {
216 EncodedValue* item = new EncodedValue(type);
217 ReadEncodedValue(data, type, length, item);
218 return item;
219 }
220
ReadEncodedValue(const uint8_t ** data,uint8_t type,uint8_t length,EncodedValue * item)221 void Collections::ReadEncodedValue(
222 const uint8_t** data, uint8_t type, uint8_t length, EncodedValue* item) {
223 switch (type) {
224 case DexFile::kDexAnnotationByte:
225 item->SetByte(static_cast<int8_t>(ReadVarWidth(data, length, false)));
226 break;
227 case DexFile::kDexAnnotationShort:
228 item->SetShort(static_cast<int16_t>(ReadVarWidth(data, length, true)));
229 break;
230 case DexFile::kDexAnnotationChar:
231 item->SetChar(static_cast<uint16_t>(ReadVarWidth(data, length, false)));
232 break;
233 case DexFile::kDexAnnotationInt:
234 item->SetInt(static_cast<int32_t>(ReadVarWidth(data, length, true)));
235 break;
236 case DexFile::kDexAnnotationLong:
237 item->SetLong(static_cast<int64_t>(ReadVarWidth(data, length, true)));
238 break;
239 case DexFile::kDexAnnotationFloat: {
240 // Fill on right.
241 union {
242 float f;
243 uint32_t data;
244 } conv;
245 conv.data = static_cast<uint32_t>(ReadVarWidth(data, length, false)) << (3 - length) * 8;
246 item->SetFloat(conv.f);
247 break;
248 }
249 case DexFile::kDexAnnotationDouble: {
250 // Fill on right.
251 union {
252 double d;
253 uint64_t data;
254 } conv;
255 conv.data = ReadVarWidth(data, length, false) << (7 - length) * 8;
256 item->SetDouble(conv.d);
257 break;
258 }
259 case DexFile::kDexAnnotationMethodType: {
260 const uint32_t proto_index = static_cast<uint32_t>(ReadVarWidth(data, length, false));
261 item->SetProtoId(GetProtoId(proto_index));
262 break;
263 }
264 case DexFile::kDexAnnotationMethodHandle: {
265 const uint32_t method_handle_index = static_cast<uint32_t>(ReadVarWidth(data, length, false));
266 item->SetMethodHandle(GetMethodHandle(method_handle_index));
267 break;
268 }
269 case DexFile::kDexAnnotationString: {
270 const uint32_t string_index = static_cast<uint32_t>(ReadVarWidth(data, length, false));
271 item->SetStringId(GetStringId(string_index));
272 break;
273 }
274 case DexFile::kDexAnnotationType: {
275 const uint32_t string_index = static_cast<uint32_t>(ReadVarWidth(data, length, false));
276 item->SetTypeId(GetTypeId(string_index));
277 break;
278 }
279 case DexFile::kDexAnnotationField:
280 case DexFile::kDexAnnotationEnum: {
281 const uint32_t field_index = static_cast<uint32_t>(ReadVarWidth(data, length, false));
282 item->SetFieldId(GetFieldId(field_index));
283 break;
284 }
285 case DexFile::kDexAnnotationMethod: {
286 const uint32_t method_index = static_cast<uint32_t>(ReadVarWidth(data, length, false));
287 item->SetMethodId(GetMethodId(method_index));
288 break;
289 }
290 case DexFile::kDexAnnotationArray: {
291 EncodedValueVector* values = new EncodedValueVector();
292 const uint32_t size = DecodeUnsignedLeb128(data);
293 // Decode all elements.
294 for (uint32_t i = 0; i < size; i++) {
295 values->push_back(std::unique_ptr<EncodedValue>(ReadEncodedValue(data)));
296 }
297 item->SetEncodedArray(new EncodedArrayItem(values));
298 break;
299 }
300 case DexFile::kDexAnnotationAnnotation: {
301 AnnotationElementVector* elements = new AnnotationElementVector();
302 const uint32_t type_idx = DecodeUnsignedLeb128(data);
303 const uint32_t size = DecodeUnsignedLeb128(data);
304 // Decode all name=value pairs.
305 for (uint32_t i = 0; i < size; i++) {
306 const uint32_t name_index = DecodeUnsignedLeb128(data);
307 elements->push_back(std::unique_ptr<AnnotationElement>(
308 new AnnotationElement(GetStringId(name_index), ReadEncodedValue(data))));
309 }
310 item->SetEncodedAnnotation(new EncodedAnnotation(GetTypeId(type_idx), elements));
311 break;
312 }
313 case DexFile::kDexAnnotationNull:
314 break;
315 case DexFile::kDexAnnotationBoolean:
316 item->SetBoolean(length != 0);
317 break;
318 default:
319 break;
320 }
321 }
322
CreateStringId(const DexFile & dex_file,uint32_t i)323 void Collections::CreateStringId(const DexFile& dex_file, uint32_t i) {
324 const DexFile::StringId& disk_string_id = dex_file.GetStringId(dex::StringIndex(i));
325 StringData* string_data = new StringData(dex_file.GetStringData(disk_string_id));
326 string_datas_.AddItem(string_data, disk_string_id.string_data_off_);
327
328 StringId* string_id = new StringId(string_data);
329 string_ids_.AddIndexedItem(string_id, StringIdsOffset() + i * StringId::ItemSize(), i);
330 }
331
CreateTypeId(const DexFile & dex_file,uint32_t i)332 void Collections::CreateTypeId(const DexFile& dex_file, uint32_t i) {
333 const DexFile::TypeId& disk_type_id = dex_file.GetTypeId(dex::TypeIndex(i));
334 TypeId* type_id = new TypeId(GetStringId(disk_type_id.descriptor_idx_.index_));
335 type_ids_.AddIndexedItem(type_id, TypeIdsOffset() + i * TypeId::ItemSize(), i);
336 }
337
CreateProtoId(const DexFile & dex_file,uint32_t i)338 void Collections::CreateProtoId(const DexFile& dex_file, uint32_t i) {
339 const DexFile::ProtoId& disk_proto_id = dex_file.GetProtoId(i);
340 const DexFile::TypeList* type_list = dex_file.GetProtoParameters(disk_proto_id);
341 TypeList* parameter_type_list = CreateTypeList(type_list, disk_proto_id.parameters_off_);
342
343 ProtoId* proto_id = new ProtoId(GetStringId(disk_proto_id.shorty_idx_.index_),
344 GetTypeId(disk_proto_id.return_type_idx_.index_),
345 parameter_type_list);
346 proto_ids_.AddIndexedItem(proto_id, ProtoIdsOffset() + i * ProtoId::ItemSize(), i);
347 }
348
CreateFieldId(const DexFile & dex_file,uint32_t i)349 void Collections::CreateFieldId(const DexFile& dex_file, uint32_t i) {
350 const DexFile::FieldId& disk_field_id = dex_file.GetFieldId(i);
351 FieldId* field_id = new FieldId(GetTypeId(disk_field_id.class_idx_.index_),
352 GetTypeId(disk_field_id.type_idx_.index_),
353 GetStringId(disk_field_id.name_idx_.index_));
354 field_ids_.AddIndexedItem(field_id, FieldIdsOffset() + i * FieldId::ItemSize(), i);
355 }
356
CreateMethodId(const DexFile & dex_file,uint32_t i)357 void Collections::CreateMethodId(const DexFile& dex_file, uint32_t i) {
358 const DexFile::MethodId& disk_method_id = dex_file.GetMethodId(i);
359 MethodId* method_id = new MethodId(GetTypeId(disk_method_id.class_idx_.index_),
360 GetProtoId(disk_method_id.proto_idx_),
361 GetStringId(disk_method_id.name_idx_.index_));
362 method_ids_.AddIndexedItem(method_id, MethodIdsOffset() + i * MethodId::ItemSize(), i);
363 }
364
CreateClassDef(const DexFile & dex_file,uint32_t i)365 void Collections::CreateClassDef(const DexFile& dex_file, uint32_t i) {
366 const DexFile::ClassDef& disk_class_def = dex_file.GetClassDef(i);
367 const TypeId* class_type = GetTypeId(disk_class_def.class_idx_.index_);
368 uint32_t access_flags = disk_class_def.access_flags_;
369 const TypeId* superclass = GetTypeIdOrNullPtr(disk_class_def.superclass_idx_.index_);
370
371 const DexFile::TypeList* type_list = dex_file.GetInterfacesList(disk_class_def);
372 TypeList* interfaces_type_list = CreateTypeList(type_list, disk_class_def.interfaces_off_);
373
374 const StringId* source_file = GetStringIdOrNullPtr(disk_class_def.source_file_idx_.index_);
375 // Annotations.
376 AnnotationsDirectoryItem* annotations = nullptr;
377 const DexFile::AnnotationsDirectoryItem* disk_annotations_directory_item =
378 dex_file.GetAnnotationsDirectory(disk_class_def);
379 if (disk_annotations_directory_item != nullptr) {
380 annotations = CreateAnnotationsDirectoryItem(
381 dex_file, disk_annotations_directory_item, disk_class_def.annotations_off_);
382 }
383 // Static field initializers.
384 const uint8_t* static_data = dex_file.GetEncodedStaticFieldValuesArray(disk_class_def);
385 EncodedArrayItem* static_values =
386 CreateEncodedArrayItem(static_data, disk_class_def.static_values_off_);
387 ClassData* class_data = CreateClassData(
388 dex_file, dex_file.GetClassData(disk_class_def), disk_class_def.class_data_off_);
389 ClassDef* class_def = new ClassDef(class_type, access_flags, superclass, interfaces_type_list,
390 source_file, annotations, static_values, class_data);
391 class_defs_.AddIndexedItem(class_def, ClassDefsOffset() + i * ClassDef::ItemSize(), i);
392 }
393
CreateTypeList(const DexFile::TypeList * dex_type_list,uint32_t offset)394 TypeList* Collections::CreateTypeList(const DexFile::TypeList* dex_type_list, uint32_t offset) {
395 if (dex_type_list == nullptr) {
396 return nullptr;
397 }
398 auto found_type_list = TypeLists().find(offset);
399 if (found_type_list != TypeLists().end()) {
400 return found_type_list->second.get();
401 }
402 TypeIdVector* type_vector = new TypeIdVector();
403 uint32_t size = dex_type_list->Size();
404 for (uint32_t index = 0; index < size; ++index) {
405 type_vector->push_back(GetTypeId(dex_type_list->GetTypeItem(index).type_idx_.index_));
406 }
407 TypeList* new_type_list = new TypeList(type_vector);
408 type_lists_.AddItem(new_type_list, offset);
409 return new_type_list;
410 }
411
CreateEncodedArrayItem(const uint8_t * static_data,uint32_t offset)412 EncodedArrayItem* Collections::CreateEncodedArrayItem(const uint8_t* static_data, uint32_t offset) {
413 if (static_data == nullptr) {
414 return nullptr;
415 }
416 auto found_encoded_array_item = EncodedArrayItems().find(offset);
417 if (found_encoded_array_item != EncodedArrayItems().end()) {
418 return found_encoded_array_item->second.get();
419 }
420 uint32_t size = DecodeUnsignedLeb128(&static_data);
421 EncodedValueVector* values = new EncodedValueVector();
422 for (uint32_t i = 0; i < size; ++i) {
423 values->push_back(std::unique_ptr<EncodedValue>(ReadEncodedValue(&static_data)));
424 }
425 // TODO: Calculate the size of the encoded array.
426 EncodedArrayItem* encoded_array_item = new EncodedArrayItem(values);
427 encoded_array_items_.AddItem(encoded_array_item, offset);
428 return encoded_array_item;
429 }
430
CreateAnnotationItem(const DexFile::AnnotationItem * annotation,uint32_t offset)431 AnnotationItem* Collections::CreateAnnotationItem(const DexFile::AnnotationItem* annotation,
432 uint32_t offset) {
433 auto found_annotation_item = AnnotationItems().find(offset);
434 if (found_annotation_item != AnnotationItems().end()) {
435 return found_annotation_item->second.get();
436 }
437 uint8_t visibility = annotation->visibility_;
438 const uint8_t* annotation_data = annotation->annotation_;
439 std::unique_ptr<EncodedValue> encoded_value(
440 ReadEncodedValue(&annotation_data, DexFile::kDexAnnotationAnnotation, 0));
441 // TODO: Calculate the size of the annotation.
442 AnnotationItem* annotation_item =
443 new AnnotationItem(visibility, encoded_value->ReleaseEncodedAnnotation());
444 annotation_items_.AddItem(annotation_item, offset);
445 return annotation_item;
446 }
447
448
CreateAnnotationSetItem(const DexFile & dex_file,const DexFile::AnnotationSetItem * disk_annotations_item,uint32_t offset)449 AnnotationSetItem* Collections::CreateAnnotationSetItem(const DexFile& dex_file,
450 const DexFile::AnnotationSetItem* disk_annotations_item, uint32_t offset) {
451 if (disk_annotations_item == nullptr || (disk_annotations_item->size_ == 0 && offset == 0)) {
452 return nullptr;
453 }
454 auto found_anno_set_item = AnnotationSetItems().find(offset);
455 if (found_anno_set_item != AnnotationSetItems().end()) {
456 return found_anno_set_item->second.get();
457 }
458 std::vector<AnnotationItem*>* items = new std::vector<AnnotationItem*>();
459 for (uint32_t i = 0; i < disk_annotations_item->size_; ++i) {
460 const DexFile::AnnotationItem* annotation =
461 dex_file.GetAnnotationItem(disk_annotations_item, i);
462 if (annotation == nullptr) {
463 continue;
464 }
465 AnnotationItem* annotation_item =
466 CreateAnnotationItem(annotation, disk_annotations_item->entries_[i]);
467 items->push_back(annotation_item);
468 }
469 AnnotationSetItem* annotation_set_item = new AnnotationSetItem(items);
470 annotation_set_items_.AddItem(annotation_set_item, offset);
471 return annotation_set_item;
472 }
473
CreateAnnotationsDirectoryItem(const DexFile & dex_file,const DexFile::AnnotationsDirectoryItem * disk_annotations_item,uint32_t offset)474 AnnotationsDirectoryItem* Collections::CreateAnnotationsDirectoryItem(const DexFile& dex_file,
475 const DexFile::AnnotationsDirectoryItem* disk_annotations_item, uint32_t offset) {
476 auto found_anno_dir_item = AnnotationsDirectoryItems().find(offset);
477 if (found_anno_dir_item != AnnotationsDirectoryItems().end()) {
478 return found_anno_dir_item->second.get();
479 }
480 const DexFile::AnnotationSetItem* class_set_item =
481 dex_file.GetClassAnnotationSet(disk_annotations_item);
482 AnnotationSetItem* class_annotation = nullptr;
483 if (class_set_item != nullptr) {
484 uint32_t item_offset = disk_annotations_item->class_annotations_off_;
485 class_annotation = CreateAnnotationSetItem(dex_file, class_set_item, item_offset);
486 }
487 const DexFile::FieldAnnotationsItem* fields =
488 dex_file.GetFieldAnnotations(disk_annotations_item);
489 FieldAnnotationVector* field_annotations = nullptr;
490 if (fields != nullptr) {
491 field_annotations = new FieldAnnotationVector();
492 for (uint32_t i = 0; i < disk_annotations_item->fields_size_; ++i) {
493 FieldId* field_id = GetFieldId(fields[i].field_idx_);
494 const DexFile::AnnotationSetItem* field_set_item =
495 dex_file.GetFieldAnnotationSetItem(fields[i]);
496 uint32_t annotation_set_offset = fields[i].annotations_off_;
497 AnnotationSetItem* annotation_set_item =
498 CreateAnnotationSetItem(dex_file, field_set_item, annotation_set_offset);
499 field_annotations->push_back(std::unique_ptr<FieldAnnotation>(
500 new FieldAnnotation(field_id, annotation_set_item)));
501 }
502 }
503 const DexFile::MethodAnnotationsItem* methods =
504 dex_file.GetMethodAnnotations(disk_annotations_item);
505 MethodAnnotationVector* method_annotations = nullptr;
506 if (methods != nullptr) {
507 method_annotations = new MethodAnnotationVector();
508 for (uint32_t i = 0; i < disk_annotations_item->methods_size_; ++i) {
509 MethodId* method_id = GetMethodId(methods[i].method_idx_);
510 const DexFile::AnnotationSetItem* method_set_item =
511 dex_file.GetMethodAnnotationSetItem(methods[i]);
512 uint32_t annotation_set_offset = methods[i].annotations_off_;
513 AnnotationSetItem* annotation_set_item =
514 CreateAnnotationSetItem(dex_file, method_set_item, annotation_set_offset);
515 method_annotations->push_back(std::unique_ptr<MethodAnnotation>(
516 new MethodAnnotation(method_id, annotation_set_item)));
517 }
518 }
519 const DexFile::ParameterAnnotationsItem* parameters =
520 dex_file.GetParameterAnnotations(disk_annotations_item);
521 ParameterAnnotationVector* parameter_annotations = nullptr;
522 if (parameters != nullptr) {
523 parameter_annotations = new ParameterAnnotationVector();
524 for (uint32_t i = 0; i < disk_annotations_item->parameters_size_; ++i) {
525 MethodId* method_id = GetMethodId(parameters[i].method_idx_);
526 const DexFile::AnnotationSetRefList* list =
527 dex_file.GetParameterAnnotationSetRefList(¶meters[i]);
528 parameter_annotations->push_back(std::unique_ptr<ParameterAnnotation>(
529 GenerateParameterAnnotation(dex_file, method_id, list, parameters[i].annotations_off_)));
530 }
531 }
532 // TODO: Calculate the size of the annotations directory.
533 AnnotationsDirectoryItem* annotations_directory_item = new AnnotationsDirectoryItem(
534 class_annotation, field_annotations, method_annotations, parameter_annotations);
535 annotations_directory_items_.AddItem(annotations_directory_item, offset);
536 return annotations_directory_item;
537 }
538
GenerateParameterAnnotation(const DexFile & dex_file,MethodId * method_id,const DexFile::AnnotationSetRefList * annotation_set_ref_list,uint32_t offset)539 ParameterAnnotation* Collections::GenerateParameterAnnotation(
540 const DexFile& dex_file, MethodId* method_id,
541 const DexFile::AnnotationSetRefList* annotation_set_ref_list, uint32_t offset) {
542 AnnotationSetRefList* set_ref_list = nullptr;
543 auto found_set_ref_list = AnnotationSetRefLists().find(offset);
544 if (found_set_ref_list != AnnotationSetRefLists().end()) {
545 set_ref_list = found_set_ref_list->second.get();
546 }
547 if (set_ref_list == nullptr) {
548 std::vector<AnnotationSetItem*>* annotations = new std::vector<AnnotationSetItem*>();
549 for (uint32_t i = 0; i < annotation_set_ref_list->size_; ++i) {
550 const DexFile::AnnotationSetItem* annotation_set_item =
551 dex_file.GetSetRefItemItem(&annotation_set_ref_list->list_[i]);
552 uint32_t set_offset = annotation_set_ref_list->list_[i].annotations_off_;
553 annotations->push_back(CreateAnnotationSetItem(dex_file, annotation_set_item, set_offset));
554 }
555 set_ref_list = new AnnotationSetRefList(annotations);
556 annotation_set_ref_lists_.AddItem(set_ref_list, offset);
557 }
558 return new ParameterAnnotation(method_id, set_ref_list);
559 }
560
CreateCodeItem(const DexFile & dex_file,const DexFile::CodeItem & disk_code_item,uint32_t offset)561 CodeItem* Collections::CreateCodeItem(const DexFile& dex_file,
562 const DexFile::CodeItem& disk_code_item, uint32_t offset) {
563 uint16_t registers_size = disk_code_item.registers_size_;
564 uint16_t ins_size = disk_code_item.ins_size_;
565 uint16_t outs_size = disk_code_item.outs_size_;
566 uint32_t tries_size = disk_code_item.tries_size_;
567
568 // TODO: Calculate the size of the debug info.
569 const uint8_t* debug_info_stream = dex_file.GetDebugInfoStream(&disk_code_item);
570 DebugInfoItem* debug_info = nullptr;
571 if (debug_info_stream != nullptr) {
572 debug_info = debug_info_items_.GetExistingObject(disk_code_item.debug_info_off_);
573 if (debug_info == nullptr) {
574 uint32_t debug_info_size = GetDebugInfoStreamSize(debug_info_stream);
575 uint8_t* debug_info_buffer = new uint8_t[debug_info_size];
576 memcpy(debug_info_buffer, debug_info_stream, debug_info_size);
577 debug_info = new DebugInfoItem(debug_info_size, debug_info_buffer);
578 debug_info_items_.AddItem(debug_info, disk_code_item.debug_info_off_);
579 }
580 }
581
582 uint32_t insns_size = disk_code_item.insns_size_in_code_units_;
583 uint16_t* insns = new uint16_t[insns_size];
584 memcpy(insns, disk_code_item.insns_, insns_size * sizeof(uint16_t));
585
586 TryItemVector* tries = nullptr;
587 CatchHandlerVector* handler_list = nullptr;
588 if (tries_size > 0) {
589 tries = new TryItemVector();
590 handler_list = new CatchHandlerVector();
591 for (uint32_t i = 0; i < tries_size; ++i) {
592 const DexFile::TryItem* disk_try_item = dex_file.GetTryItems(disk_code_item, i);
593 uint32_t start_addr = disk_try_item->start_addr_;
594 uint16_t insn_count = disk_try_item->insn_count_;
595 uint16_t handler_off = disk_try_item->handler_off_;
596 const CatchHandler* handlers = nullptr;
597 for (std::unique_ptr<const CatchHandler>& existing_handlers : *handler_list) {
598 if (handler_off == existing_handlers->GetListOffset()) {
599 handlers = existing_handlers.get();
600 break;
601 }
602 }
603 if (handlers == nullptr) {
604 bool catch_all = false;
605 TypeAddrPairVector* addr_pairs = new TypeAddrPairVector();
606 for (CatchHandlerIterator it(disk_code_item, *disk_try_item); it.HasNext(); it.Next()) {
607 const dex::TypeIndex type_index = it.GetHandlerTypeIndex();
608 const TypeId* type_id = GetTypeIdOrNullPtr(type_index.index_);
609 catch_all |= type_id == nullptr;
610 addr_pairs->push_back(std::unique_ptr<const TypeAddrPair>(
611 new TypeAddrPair(type_id, it.GetHandlerAddress())));
612 }
613 handlers = new CatchHandler(catch_all, handler_off, addr_pairs);
614 handler_list->push_back(std::unique_ptr<const CatchHandler>(handlers));
615 }
616 TryItem* try_item = new TryItem(start_addr, insn_count, handlers);
617 tries->push_back(std::unique_ptr<const TryItem>(try_item));
618 }
619 // Manually walk catch handlers list and add any missing handlers unreferenced by try items.
620 const uint8_t* handlers_base = DexFile::GetCatchHandlerData(disk_code_item, 0);
621 const uint8_t* handlers_data = handlers_base;
622 uint32_t handlers_size = DecodeUnsignedLeb128(&handlers_data);
623 while (handlers_size > handler_list->size()) {
624 bool already_added = false;
625 uint16_t handler_off = handlers_data - handlers_base;
626 for (std::unique_ptr<const CatchHandler>& existing_handlers : *handler_list) {
627 if (handler_off == existing_handlers->GetListOffset()) {
628 already_added = true;
629 break;
630 }
631 }
632 int32_t size = DecodeSignedLeb128(&handlers_data);
633 bool has_catch_all = size <= 0;
634 if (has_catch_all) {
635 size = -size;
636 }
637 if (already_added) {
638 for (int32_t i = 0; i < size; i++) {
639 DecodeUnsignedLeb128(&handlers_data);
640 DecodeUnsignedLeb128(&handlers_data);
641 }
642 if (has_catch_all) {
643 DecodeUnsignedLeb128(&handlers_data);
644 }
645 continue;
646 }
647 TypeAddrPairVector* addr_pairs = new TypeAddrPairVector();
648 for (int32_t i = 0; i < size; i++) {
649 const TypeId* type_id = GetTypeIdOrNullPtr(DecodeUnsignedLeb128(&handlers_data));
650 uint32_t addr = DecodeUnsignedLeb128(&handlers_data);
651 addr_pairs->push_back(
652 std::unique_ptr<const TypeAddrPair>(new TypeAddrPair(type_id, addr)));
653 }
654 if (has_catch_all) {
655 uint32_t addr = DecodeUnsignedLeb128(&handlers_data);
656 addr_pairs->push_back(
657 std::unique_ptr<const TypeAddrPair>(new TypeAddrPair(nullptr, addr)));
658 }
659 const CatchHandler* handler = new CatchHandler(has_catch_all, handler_off, addr_pairs);
660 handler_list->push_back(std::unique_ptr<const CatchHandler>(handler));
661 }
662 }
663
664 uint32_t size = DexFile::GetCodeItemSize(disk_code_item);
665 CodeItem* code_item = new CodeItem(
666 registers_size, ins_size, outs_size, debug_info, insns_size, insns, tries, handler_list);
667 code_item->SetSize(size);
668 code_items_.AddItem(code_item, offset);
669 // Add "fixup" references to types, strings, methods, and fields.
670 // This is temporary, as we will probably want more detailed parsing of the
671 // instructions here.
672 std::unique_ptr<std::vector<TypeId*>> type_ids(new std::vector<TypeId*>());
673 std::unique_ptr<std::vector<StringId*>> string_ids(new std::vector<StringId*>());
674 std::unique_ptr<std::vector<MethodId*>> method_ids(new std::vector<MethodId*>());
675 std::unique_ptr<std::vector<FieldId*>> field_ids(new std::vector<FieldId*>());
676 if (GetIdsFromByteCode(*this,
677 code_item,
678 type_ids.get(),
679 string_ids.get(),
680 method_ids.get(),
681 field_ids.get())) {
682 CodeFixups* fixups = new CodeFixups(type_ids.release(),
683 string_ids.release(),
684 method_ids.release(),
685 field_ids.release());
686 code_item->SetCodeFixups(fixups);
687 }
688
689 return code_item;
690 }
691
GenerateMethodItem(const DexFile & dex_file,ClassDataItemIterator & cdii)692 MethodItem* Collections::GenerateMethodItem(const DexFile& dex_file, ClassDataItemIterator& cdii) {
693 MethodId* method_id = GetMethodId(cdii.GetMemberIndex());
694 uint32_t access_flags = cdii.GetRawMemberAccessFlags();
695 const DexFile::CodeItem* disk_code_item = cdii.GetMethodCodeItem();
696 CodeItem* code_item = code_items_.GetExistingObject(cdii.GetMethodCodeItemOffset());
697 DebugInfoItem* debug_info = nullptr;
698 if (disk_code_item != nullptr) {
699 if (code_item == nullptr) {
700 code_item = CreateCodeItem(dex_file, *disk_code_item, cdii.GetMethodCodeItemOffset());
701 }
702 debug_info = code_item->DebugInfo();
703 }
704 if (debug_info != nullptr) {
705 bool is_static = (access_flags & kAccStatic) != 0;
706 dex_file.DecodeDebugLocalInfo(
707 disk_code_item, is_static, cdii.GetMemberIndex(), GetLocalsCb, debug_info);
708 dex_file.DecodeDebugPositionInfo(disk_code_item, GetPositionsCb, debug_info);
709 }
710 return new MethodItem(access_flags, method_id, code_item);
711 }
712
CreateClassData(const DexFile & dex_file,const uint8_t * encoded_data,uint32_t offset)713 ClassData* Collections::CreateClassData(
714 const DexFile& dex_file, const uint8_t* encoded_data, uint32_t offset) {
715 // Read the fields and methods defined by the class, resolving the circular reference from those
716 // to classes by setting class at the same time.
717 ClassData* class_data = class_datas_.GetExistingObject(offset);
718 if (class_data == nullptr && encoded_data != nullptr) {
719 ClassDataItemIterator cdii(dex_file, encoded_data);
720 // Static fields.
721 FieldItemVector* static_fields = new FieldItemVector();
722 for (; cdii.HasNextStaticField(); cdii.Next()) {
723 FieldId* field_item = GetFieldId(cdii.GetMemberIndex());
724 uint32_t access_flags = cdii.GetRawMemberAccessFlags();
725 static_fields->push_back(std::unique_ptr<FieldItem>(new FieldItem(access_flags, field_item)));
726 }
727 // Instance fields.
728 FieldItemVector* instance_fields = new FieldItemVector();
729 for (; cdii.HasNextInstanceField(); cdii.Next()) {
730 FieldId* field_item = GetFieldId(cdii.GetMemberIndex());
731 uint32_t access_flags = cdii.GetRawMemberAccessFlags();
732 instance_fields->push_back(
733 std::unique_ptr<FieldItem>(new FieldItem(access_flags, field_item)));
734 }
735 // Direct methods.
736 MethodItemVector* direct_methods = new MethodItemVector();
737 for (; cdii.HasNextDirectMethod(); cdii.Next()) {
738 direct_methods->push_back(std::unique_ptr<MethodItem>(GenerateMethodItem(dex_file, cdii)));
739 }
740 // Virtual methods.
741 MethodItemVector* virtual_methods = new MethodItemVector();
742 for (; cdii.HasNextVirtualMethod(); cdii.Next()) {
743 virtual_methods->push_back(std::unique_ptr<MethodItem>(GenerateMethodItem(dex_file, cdii)));
744 }
745 class_data = new ClassData(static_fields, instance_fields, direct_methods, virtual_methods);
746 class_data->SetSize(cdii.EndDataPointer() - encoded_data);
747 class_datas_.AddItem(class_data, offset);
748 }
749 return class_data;
750 }
751
CreateCallSitesAndMethodHandles(const DexFile & dex_file)752 void Collections::CreateCallSitesAndMethodHandles(const DexFile& dex_file) {
753 // Iterate through the map list and set the offset of the CallSiteIds and MethodHandleItems.
754 const DexFile::MapList* map =
755 reinterpret_cast<const DexFile::MapList*>(dex_file.Begin() + MapListOffset());
756 for (uint32_t i = 0; i < map->size_; ++i) {
757 const DexFile::MapItem* item = map->list_ + i;
758 switch (item->type_) {
759 case DexFile::kDexTypeCallSiteIdItem:
760 SetCallSiteIdsOffset(item->offset_);
761 break;
762 case DexFile::kDexTypeMethodHandleItem:
763 SetMethodHandleItemsOffset(item->offset_);
764 break;
765 default:
766 break;
767 }
768 }
769 // Populate MethodHandleItems first (CallSiteIds may depend on them).
770 for (uint32_t i = 0; i < dex_file.NumMethodHandles(); i++) {
771 CreateMethodHandleItem(dex_file, i);
772 }
773 // Populate CallSiteIds.
774 for (uint32_t i = 0; i < dex_file.NumCallSiteIds(); i++) {
775 CreateCallSiteId(dex_file, i);
776 }
777 }
778
CreateCallSiteId(const DexFile & dex_file,uint32_t i)779 void Collections::CreateCallSiteId(const DexFile& dex_file, uint32_t i) {
780 const DexFile::CallSiteIdItem& disk_call_site_id = dex_file.GetCallSiteId(i);
781 const uint8_t* disk_call_item_ptr = dex_file.Begin() + disk_call_site_id.data_off_;
782 EncodedArrayItem* call_site_item =
783 CreateEncodedArrayItem(disk_call_item_ptr, disk_call_site_id.data_off_);
784
785 CallSiteId* call_site_id = new CallSiteId(call_site_item);
786 call_site_ids_.AddIndexedItem(call_site_id, CallSiteIdsOffset() + i * CallSiteId::ItemSize(), i);
787 }
788
CreateMethodHandleItem(const DexFile & dex_file,uint32_t i)789 void Collections::CreateMethodHandleItem(const DexFile& dex_file, uint32_t i) {
790 const DexFile::MethodHandleItem& disk_method_handle = dex_file.GetMethodHandle(i);
791 uint16_t index = disk_method_handle.field_or_method_idx_;
792 DexFile::MethodHandleType type =
793 static_cast<DexFile::MethodHandleType>(disk_method_handle.method_handle_type_);
794 bool is_invoke = type == DexFile::MethodHandleType::kInvokeStatic ||
795 type == DexFile::MethodHandleType::kInvokeInstance ||
796 type == DexFile::MethodHandleType::kInvokeConstructor ||
797 type == DexFile::MethodHandleType::kInvokeDirect ||
798 type == DexFile::MethodHandleType::kInvokeInterface;
799 static_assert(DexFile::MethodHandleType::kLast == DexFile::MethodHandleType::kInvokeInterface,
800 "Unexpected method handle types.");
801 IndexedItem* field_or_method_id;
802 if (is_invoke) {
803 field_or_method_id = GetMethodId(index);
804 } else {
805 field_or_method_id = GetFieldId(index);
806 }
807 MethodHandleItem* method_handle = new MethodHandleItem(type, field_or_method_id);
808 method_handle_items_.AddIndexedItem(
809 method_handle, MethodHandleItemsOffset() + i * MethodHandleItem::ItemSize(), i);
810 }
811
HeaderOffset(const dex_ir::Collections & collections ATTRIBUTE_UNUSED)812 static uint32_t HeaderOffset(const dex_ir::Collections& collections ATTRIBUTE_UNUSED) {
813 return 0;
814 }
815
HeaderSize(const dex_ir::Collections & collections ATTRIBUTE_UNUSED)816 static uint32_t HeaderSize(const dex_ir::Collections& collections ATTRIBUTE_UNUSED) {
817 // Size is in elements, so there is only one header.
818 return 1;
819 }
820
821 // The description of each dex file section type.
822 struct FileSectionDescriptor {
823 public:
824 std::string name;
825 uint16_t type;
826 // A function that when applied to a collection object, gives the size of the section.
827 std::function<uint32_t(const dex_ir::Collections&)> size_fn;
828 // A function that when applied to a collection object, gives the offset of the section.
829 std::function<uint32_t(const dex_ir::Collections&)> offset_fn;
830 };
831
832 static const FileSectionDescriptor kFileSectionDescriptors[] = {
833 {
834 "Header",
835 DexFile::kDexTypeHeaderItem,
836 &HeaderSize,
837 &HeaderOffset,
838 }, {
839 "StringId",
840 DexFile::kDexTypeStringIdItem,
841 &dex_ir::Collections::StringIdsSize,
842 &dex_ir::Collections::StringIdsOffset
843 }, {
844 "TypeId",
845 DexFile::kDexTypeTypeIdItem,
846 &dex_ir::Collections::TypeIdsSize,
847 &dex_ir::Collections::TypeIdsOffset
848 }, {
849 "ProtoId",
850 DexFile::kDexTypeProtoIdItem,
851 &dex_ir::Collections::ProtoIdsSize,
852 &dex_ir::Collections::ProtoIdsOffset
853 }, {
854 "FieldId",
855 DexFile::kDexTypeFieldIdItem,
856 &dex_ir::Collections::FieldIdsSize,
857 &dex_ir::Collections::FieldIdsOffset
858 }, {
859 "MethodId",
860 DexFile::kDexTypeMethodIdItem,
861 &dex_ir::Collections::MethodIdsSize,
862 &dex_ir::Collections::MethodIdsOffset
863 }, {
864 "ClassDef",
865 DexFile::kDexTypeClassDefItem,
866 &dex_ir::Collections::ClassDefsSize,
867 &dex_ir::Collections::ClassDefsOffset
868 }, {
869 "CallSiteId",
870 DexFile::kDexTypeCallSiteIdItem,
871 &dex_ir::Collections::CallSiteIdsSize,
872 &dex_ir::Collections::CallSiteIdsOffset
873 }, {
874 "MethodHandle",
875 DexFile::kDexTypeMethodHandleItem,
876 &dex_ir::Collections::MethodHandleItemsSize,
877 &dex_ir::Collections::MethodHandleItemsOffset
878 }, {
879 "StringData",
880 DexFile::kDexTypeStringDataItem,
881 &dex_ir::Collections::StringDatasSize,
882 &dex_ir::Collections::StringDatasOffset
883 }, {
884 "TypeList",
885 DexFile::kDexTypeTypeList,
886 &dex_ir::Collections::TypeListsSize,
887 &dex_ir::Collections::TypeListsOffset
888 }, {
889 "EncArr",
890 DexFile::kDexTypeEncodedArrayItem,
891 &dex_ir::Collections::EncodedArrayItemsSize,
892 &dex_ir::Collections::EncodedArrayItemsOffset
893 }, {
894 "Annotation",
895 DexFile::kDexTypeAnnotationItem,
896 &dex_ir::Collections::AnnotationItemsSize,
897 &dex_ir::Collections::AnnotationItemsOffset
898 }, {
899 "AnnoSet",
900 DexFile::kDexTypeAnnotationSetItem,
901 &dex_ir::Collections::AnnotationSetItemsSize,
902 &dex_ir::Collections::AnnotationSetItemsOffset
903 }, {
904 "AnnoSetRL",
905 DexFile::kDexTypeAnnotationSetRefList,
906 &dex_ir::Collections::AnnotationSetRefListsSize,
907 &dex_ir::Collections::AnnotationSetRefListsOffset
908 }, {
909 "AnnoDir",
910 DexFile::kDexTypeAnnotationsDirectoryItem,
911 &dex_ir::Collections::AnnotationsDirectoryItemsSize,
912 &dex_ir::Collections::AnnotationsDirectoryItemsOffset
913 }, {
914 "DebugInfo",
915 DexFile::kDexTypeDebugInfoItem,
916 &dex_ir::Collections::DebugInfoItemsSize,
917 &dex_ir::Collections::DebugInfoItemsOffset
918 }, {
919 "CodeItem",
920 DexFile::kDexTypeCodeItem,
921 &dex_ir::Collections::CodeItemsSize,
922 &dex_ir::Collections::CodeItemsOffset
923 }, {
924 "ClassData",
925 DexFile::kDexTypeClassDataItem,
926 &dex_ir::Collections::ClassDatasSize,
927 &dex_ir::Collections::ClassDatasOffset
928 }
929 };
930
GetSortedDexFileSections(dex_ir::Header * header,dex_ir::SortDirection direction)931 std::vector<dex_ir::DexFileSection> GetSortedDexFileSections(dex_ir::Header* header,
932 dex_ir::SortDirection direction) {
933 const dex_ir::Collections& collections = header->GetCollections();
934 std::vector<dex_ir::DexFileSection> sorted_sections;
935 // Build the table that will map from offset to color
936 for (const FileSectionDescriptor& s : kFileSectionDescriptors) {
937 sorted_sections.push_back(dex_ir::DexFileSection(s.name,
938 s.type,
939 s.size_fn(collections),
940 s.offset_fn(collections)));
941 }
942 // Sort by offset.
943 std::sort(sorted_sections.begin(),
944 sorted_sections.end(),
945 [=](dex_ir::DexFileSection& a, dex_ir::DexFileSection& b) {
946 if (direction == SortDirection::kSortDescending) {
947 return a.offset > b.offset;
948 } else {
949 return a.offset < b.offset;
950 }
951 });
952 return sorted_sections;
953 }
954
955 } // namespace dex_ir
956 } // namespace art
957