blob: cb7f174787ef23a250653bada6a77d87827787c0 [file] [log] [blame]
Elliott Hughes2faa5f12012-01-30 14:42:07 -08001/*
2 * Copyright (C) 2011 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
Carl Shapiro1fb86202011-06-27 17:43:13 -070016
Brian Carlstromfc0e3212013-07-17 14:40:12 -070017#ifndef ART_RUNTIME_DEX_FILE_H_
18#define ART_RUNTIME_DEX_FILE_H_
Carl Shapiro1fb86202011-06-27 17:43:13 -070019
Ian Rogers700a4022014-05-19 16:49:03 -070020#include <memory>
Elliott Hughes0c424cb2011-08-26 10:16:25 -070021#include <string>
Brian Carlstrom74eb46a2011-08-02 20:10:14 -070022#include <vector>
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070023
Elliott Hughes07ed66b2012-12-12 18:34:25 -080024#include "base/logging.h"
Ian Rogers03b6eaf2014-10-28 09:34:57 -070025#include "base/value_object.h"
Andreas Gampea5b09a62016-11-17 15:21:22 -080026#include "dex_file_types.h"
Brian Carlstrom578bbdc2011-07-21 14:07:47 -070027#include "globals.h"
Ian Rogers08f753d2012-08-24 14:35:25 -070028#include "invoke_type.h"
Jesse Wilson6bf19152011-09-29 13:12:33 -040029#include "jni.h"
Ian Rogers08f753d2012-08-24 14:35:25 -070030#include "modifiers.h"
Ian Rogers68b56852014-08-29 20:19:11 -070031#include "utf.h"
Carl Shapiro1fb86202011-06-27 17:43:13 -070032
33namespace art {
34
Ian Rogers576ca0c2014-06-06 15:58:22 -070035class MemMap;
Richard Uhler07b3c232015-03-31 15:57:54 -070036class OatDexFile;
Ian Rogersd91d6d62013-09-25 20:26:14 -070037class Signature;
Ian Rogersfc0e94b2013-09-23 23:51:32 -070038class StringPiece;
Brian Carlstroma6cc8932012-01-04 14:44:07 -080039class ZipArchive;
40
Brian Carlstromf615a612011-07-23 12:50:34 -070041class DexFile {
Carl Shapiro1fb86202011-06-27 17:43:13 -070042 public:
// First dex format version that supports default methods.
// Declared constexpr, like the other compile-time constants of this class.
static constexpr uint32_t kDefaultMethodsVersion = 37;
// First dex format version that enforces the class definition ordering rules.
static constexpr uint32_t kClassDefinitionOrderEnforcedVersion = 37;
47
Ian Rogers13735952014-10-08 12:43:28 -070048 static const uint8_t kDexMagic[];
Narayan Kamath52e66502016-08-01 14:20:31 +010049 static constexpr size_t kNumDexVersions = 3;
Alex Lightc4961812016-03-23 10:20:41 -070050 static constexpr size_t kDexVersionLen = 4;
51 static const uint8_t kDexMagicVersions[kNumDexVersions][kDexVersionLen];
52
Ian Rogers13735952014-10-08 12:43:28 -070053 static constexpr size_t kSha1DigestSize = 20;
54 static constexpr uint32_t kDexEndianConstant = 0x12345678;
Carl Shapiro80d4dde2011-06-28 16:24:07 -070055
Brian Carlstromb7bbba42011-10-13 14:58:47 -070056 // name of the DexFile entry within a zip archive
57 static const char* kClassesDex;
58
// The value of an invalid 32-bit index.
static constexpr uint32_t kDexNoIndex = 0xFFFFFFFF;

// The value of an invalid 16-bit index.
static constexpr uint16_t kDexNoIndex16 = 0xFFFF;
Carl Shapiro1fb86202011-06-27 17:43:13 -070064
// Separator character used in MultiDex locations.
static constexpr char kMultiDexSeparator = ':';

// The same separator as a string literal. It is a macro so that it can be
// pasted next to other string literals and merged with them at compile time.
#define kMultiDexSeparatorString ":"
71
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070072 // Raw header_item.
73 struct Header {
74 uint8_t magic_[8];
Brian Carlstrom7934ac22013-07-26 10:54:15 -070075 uint32_t checksum_; // See also location_checksum_
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070076 uint8_t signature_[kSha1DigestSize];
jeffhaof6174e82012-01-31 16:14:17 -080077 uint32_t file_size_; // size of entire file
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070078 uint32_t header_size_; // offset to start of next section
79 uint32_t endian_tag_;
Ian Rogers0571d352011-11-03 19:51:38 -070080 uint32_t link_size_; // unused
81 uint32_t link_off_; // unused
82 uint32_t map_off_; // unused
83 uint32_t string_ids_size_; // number of StringIds
84 uint32_t string_ids_off_; // file offset of StringIds array
85 uint32_t type_ids_size_; // number of TypeIds, we don't support more than 65535
86 uint32_t type_ids_off_; // file offset of TypeIds array
87 uint32_t proto_ids_size_; // number of ProtoIds, we don't support more than 65535
88 uint32_t proto_ids_off_; // file offset of ProtoIds array
89 uint32_t field_ids_size_; // number of FieldIds
90 uint32_t field_ids_off_; // file offset of FieldIds array
91 uint32_t method_ids_size_; // number of MethodIds
92 uint32_t method_ids_off_; // file offset of MethodIds array
93 uint32_t class_defs_size_; // number of ClassDefs
94 uint32_t class_defs_off_; // file offset of ClassDef array
95 uint32_t data_size_; // unused
96 uint32_t data_off_; // unused
Elliott Hughesa21039c2012-06-21 12:09:25 -070097
Andreas Gampe76ed99d2016-03-28 18:31:29 -070098 // Decode the dex magic version
99 uint32_t GetVersion() const;
100
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700101 private:
102 DISALLOW_COPY_AND_ASSIGN(Header);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700103 };
Carl Shapiro1fb86202011-06-27 17:43:13 -0700104
// Type codes stored in MapItem::type_.
enum {
  kDexTypeHeaderItem               = 0x0000,
  kDexTypeStringIdItem             = 0x0001,
  kDexTypeTypeIdItem               = 0x0002,
  kDexTypeProtoIdItem              = 0x0003,
  kDexTypeFieldIdItem              = 0x0004,
  kDexTypeMethodIdItem             = 0x0005,
  kDexTypeClassDefItem             = 0x0006,
  kDexTypeMapList                  = 0x1000,
  kDexTypeTypeList                 = 0x1001,
  kDexTypeAnnotationSetRefList     = 0x1002,
  kDexTypeAnnotationSetItem        = 0x1003,
  kDexTypeClassDataItem            = 0x2000,
  kDexTypeCodeItem                 = 0x2001,
  kDexTypeStringDataItem           = 0x2002,
  kDexTypeDebugInfoItem            = 0x2003,
  kDexTypeAnnotationItem           = 0x2004,
  kDexTypeEncodedArrayItem         = 0x2005,
  kDexTypeAnnotationsDirectoryItem = 0x2006,
};
126
127 struct MapItem {
128 uint16_t type_;
129 uint16_t unused_;
130 uint32_t size_;
131 uint32_t offset_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700132
jeffhao10037c82012-01-23 15:06:23 -0800133 private:
134 DISALLOW_COPY_AND_ASSIGN(MapItem);
135 };
136
137 struct MapList {
138 uint32_t size_;
139 MapItem list_[1];
Elliott Hughesa21039c2012-06-21 12:09:25 -0700140
jeffhao10037c82012-01-23 15:06:23 -0800141 private:
142 DISALLOW_COPY_AND_ASSIGN(MapList);
143 };
144
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700145 // Raw string_id_item.
146 struct StringId {
147 uint32_t string_data_off_; // offset in bytes from the base address
Elliott Hughesa21039c2012-06-21 12:09:25 -0700148
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700149 private:
150 DISALLOW_COPY_AND_ASSIGN(StringId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700151 };
152
153 // Raw type_id_item.
154 struct TypeId {
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800155 dex::StringIndex descriptor_idx_; // index into string_ids
Elliott Hughesa21039c2012-06-21 12:09:25 -0700156
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700157 private:
158 DISALLOW_COPY_AND_ASSIGN(TypeId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700159 };
160
161 // Raw field_id_item.
162 struct FieldId {
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800163 dex::TypeIndex class_idx_; // index into type_ids_ array for defining class
164 dex::TypeIndex type_idx_; // index into type_ids_ array for field type
165 dex::StringIndex name_idx_; // index into string_ids_ array for field name
Elliott Hughesa21039c2012-06-21 12:09:25 -0700166
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700167 private:
168 DISALLOW_COPY_AND_ASSIGN(FieldId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700169 };
170
Andreas Gampea5b09a62016-11-17 15:21:22 -0800171 // Raw proto_id_item.
172 struct ProtoId {
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800173 dex::StringIndex shorty_idx_; // index into string_ids array for shorty descriptor
Andreas Gampea5b09a62016-11-17 15:21:22 -0800174 dex::TypeIndex return_type_idx_; // index into type_ids array for return type
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800175 uint16_t pad_; // padding = 0
176 uint32_t parameters_off_; // file offset to type_list for parameter types
Andreas Gampea5b09a62016-11-17 15:21:22 -0800177
178 private:
179 DISALLOW_COPY_AND_ASSIGN(ProtoId);
180 };
181
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700182 // Raw method_id_item.
183 struct MethodId {
Andreas Gampea5b09a62016-11-17 15:21:22 -0800184 dex::TypeIndex class_idx_; // index into type_ids_ array for defining class
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800185 uint16_t proto_idx_; // index into proto_ids_ array for method prototype
186 dex::StringIndex name_idx_; // index into string_ids_ array for method name
Elliott Hughesa21039c2012-06-21 12:09:25 -0700187
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700188 private:
189 DISALLOW_COPY_AND_ASSIGN(MethodId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700190 };
191
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700192 // Raw class_def_item.
193 struct ClassDef {
Andreas Gampea5b09a62016-11-17 15:21:22 -0800194 dex::TypeIndex class_idx_; // index into type_ids_ array for this class
Ian Rogers0571d352011-11-03 19:51:38 -0700195 uint16_t pad1_; // padding = 0
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700196 uint32_t access_flags_;
Andreas Gampea5b09a62016-11-17 15:21:22 -0800197 dex::TypeIndex superclass_idx_; // index into type_ids_ array for superclass
Ian Rogers0571d352011-11-03 19:51:38 -0700198 uint16_t pad2_; // padding = 0
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700199 uint32_t interfaces_off_; // file offset to TypeList
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800200 dex::StringIndex source_file_idx_; // index into string_ids_ for source file name
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700201 uint32_t annotations_off_; // file offset to annotations_directory_item
202 uint32_t class_data_off_; // file offset to class_data_item
203 uint32_t static_values_off_; // file offset to EncodedArray
Elliott Hughesa21039c2012-06-21 12:09:25 -0700204
Andreas Gampe51829322014-08-25 15:05:04 -0700205 // Returns the valid access flags, that is, Java modifier bits relevant to the ClassDef type
206 // (class or interface). These are all in the lower 16b and do not contain runtime flags.
207 uint32_t GetJavaAccessFlags() const {
208 // Make sure that none of our runtime-only flags are set.
Andreas Gampe575e78c2014-11-03 23:41:03 -0800209 static_assert((kAccValidClassFlags & kAccJavaFlagsMask) == kAccValidClassFlags,
210 "Valid class flags not a subset of Java flags");
211 static_assert((kAccValidInterfaceFlags & kAccJavaFlagsMask) == kAccValidInterfaceFlags,
212 "Valid interface flags not a subset of Java flags");
Andreas Gampe51829322014-08-25 15:05:04 -0700213
214 if ((access_flags_ & kAccInterface) != 0) {
215 // Interface.
216 return access_flags_ & kAccValidInterfaceFlags;
217 } else {
218 // Class.
219 return access_flags_ & kAccValidClassFlags;
220 }
221 }
222
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700223 private:
224 DISALLOW_COPY_AND_ASSIGN(ClassDef);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700225 };
226
227 // Raw type_item.
228 struct TypeItem {
Andreas Gampea5b09a62016-11-17 15:21:22 -0800229 dex::TypeIndex type_idx_; // index into type_ids section
Elliott Hughesa21039c2012-06-21 12:09:25 -0700230
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700231 private:
232 DISALLOW_COPY_AND_ASSIGN(TypeItem);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700233 };
234
235 // Raw type_list.
236 class TypeList {
237 public:
238 uint32_t Size() const {
239 return size_;
240 }
241
242 const TypeItem& GetTypeItem(uint32_t idx) const {
Sebastien Hertzb24bd992013-08-02 15:19:09 +0200243 DCHECK_LT(idx, this->size_);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700244 return this->list_[idx];
245 }
246
Andreas Gampe31a7a0c2014-08-29 16:07:49 -0700247 // Size in bytes of the part of the list that is common.
248 static constexpr size_t GetHeaderSize() {
249 return 4U;
250 }
251
252 // Size in bytes of the whole type list including all the stored elements.
253 static constexpr size_t GetListSize(size_t count) {
254 return GetHeaderSize() + sizeof(TypeItem) * count;
255 }
256
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700257 private:
258 uint32_t size_; // size of the list, in entries
259 TypeItem list_[1]; // elements of the list
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700260 DISALLOW_COPY_AND_ASSIGN(TypeList);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700261 };
262
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700263 // Raw code_item.
264 struct CodeItem {
Igor Murashkinc449e8b2015-06-10 15:56:42 -0700265 uint16_t registers_size_; // the number of registers used by this code
266 // (locals + parameters)
267 uint16_t ins_size_; // the number of words of incoming arguments to the method
268 // that this code is for
269 uint16_t outs_size_; // the number of words of outgoing argument space required
270 // by this code for method invocation
271 uint16_t tries_size_; // the number of try_items for this instance. If non-zero,
272 // then these appear as the tries array just after the
273 // insns in this instance.
274 uint32_t debug_info_off_; // file offset to debug info stream
Ian Rogersd81871c2011-10-03 13:57:23 -0700275 uint32_t insns_size_in_code_units_; // size of the insns array, in 2 byte code units
Igor Murashkinc449e8b2015-06-10 15:56:42 -0700276 uint16_t insns_[1]; // actual array of bytecode.
Elliott Hughesa21039c2012-06-21 12:09:25 -0700277
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700278 private:
279 DISALLOW_COPY_AND_ASSIGN(CodeItem);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700280 };
281
Carl Shapiro2eaa9682011-08-04 19:26:11 -0700282 // Raw try_item.
283 struct TryItem {
284 uint32_t start_addr_;
285 uint16_t insn_count_;
286 uint16_t handler_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700287
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700288 private:
289 DISALLOW_COPY_AND_ASSIGN(TryItem);
Carl Shapiro2eaa9682011-08-04 19:26:11 -0700290 };
291
// Annotation constants.
enum {
  // Annotation visibility.
  kDexVisibilityBuild   = 0x00,
  kDexVisibilityRuntime = 0x01,
  kDexVisibilitySystem  = 0x02,

  kDexAnnotationByte       = 0x00,
  kDexAnnotationShort      = 0x02,
  kDexAnnotationChar       = 0x03,
  kDexAnnotationInt        = 0x04,
  kDexAnnotationLong       = 0x06,
  kDexAnnotationFloat      = 0x10,
  kDexAnnotationDouble     = 0x11,
  kDexAnnotationString     = 0x17,
  kDexAnnotationType       = 0x18,
  kDexAnnotationField      = 0x19,
  kDexAnnotationMethod     = 0x1a,
  kDexAnnotationEnum       = 0x1b,
  kDexAnnotationArray      = 0x1c,
  kDexAnnotationAnnotation = 0x1d,
  kDexAnnotationNull       = 0x1e,
  kDexAnnotationBoolean    = 0x1f,

  kDexAnnotationValueTypeMask = 0x1f,  // low 5 bits
  kDexAnnotationValueArgShift = 5,
};
318
319 struct AnnotationsDirectoryItem {
320 uint32_t class_annotations_off_;
321 uint32_t fields_size_;
322 uint32_t methods_size_;
323 uint32_t parameters_size_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700324
jeffhao10037c82012-01-23 15:06:23 -0800325 private:
326 DISALLOW_COPY_AND_ASSIGN(AnnotationsDirectoryItem);
327 };
328
329 struct FieldAnnotationsItem {
330 uint32_t field_idx_;
331 uint32_t annotations_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700332
jeffhao10037c82012-01-23 15:06:23 -0800333 private:
334 DISALLOW_COPY_AND_ASSIGN(FieldAnnotationsItem);
335 };
336
337 struct MethodAnnotationsItem {
338 uint32_t method_idx_;
339 uint32_t annotations_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700340
jeffhao10037c82012-01-23 15:06:23 -0800341 private:
342 DISALLOW_COPY_AND_ASSIGN(MethodAnnotationsItem);
343 };
344
345 struct ParameterAnnotationsItem {
346 uint32_t method_idx_;
347 uint32_t annotations_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700348
jeffhao10037c82012-01-23 15:06:23 -0800349 private:
350 DISALLOW_COPY_AND_ASSIGN(ParameterAnnotationsItem);
351 };
352
353 struct AnnotationSetRefItem {
354 uint32_t annotations_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700355
jeffhao10037c82012-01-23 15:06:23 -0800356 private:
357 DISALLOW_COPY_AND_ASSIGN(AnnotationSetRefItem);
358 };
359
360 struct AnnotationSetRefList {
361 uint32_t size_;
362 AnnotationSetRefItem list_[1];
Elliott Hughesa21039c2012-06-21 12:09:25 -0700363
jeffhao10037c82012-01-23 15:06:23 -0800364 private:
365 DISALLOW_COPY_AND_ASSIGN(AnnotationSetRefList);
366 };
367
368 struct AnnotationSetItem {
369 uint32_t size_;
370 uint32_t entries_[1];
Elliott Hughesa21039c2012-06-21 12:09:25 -0700371
jeffhao10037c82012-01-23 15:06:23 -0800372 private:
373 DISALLOW_COPY_AND_ASSIGN(AnnotationSetItem);
374 };
375
376 struct AnnotationItem {
377 uint8_t visibility_;
378 uint8_t annotation_[1];
Elliott Hughesa21039c2012-06-21 12:09:25 -0700379
jeffhao10037c82012-01-23 15:06:23 -0800380 private:
381 DISALLOW_COPY_AND_ASSIGN(AnnotationItem);
382 };
383
// NOTE(review): the original comment tags this enum as "private", yet it is
// declared in the public section of the class.
enum AnnotationResultStyle {  // private
  kAllObjects,
  kPrimitivesOrObjects,
  kAllRaw
};

// Forward declaration only; the definition is not part of this section.
struct AnnotationValue;
391
// Computes the checksum of the file |filename|, for comparison against
// GetLocationChecksum():
//   - for .dex files it is the header checksum;
//   - for zip files it is the CRC32 checksum of the classes.dex zip entry.
// Returns true if the checksum could be found, false otherwise.
static bool GetChecksum(const char* filename, uint32_t* checksum, std::string* error_msg);
Brian Carlstrom78128a62011-09-15 17:21:19 -0700397
Brian Carlstrom89521892011-12-07 22:05:07 -0800398 // Opens .dex file, backed by existing memory
David Sehr733ddb22016-09-19 15:02:18 -0700399 static std::unique_ptr<const DexFile> Open(const uint8_t* base,
400 size_t size,
Richard Uhlerfbef44d2014-12-23 09:48:51 -0800401 const std::string& location,
402 uint32_t location_checksum,
Richard Uhler07b3c232015-03-31 15:57:54 -0700403 const OatDexFile* oat_dex_file,
Andreas Gampe3a2bd292016-01-26 17:23:47 -0800404 bool verify,
Aart Bik37d6a3b2016-06-21 18:30:10 -0700405 bool verify_checksum,
Andreas Gampe3a2bd292016-01-26 17:23:47 -0800406 std::string* error_msg);
Brian Carlstrom89521892011-12-07 22:05:07 -0800407
Orion Hodsona4c2a052016-08-17 10:51:42 +0100408 // Opens .dex file that has been memory-mapped by the caller.
409 static std::unique_ptr<const DexFile> Open(const std::string& location,
410 uint32_t location_checkum,
411 std::unique_ptr<MemMap> mem_map,
412 bool verify,
413 bool verify_checksum,
414 std::string* error_msg);
415
David Sehr733ddb22016-09-19 15:02:18 -0700416 // Opens all .dex files found in the file, guessing the container format based on file extension.
417 static bool Open(const char* filename,
418 const std::string& location,
419 bool verify_checksum,
420 std::string* error_msg,
421 std::vector<std::unique_ptr<const DexFile>>* dex_files);
Orion Hodsona4c2a052016-08-17 10:51:42 +0100422
David Sehr733ddb22016-09-19 15:02:18 -0700423 // Open a single dex file from an fd.
424 static std::unique_ptr<const DexFile> OpenDex(int fd,
425 const std::string& location,
426 bool verify_checksum,
427 std::string* error_msg);
428
429 // Opens dex files from within a .jar, .zip, or .apk file
430 static bool OpenZip(int fd,
431 const std::string& location,
432 bool verify_checksum,
433 std::string* error_msg,
434 std::vector<std::unique_ptr<const DexFile>>* dex_files);
Brian Carlstroma6cc8932012-01-04 14:44:07 -0800435
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700436 // Closes a .dex file.
Brian Carlstromf615a612011-07-23 12:50:34 -0700437 virtual ~DexFile();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700438
Brian Carlstroma663ea52011-08-19 23:33:41 -0700439 const std::string& GetLocation() const {
440 return location_;
441 }
442
Andreas Gampecb8f9e82014-07-24 15:35:50 -0700443 // For normal dex files, location and base location coincide. If a dex file is part of a multidex
444 // archive, the base location is the name of the originating jar/apk, stripped of any internal
445 // classes*.dex path.
Vladimir Markoaa4497d2014-09-05 14:01:17 +0100446 static std::string GetBaseLocation(const char* location) {
447 const char* pos = strrchr(location, kMultiDexSeparator);
448 if (pos == nullptr) {
449 return location;
Andreas Gampecb8f9e82014-07-24 15:35:50 -0700450 } else {
Vladimir Markoaa4497d2014-09-05 14:01:17 +0100451 return std::string(location, pos - location);
452 }
453 }
454
// std::string convenience overload; forwards to the const char* version.
static std::string GetBaseLocation(const std::string& location) {
  const char* raw_location = location.c_str();
  return GetBaseLocation(raw_location);
}
458
459 // Returns the ':classes*.dex' part of the dex location. Returns an empty
460 // string if there is no multidex suffix for the given location.
461 // The kMultiDexSeparator is included in the returned suffix.
462 static std::string GetMultiDexSuffix(const std::string& location) {
463 size_t pos = location.rfind(kMultiDexSeparator);
Vladimir Markoaa4497d2014-09-05 14:01:17 +0100464 if (pos == std::string::npos) {
Richard Uhlere5fed032015-03-18 08:21:11 -0700465 return "";
Vladimir Markoaa4497d2014-09-05 14:01:17 +0100466 } else {
Richard Uhlere5fed032015-03-18 08:21:11 -0700467 return location.substr(pos);
Andreas Gampecb8f9e82014-07-24 15:35:50 -0700468 }
469 }
470
Richard Uhlere5fed032015-03-18 08:21:11 -0700471 std::string GetBaseLocation() const {
472 return GetBaseLocation(location_);
473 }
474
Brian Carlstrom5b332c82012-02-01 15:02:31 -0800475 // For DexFiles directly from .dex files, this is the checksum from the DexFile::Header.
476 // For DexFiles opened from a zip files, this will be the ZipEntry CRC32 of classes.dex.
477 uint32_t GetLocationChecksum() const {
478 return location_checksum_;
479 }
480
Brian Carlstroma663ea52011-08-19 23:33:41 -0700481 const Header& GetHeader() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700482 DCHECK(header_ != nullptr) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700483 return *header_;
Carl Shapiro1fb86202011-06-27 17:43:13 -0700484 }
485
Ian Rogers0571d352011-11-03 19:51:38 -0700486 // Decode the dex magic version
Andreas Gampe76ed99d2016-03-28 18:31:29 -0700487 uint32_t GetVersion() const {
488 return GetHeader().GetVersion();
489 }
Ian Rogersd81871c2011-10-03 13:57:23 -0700490
// Returns true if |magic| points to the magic value.
static bool IsMagicValid(const uint8_t* magic);

// Returns true if the bytes following the magic hold the correct value.
static bool IsVersionValid(const uint8_t* magic);
Brian Carlstrom6e3b1d92012-01-11 01:36:32 -0800496
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700497 // Returns the number of string identifiers in the .dex file.
498 size_t NumStringIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700499 DCHECK(header_ != nullptr) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700500 return header_->string_ids_size_;
Carl Shapiro0e5d75d2011-07-06 18:28:37 -0700501 }
502
Ian Rogers0571d352011-11-03 19:51:38 -0700503 // Returns the StringId at the specified index.
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800504 const StringId& GetStringId(dex::StringIndex idx) const {
505 DCHECK_LT(idx.index_, NumStringIds()) << GetLocation();
506 return string_ids_[idx.index_];
Ian Rogers0571d352011-11-03 19:51:38 -0700507 }
508
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800509 dex::StringIndex GetIndexForStringId(const StringId& string_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800510 CHECK_GE(&string_id, string_ids_) << GetLocation();
511 CHECK_LT(&string_id, string_ids_ + header_->string_ids_size_) << GetLocation();
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800512 return dex::StringIndex(&string_id - string_ids_);
Ian Rogers0571d352011-11-03 19:51:38 -0700513 }
514
515 int32_t GetStringLength(const StringId& string_id) const;
516
Ian Rogersdfb325e2013-10-30 01:00:44 -0700517 // Returns a pointer to the UTF-8 string data referred to by the given string_id as well as the
518 // length of the string when decoded as a UTF-16 string. Note the UTF-16 length is not the same
519 // as the string length of the string data.
520 const char* GetStringDataAndUtf16Length(const StringId& string_id, uint32_t* utf16_length) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700521
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100522 const char* GetStringData(const StringId& string_id) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700523
Ian Rogersdfb325e2013-10-30 01:00:44 -0700524 // Index version of GetStringDataAndUtf16Length.
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800525 const char* StringDataAndUtf16LengthByIdx(dex::StringIndex idx, uint32_t* utf16_length) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700526
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800527 const char* StringDataByIdx(dex::StringIndex idx) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700528
Ian Rogers637c65b2013-05-31 11:46:00 -0700529 // Looks up a string id for a given modified utf8 string.
530 const StringId* FindStringId(const char* string) const;
531
Artem Udovichenkod9786b02015-10-14 16:36:55 +0300532 const TypeId* FindTypeId(const char* string) const;
533
Ian Rogers637c65b2013-05-31 11:46:00 -0700534 // Looks up a string id for a given utf16 string.
Vladimir Markoa48aef42014-12-03 17:53:53 +0000535 const StringId* FindStringId(const uint16_t* string, size_t length) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700536
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700537 // Returns the number of type identifiers in the .dex file.
Ian Rogers68b56852014-08-29 20:19:11 -0700538 uint32_t NumTypeIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700539 DCHECK(header_ != nullptr) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700540 return header_->type_ids_size_;
Carl Shapiro5fafe2b2011-07-09 15:34:41 -0700541 }
542
Ian Rogers0571d352011-11-03 19:51:38 -0700543 // Returns the TypeId at the specified index.
Andreas Gampea5b09a62016-11-17 15:21:22 -0800544 const TypeId& GetTypeId(dex::TypeIndex idx) const {
545 DCHECK_LT(idx.index_, NumTypeIds()) << GetLocation();
546 return type_ids_[idx.index_];
Carl Shapiro5fafe2b2011-07-09 15:34:41 -0700547 }
548
Andreas Gampea5b09a62016-11-17 15:21:22 -0800549 dex::TypeIndex GetIndexForTypeId(const TypeId& type_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800550 CHECK_GE(&type_id, type_ids_) << GetLocation();
551 CHECK_LT(&type_id, type_ids_ + header_->type_ids_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700552 size_t result = &type_id - type_ids_;
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800553 DCHECK_LT(result, 65536U) << GetLocation();
Andreas Gampea5b09a62016-11-17 15:21:22 -0800554 return dex::TypeIndex(static_cast<uint16_t>(result));
Ian Rogers0571d352011-11-03 19:51:38 -0700555 }
556
557 // Get the descriptor string associated with a given type index.
Andreas Gampea5b09a62016-11-17 15:21:22 -0800558 const char* StringByTypeIdx(dex::TypeIndex idx, uint32_t* unicode_length) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700559
Andreas Gampea5b09a62016-11-17 15:21:22 -0800560 const char* StringByTypeIdx(dex::TypeIndex idx) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700561
562 // Returns the type descriptor string of a type id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100563 const char* GetTypeDescriptor(const TypeId& type_id) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700564
565 // Looks up a type for the given string index
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800566 const TypeId* FindTypeId(dex::StringIndex string_idx) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700567
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700568 // Returns the number of field identifiers in the .dex file.
569 size_t NumFieldIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700570 DCHECK(header_ != nullptr) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700571 return header_->field_ids_size_;
Carl Shapiro0e5d75d2011-07-06 18:28:37 -0700572 }
573
Ian Rogers0571d352011-11-03 19:51:38 -0700574 // Returns the FieldId at the specified index.
575 const FieldId& GetFieldId(uint32_t idx) const {
Sebastien Hertzb24bd992013-08-02 15:19:09 +0200576 DCHECK_LT(idx, NumFieldIds()) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700577 return field_ids_[idx];
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700578 }
579
Ian Rogers9b1a4f42011-11-14 18:35:10 -0800580 uint32_t GetIndexForFieldId(const FieldId& field_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800581 CHECK_GE(&field_id, field_ids_) << GetLocation();
582 CHECK_LT(&field_id, field_ids_ + header_->field_ids_size_) << GetLocation();
Ian Rogers9b1a4f42011-11-14 18:35:10 -0800583 return &field_id - field_ids_;
584 }
585
586 // Looks up a field by its declaring class, name and type
587 const FieldId* FindFieldId(const DexFile::TypeId& declaring_klass,
588 const DexFile::StringId& name,
589 const DexFile::TypeId& type) const;
590
Alex Light9c20a142016-08-23 15:05:12 -0700591 uint32_t FindCodeItemOffset(const DexFile::ClassDef& class_def,
592 uint32_t dex_method_idx) const;
593
Brian Carlstrom6b4ef022011-10-23 14:59:04 -0700594 // Returns the declaring class descriptor string of a field id.
595 const char* GetFieldDeclaringClassDescriptor(const FieldId& field_id) const {
Brian Carlstromb9edb842011-08-28 16:31:06 -0700596 const DexFile::TypeId& type_id = GetTypeId(field_id.class_idx_);
597 return GetTypeDescriptor(type_id);
598 }
599
Brian Carlstrom6b4ef022011-10-23 14:59:04 -0700600 // Returns the class descriptor string of a field id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100601 const char* GetFieldTypeDescriptor(const FieldId& field_id) const;
Brian Carlstrom6b4ef022011-10-23 14:59:04 -0700602
Brian Carlstromb9edb842011-08-28 16:31:06 -0700603 // Returns the name of a field id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100604 const char* GetFieldName(const FieldId& field_id) const;
Brian Carlstromb9edb842011-08-28 16:31:06 -0700605
Ian Rogers0571d352011-11-03 19:51:38 -0700606 // Returns the number of method identifiers in the .dex file.
607 size_t NumMethodIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700608 DCHECK(header_ != nullptr) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700609 return header_->method_ids_size_;
610 }
611
612 // Returns the MethodId at the specified index.
613 const MethodId& GetMethodId(uint32_t idx) const {
Ian Rogers4f6ad8a2013-03-18 15:27:28 -0700614 DCHECK_LT(idx, NumMethodIds()) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700615 return method_ids_[idx];
616 }
617
618 uint32_t GetIndexForMethodId(const MethodId& method_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800619 CHECK_GE(&method_id, method_ids_) << GetLocation();
620 CHECK_LT(&method_id, method_ids_ + header_->method_ids_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700621 return &method_id - method_ids_;
622 }
623
Ian Rogers9b1a4f42011-11-14 18:35:10 -0800624 // Looks up a method by its declaring class, name and proto_id
625 const MethodId* FindMethodId(const DexFile::TypeId& declaring_klass,
626 const DexFile::StringId& name,
Ian Rogers0571d352011-11-03 19:51:38 -0700627 const DexFile::ProtoId& signature) const;
628
Brian Carlstrom6b4ef022011-10-23 14:59:04 -0700629 // Returns the declaring class descriptor string of a method id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100630 const char* GetMethodDeclaringClassDescriptor(const MethodId& method_id) const;
Brian Carlstrom7540ff42011-09-04 16:38:46 -0700631
jeffhao98eacac2011-09-14 16:11:53 -0700632 // Returns the prototype of a method id.
Brian Carlstromaded5f72011-10-07 17:15:04 -0700633 const ProtoId& GetMethodPrototype(const MethodId& method_id) const {
634 return GetProtoId(method_id.proto_idx_);
635 }
636
Ian Rogersd91d6d62013-09-25 20:26:14 -0700637 // Returns a representation of the signature of a method id.
638 const Signature GetMethodSignature(const MethodId& method_id) const;
jeffhao98eacac2011-09-14 16:11:53 -0700639
Orion Hodsonb34bb192016-10-18 17:02:58 +0100640 // Returns a representation of the signature of a proto id.
641 const Signature GetProtoSignature(const ProtoId& proto_id) const;
642
Brian Carlstrom7540ff42011-09-04 16:38:46 -0700643 // Returns the name of a method id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100644 const char* GetMethodName(const MethodId& method_id) const;
Brian Carlstrom7540ff42011-09-04 16:38:46 -0700645
Calin Juravle68ad6492015-08-18 17:08:12 +0100646 // Returns the shorty of a method by its index.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100647 const char* GetMethodShorty(uint32_t idx) const;
Calin Juravle68ad6492015-08-18 17:08:12 +0100648
Ian Rogers0571d352011-11-03 19:51:38 -0700649 // Returns the shorty of a method id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100650 const char* GetMethodShorty(const MethodId& method_id) const;
651 const char* GetMethodShorty(const MethodId& method_id, uint32_t* length) const;
652
Ian Rogers0571d352011-11-03 19:51:38 -0700653 // Returns the number of class definitions in the .dex file.
Ian Rogers68b56852014-08-29 20:19:11 -0700654 uint32_t NumClassDefs() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700655 DCHECK(header_ != nullptr) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700656 return header_->class_defs_size_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700657 }
658
659 // Returns the ClassDef at the specified index.
Ian Rogers8b2c0b92013-09-19 02:56:49 -0700660 const ClassDef& GetClassDef(uint16_t idx) const {
Sebastien Hertzb24bd992013-08-02 15:19:09 +0200661 DCHECK_LT(idx, NumClassDefs()) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700662 return class_defs_[idx];
663 }
664
Ian Rogers8b2c0b92013-09-19 02:56:49 -0700665 uint16_t GetIndexForClassDef(const ClassDef& class_def) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800666 CHECK_GE(&class_def, class_defs_) << GetLocation();
667 CHECK_LT(&class_def, class_defs_ + header_->class_defs_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700668 return &class_def - class_defs_;
669 }
670
671 // Returns the class descriptor string of a class definition.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100672 const char* GetClassDescriptor(const ClassDef& class_def) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700673
Ian Rogers8b2c0b92013-09-19 02:56:49 -0700674 // Looks up a class definition by its type index.
Andreas Gampea5b09a62016-11-17 15:21:22 -0800675 const ClassDef* FindClassDef(dex::TypeIndex type_idx) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700676
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700677 const TypeList* GetInterfacesList(const ClassDef& class_def) const {
678 if (class_def.interfaces_off_ == 0) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700679 return nullptr;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700680 } else {
Ian Rogers13735952014-10-08 12:43:28 -0700681 const uint8_t* addr = begin_ + class_def.interfaces_off_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700682 return reinterpret_cast<const TypeList*>(addr);
683 }
684 }
685
Ian Rogers0571d352011-11-03 19:51:38 -0700686 // Returns a pointer to the raw memory mapped class_data_item
Ian Rogers13735952014-10-08 12:43:28 -0700687 const uint8_t* GetClassData(const ClassDef& class_def) const {
Ian Rogers0571d352011-11-03 19:51:38 -0700688 if (class_def.class_data_off_ == 0) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700689 return nullptr;
Ian Rogers0571d352011-11-03 19:51:38 -0700690 } else {
Ian Rogers30fab402012-01-23 15:43:46 -0800691 return begin_ + class_def.class_data_off_;
Ian Rogers0571d352011-11-03 19:51:38 -0700692 }
Shih-wei Liao2fb97532011-08-11 16:17:23 -0700693 }
694
Ian Rogers0571d352011-11-03 19:51:38 -0700695 //
Ian Rogers6d4d9fc2011-11-30 16:24:48 -0800696 const CodeItem* GetCodeItem(const uint32_t code_off) const {
Alex Light9139e002015-10-09 15:59:48 -0700697 DCHECK_LT(code_off, size_) << "Code item offset larger then maximum allowed offset";
Ian Rogers6d4d9fc2011-11-30 16:24:48 -0800698 if (code_off == 0) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700699 return nullptr; // native or abstract method
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700700 } else {
Ian Rogers13735952014-10-08 12:43:28 -0700701 const uint8_t* addr = begin_ + code_off;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700702 return reinterpret_cast<const CodeItem*>(addr);
703 }
704 }
705
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100706 const char* GetReturnTypeDescriptor(const ProtoId& proto_id) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700707
708 // Returns the number of prototype identifiers in the .dex file.
709 size_t NumProtoIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700710 DCHECK(header_ != nullptr) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700711 return header_->proto_ids_size_;
712 }
713
714 // Returns the ProtoId at the specified index.
Andreas Gampea5b09a62016-11-17 15:21:22 -0800715 const ProtoId& GetProtoId(uint16_t idx) const {
Ian Rogers4f6ad8a2013-03-18 15:27:28 -0700716 DCHECK_LT(idx, NumProtoIds()) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700717 return proto_ids_[idx];
718 }
719
720 uint16_t GetIndexForProtoId(const ProtoId& proto_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800721 CHECK_GE(&proto_id, proto_ids_) << GetLocation();
722 CHECK_LT(&proto_id, proto_ids_ + header_->proto_ids_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700723 return &proto_id - proto_ids_;
724 }
725
726 // Looks up a proto id for a given return type and signature type list
Andreas Gampea5b09a62016-11-17 15:21:22 -0800727 const ProtoId* FindProtoId(dex::TypeIndex return_type_idx,
728 const dex::TypeIndex* signature_type_idxs,
729 uint32_t signature_length) const;
730 const ProtoId* FindProtoId(dex::TypeIndex return_type_idx,
731 const std::vector<dex::TypeIndex>& signature_type_idxs) const {
Vladimir Marko5c96e6b2013-11-14 15:34:17 +0000732 return FindProtoId(return_type_idx, &signature_type_idxs[0], signature_type_idxs.size());
733 }
Ian Rogers0571d352011-11-03 19:51:38 -0700734
735 // Given a signature place the type ids into the given vector, returns true on success
Andreas Gampea5b09a62016-11-17 15:21:22 -0800736 bool CreateTypeList(const StringPiece& signature,
737 dex::TypeIndex* return_type_idx,
738 std::vector<dex::TypeIndex>* param_type_idxs) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700739
Ian Rogersd91d6d62013-09-25 20:26:14 -0700740 // Create a Signature from the given string signature or return Signature::NoSignature if not
741 // possible.
742 const Signature CreateSignature(const StringPiece& signature) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700743
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700744 // Returns the short form method descriptor for the given prototype.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100745 const char* GetShorty(uint32_t proto_idx) const;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700746
747 const TypeList* GetProtoParameters(const ProtoId& proto_id) const {
748 if (proto_id.parameters_off_ == 0) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700749 return nullptr;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700750 } else {
Ian Rogers13735952014-10-08 12:43:28 -0700751 const uint8_t* addr = begin_ + proto_id.parameters_off_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700752 return reinterpret_cast<const TypeList*>(addr);
753 }
754 }
755
Ian Rogers13735952014-10-08 12:43:28 -0700756 const uint8_t* GetEncodedStaticFieldValuesArray(const ClassDef& class_def) const {
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700757 if (class_def.static_values_off_ == 0) {
758 return 0;
759 } else {
Ian Rogers30fab402012-01-23 15:43:46 -0800760 return begin_ + class_def.static_values_off_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700761 }
762 }
763
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800764 static const TryItem* GetTryItems(const CodeItem& code_item, uint32_t offset);
Shih-wei Liao2fb97532011-08-11 16:17:23 -0700765
766 // Get the base of the encoded data for the given DexCode.
Ian Rogers13735952014-10-08 12:43:28 -0700767 static const uint8_t* GetCatchHandlerData(const CodeItem& code_item, uint32_t offset) {
768 const uint8_t* handler_data =
769 reinterpret_cast<const uint8_t*>(GetTryItems(code_item, code_item.tries_size_));
Shih-wei Liao2fb97532011-08-11 16:17:23 -0700770 return handler_data + offset;
771 }
772
Ian Rogersdbbc99d2013-04-18 16:51:54 -0700773 // Find which try region is associated with the given address (ie dex pc). Returns -1 if none.
774 static int32_t FindTryItem(const CodeItem &code_item, uint32_t address);
775
776 // Find the handler offset associated with the given address (ie dex pc). Returns -1 if none.
777 static int32_t FindCatchHandlerOffset(const CodeItem &code_item, uint32_t address);
Shih-wei Liao2fb97532011-08-11 16:17:23 -0700778
Shih-wei Liao195487c2011-08-20 13:29:04 -0700779 // Get the pointer to the start of the debugging data
Ian Rogers13735952014-10-08 12:43:28 -0700780 const uint8_t* GetDebugInfoStream(const CodeItem* code_item) const {
David Srbecky68529422015-07-07 19:13:29 +0100781 // Check that the offset is in bounds.
782 // Note that although the specification says that 0 should be used if there
783 // is no debug information, some applications incorrectly use 0xFFFFFFFF.
784 if (code_item->debug_info_off_ == 0 || code_item->debug_info_off_ >= size_) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700785 return nullptr;
Shih-wei Liao195487c2011-08-20 13:29:04 -0700786 } else {
Ian Rogers30fab402012-01-23 15:43:46 -0800787 return begin_ + code_item->debug_info_off_;
Shih-wei Liao195487c2011-08-20 13:29:04 -0700788 }
789 }
790
// One entry of the position table; passed to DexDebugNewPositionCb.
// A default-constructed entry has every field zeroed / null / false.
struct PositionInfo {
  PositionInfo() = default;

  uint32_t address_ = 0;                // In 16-bit code units.
  uint32_t line_ = 0;                   // Source code line number starting at 1.
  const char* source_file_ = nullptr;   // nullptr if the file from ClassDef still applies.
  bool prologue_end_ = false;
  bool epilogue_begin_ = false;
};
806
Shih-wei Liao195487c2011-08-20 13:29:04 -0700807 // Callback for "new position table entry".
808 // Returning true causes the decoder to stop early.
David Srbeckyb06e28e2015-12-10 13:15:00 +0000809 typedef bool (*DexDebugNewPositionCb)(void* context, const PositionInfo& entry);
Shih-wei Liao195487c2011-08-20 13:29:04 -0700810
// One entry of the locals table; passed to DexDebugNewLocalCb.
// A default-constructed entry has every field zeroed / null / false.
struct LocalInfo {
  LocalInfo() = default;

  const char* name_ = nullptr;        // E.g., list.  It can be nullptr if unknown.
  const char* descriptor_ = nullptr;  // E.g., Ljava/util/LinkedList;
  const char* signature_ = nullptr;   // E.g., java.util.LinkedList<java.lang.Integer>
  uint32_t start_address_ = 0;        // PC location where the local is first defined.
  uint32_t end_address_ = 0;          // PC location where the local is no longer defined.
  uint16_t reg_ = 0;                  // Dex register which stores the values.
  bool is_live_ = false;              // Is the local defined and live.
};
830
831 // Callback for "new locals table entry".
832 typedef void (*DexDebugNewLocalCb)(void* context, const LocalInfo& entry);
833
834 static bool LineNumForPcCb(void* context, const PositionInfo& entry);
Shih-wei Liao195487c2011-08-20 13:29:04 -0700835
Jeff Hao13e748b2015-08-25 20:44:19 +0000836 const AnnotationsDirectoryItem* GetAnnotationsDirectory(const ClassDef& class_def) const {
837 if (class_def.annotations_off_ == 0) {
838 return nullptr;
839 } else {
840 return reinterpret_cast<const AnnotationsDirectoryItem*>(begin_ + class_def.annotations_off_);
841 }
842 }
843
844 const AnnotationSetItem* GetClassAnnotationSet(const AnnotationsDirectoryItem* anno_dir) const {
845 if (anno_dir->class_annotations_off_ == 0) {
846 return nullptr;
847 } else {
848 return reinterpret_cast<const AnnotationSetItem*>(begin_ + anno_dir->class_annotations_off_);
849 }
850 }
851
852 const FieldAnnotationsItem* GetFieldAnnotations(const AnnotationsDirectoryItem* anno_dir) const {
853 if (anno_dir->fields_size_ == 0) {
854 return nullptr;
855 } else {
856 return reinterpret_cast<const FieldAnnotationsItem*>(&anno_dir[1]);
857 }
858 }
859
860 const MethodAnnotationsItem* GetMethodAnnotations(const AnnotationsDirectoryItem* anno_dir)
861 const {
862 if (anno_dir->methods_size_ == 0) {
863 return nullptr;
864 } else {
865 // Skip past the header and field annotations.
866 const uint8_t* addr = reinterpret_cast<const uint8_t*>(&anno_dir[1]);
867 addr += anno_dir->fields_size_ * sizeof(FieldAnnotationsItem);
868 return reinterpret_cast<const MethodAnnotationsItem*>(addr);
869 }
870 }
871
872 const ParameterAnnotationsItem* GetParameterAnnotations(const AnnotationsDirectoryItem* anno_dir)
873 const {
874 if (anno_dir->parameters_size_ == 0) {
875 return nullptr;
876 } else {
877 // Skip past the header, field annotations, and method annotations.
878 const uint8_t* addr = reinterpret_cast<const uint8_t*>(&anno_dir[1]);
879 addr += anno_dir->fields_size_ * sizeof(FieldAnnotationsItem);
880 addr += anno_dir->methods_size_ * sizeof(MethodAnnotationsItem);
881 return reinterpret_cast<const ParameterAnnotationsItem*>(addr);
882 }
883 }
884
885 const AnnotationSetItem* GetFieldAnnotationSetItem(const FieldAnnotationsItem& anno_item) const {
886 uint32_t offset = anno_item.annotations_off_;
887 if (offset == 0) {
888 return nullptr;
889 } else {
890 return reinterpret_cast<const AnnotationSetItem*>(begin_ + offset);
891 }
892 }
893
894 const AnnotationSetItem* GetMethodAnnotationSetItem(const MethodAnnotationsItem& anno_item)
895 const {
896 uint32_t offset = anno_item.annotations_off_;
897 if (offset == 0) {
898 return nullptr;
899 } else {
900 return reinterpret_cast<const AnnotationSetItem*>(begin_ + offset);
901 }
902 }
903
904 const AnnotationSetRefList* GetParameterAnnotationSetRefList(
905 const ParameterAnnotationsItem* anno_item) const {
906 uint32_t offset = anno_item->annotations_off_;
907 if (offset == 0) {
908 return nullptr;
909 }
910 return reinterpret_cast<const AnnotationSetRefList*>(begin_ + offset);
911 }
912
913 const AnnotationItem* GetAnnotationItem(const AnnotationSetItem* set_item, uint32_t index) const {
914 DCHECK_LE(index, set_item->size_);
915 uint32_t offset = set_item->entries_[index];
916 if (offset == 0) {
917 return nullptr;
918 } else {
919 return reinterpret_cast<const AnnotationItem*>(begin_ + offset);
920 }
921 }
922
923 const AnnotationSetItem* GetSetRefItemItem(const AnnotationSetRefItem* anno_item) const {
924 uint32_t offset = anno_item->annotations_off_;
925 if (offset == 0) {
926 return nullptr;
927 }
928 return reinterpret_cast<const AnnotationSetItem*>(begin_ + offset);
929 }
930
// Debug info opcodes and constants (values as laid out in the DEX debug_info_item format).
enum {
  // Opcodes 0x00 - 0x09.
  DBG_END_SEQUENCE         = 0x00,
  DBG_ADVANCE_PC           = 0x01,
  DBG_ADVANCE_LINE         = 0x02,
  DBG_START_LOCAL          = 0x03,
  DBG_START_LOCAL_EXTENDED = 0x04,
  DBG_END_LOCAL            = 0x05,
  DBG_RESTART_LOCAL        = 0x06,
  DBG_SET_PROLOGUE_END     = 0x07,
  DBG_SET_EPILOGUE_BEGIN   = 0x08,
  DBG_SET_FILE             = 0x09,

  // First opcode value of the "special" range.
  DBG_FIRST_SPECIAL        = 0x0a,

  // Line delta constants; note that DBG_LINE_BASE is negative.
  DBG_LINE_BASE            = -4,
  DBG_LINE_RANGE           = 15,
};
947
Shih-wei Liao195487c2011-08-20 13:29:04 -0700948 struct LineNumFromPcContext {
Ian Rogersca190662012-06-26 15:45:57 -0700949 LineNumFromPcContext(uint32_t address, uint32_t line_num)
950 : address_(address), line_num_(line_num) {}
Shih-wei Liao195487c2011-08-20 13:29:04 -0700951 uint32_t address_;
952 uint32_t line_num_;
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700953 private:
954 DISALLOW_COPY_AND_ASSIGN(LineNumFromPcContext);
Shih-wei Liao195487c2011-08-20 13:29:04 -0700955 };
956
Roland Levillain91d65e02016-01-19 15:59:16 +0000957 // Returns false if there is no debugging information or if it cannot be decoded.
David Srbeckyb06e28e2015-12-10 13:15:00 +0000958 bool DecodeDebugLocalInfo(const CodeItem* code_item, bool is_static, uint32_t method_idx,
959 DexDebugNewLocalCb local_cb, void* context) const;
960
Roland Levillain91d65e02016-01-19 15:59:16 +0000961 // Returns false if there is no debugging information or if it cannot be decoded.
David Srbeckyb06e28e2015-12-10 13:15:00 +0000962 bool DecodeDebugPositionInfo(const CodeItem* code_item, DexDebugNewPositionCb position_cb,
963 void* context) const;
Shih-wei Liao195487c2011-08-20 13:29:04 -0700964
Ian Rogers0571d352011-11-03 19:51:38 -0700965 const char* GetSourceFile(const ClassDef& class_def) const {
Andreas Gampe8a0128a2016-11-28 07:38:35 -0800966 if (!class_def.source_file_idx_.IsValid()) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700967 return nullptr;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700968 } else {
Ian Rogers0571d352011-11-03 19:51:38 -0700969 return StringDataByIdx(class_def.source_file_idx_);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700970 }
Carl Shapiro0e5d75d2011-07-06 18:28:37 -0700971 }
972
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800973 int GetPermissions() const;
Ian Rogers1c849e52012-06-28 14:00:33 -0700974
Sebastien Hertz2d6ba512013-05-17 11:31:37 +0200975 bool IsReadOnly() const;
976
Brian Carlstrome0948e12013-08-29 09:36:15 -0700977 bool EnableWrite() const;
Sebastien Hertz2d6ba512013-05-17 11:31:37 +0200978
Brian Carlstrome0948e12013-08-29 09:36:15 -0700979 bool DisableWrite() const;
Sebastien Hertz2d6ba512013-05-17 11:31:37 +0200980
Ian Rogers13735952014-10-08 12:43:28 -0700981 const uint8_t* Begin() const {
Ian Rogers8b2c0b92013-09-19 02:56:49 -0700982 return begin_;
983 }
984
985 size_t Size() const {
986 return size_;
987 }
988
Andreas Gampe90e34042015-04-27 20:01:52 -0700989 // Return the name of the index-th classes.dex in a multidex zip file. This is classes.dex for
990 // index == 0, and classes{index + 1}.dex else.
991 static std::string GetMultiDexClassesDexName(size_t index);
992
993 // Return the (possibly synthetic) dex location for a multidex entry. This is dex_location for
994 // index == 0, and dex_location + multi-dex-separator + GetMultiDexClassesDexName(index) else.
995 static std::string GetMultiDexLocation(size_t index, const char* dex_location);
Calin Juravle4e1d5792014-07-15 23:56:47 +0100996
997 // Returns the canonical form of the given dex location.
998 //
999 // There are different flavors of "dex locations" as follows:
1000 // the file name of a dex file:
1001 // The actual file path that the dex file has on disk.
1002 // dex_location:
1003 // This acts as a key for the class linker to know which dex file to load.
1004 // It may correspond to either an old odex file or a particular dex file
1005 // inside an oat file. In the first case it will also match the file name
1006 // of the dex file. In the second case (oat) it will include the file name
1007 // and possibly some multidex annotation to uniquely identify it.
1008 // canonical_dex_location:
  //     the dex_location where its file name part has been made canonical.
1010 static std::string GetDexCanonicalLocation(const char* dex_location);
1011
Richard Uhler07b3c232015-03-31 15:57:54 -07001012 const OatDexFile* GetOatDexFile() const {
1013 return oat_dex_file_;
Andreas Gampefd9eb392014-11-06 16:52:58 -08001014 }
1015
Mathieu Chartier1b868492016-11-16 16:22:37 -08001016 // Used by oat writer.
1017 void SetOatDexFile(OatDexFile* oat_dex_file) const {
1018 oat_dex_file_ = oat_dex_file;
1019 }
1020
David Sehr9323e6e2016-09-13 08:58:35 -07001021 // Utility methods for reading integral values from a buffer.
1022 static int32_t ReadSignedInt(const uint8_t* ptr, int zwidth);
1023 static uint32_t ReadUnsignedInt(const uint8_t* ptr, int zwidth, bool fill_on_right);
1024 static int64_t ReadSignedLong(const uint8_t* ptr, int zwidth);
1025 static uint64_t ReadUnsignedLong(const uint8_t* ptr, int zwidth, bool fill_on_right);
1026
David Sehr709b0702016-10-13 09:12:37 -07001027 // Returns a human-readable form of the method at an index.
1028 std::string PrettyMethod(uint32_t method_idx, bool with_signature = true) const;
1029 // Returns a human-readable form of the field at an index.
1030 std::string PrettyField(uint32_t field_idx, bool with_type = true) const;
1031 // Returns a human-readable form of the type at an index.
Andreas Gampea5b09a62016-11-17 15:21:22 -08001032 std::string PrettyType(dex::TypeIndex type_idx) const;
David Sehr709b0702016-10-13 09:12:37 -07001033
Carl Shapiro1fb86202011-06-27 17:43:13 -07001034 private:
Aart Bik37d6a3b2016-06-21 18:30:10 -07001035 static std::unique_ptr<const DexFile> OpenFile(int fd,
David Sehr733ddb22016-09-19 15:02:18 -07001036 const std::string& location,
Aart Bik37d6a3b2016-06-21 18:30:10 -07001037 bool verify,
1038 bool verify_checksum,
1039 std::string* error_msg);
Brian Carlstrom58ae9412011-10-04 00:56:06 -07001040
// Error codes reported through the error_code out-parameter of OpenOneDexFileFromZip.
enum class ZipOpenErrorCode {  // private
  kNoError,
  kEntryNotFound,
  kExtractToMemoryError,
  kDexFileError,
  kMakeReadOnlyError,
  kVerifyError,
};
1049
David Sehr733ddb22016-09-19 15:02:18 -07001050 // Open all classesXXX.dex files from a zip archive.
1051 static bool OpenAllDexFilesFromZip(const ZipArchive& zip_archive,
1052 const std::string& location,
1053 bool verify_checksum,
1054 std::string* error_msg,
1055 std::vector<std::unique_ptr<const DexFile>>* dex_files);
1056
Mathieu Chartier2cebb242015-04-21 16:50:40 -07001057 // Opens .dex file from the entry_name in a zip archive. error_code is undefined when non-null
Andreas Gampe833a4852014-05-21 18:46:59 -07001058 // return.
David Sehr733ddb22016-09-19 15:02:18 -07001059 static std::unique_ptr<const DexFile> OpenOneDexFileFromZip(const ZipArchive& zip_archive,
1060 const char* entry_name,
1061 const std::string& location,
1062 bool verify_checksum,
1063 std::string* error_msg,
1064 ZipOpenErrorCode* error_code);
1065
// Verification outcome reported through the optional verify_result out-parameter of OpenCommon.
enum class VerifyResult {  // private
  kVerifyNotAttempted,
  kVerifySucceeded,
  kVerifyFailed,
};
1071
1072 static std::unique_ptr<DexFile> OpenCommon(const uint8_t* base,
1073 size_t size,
Aart Bik37d6a3b2016-06-21 18:30:10 -07001074 const std::string& location,
David Sehr733ddb22016-09-19 15:02:18 -07001075 uint32_t location_checksum,
1076 const OatDexFile* oat_dex_file,
1077 bool verify,
Aart Bik37d6a3b2016-06-21 18:30:10 -07001078 bool verify_checksum,
1079 std::string* error_msg,
David Sehr733ddb22016-09-19 15:02:18 -07001080 VerifyResult* verify_result = nullptr);
Brian Carlstrom58ae9412011-10-04 00:56:06 -07001081
Alex Light9c20a142016-08-23 15:05:12 -07001082
1083 // Opens a .dex file at the given address, optionally backed by a MemMap
1084 static std::unique_ptr<const DexFile> OpenMemory(const uint8_t* dex_file,
1085 size_t size,
1086 const std::string& location,
1087 uint32_t location_checksum,
1088 std::unique_ptr<MemMap> mem_map,
1089 const OatDexFile* oat_dex_file,
1090 std::string* error_msg);
1091
David Sehr733ddb22016-09-19 15:02:18 -07001092 DexFile(const uint8_t* base,
1093 size_t size,
Brian Carlstrom28db0122012-10-18 16:20:41 -07001094 const std::string& location,
1095 uint32_t location_checksum,
Richard Uhler07b3c232015-03-31 15:57:54 -07001096 const OatDexFile* oat_dex_file);
jeffhaof6174e82012-01-31 16:14:17 -08001097
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001098 // Top-level initializer that calls other Init methods.
Ian Rogers8d31bbd2013-10-13 10:44:14 -07001099 bool Init(std::string* error_msg);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001100
Brian Carlstrom6e3b1d92012-01-11 01:36:32 -08001101 // Returns true if the header magic and version numbers are of the expected values.
Ian Rogers8d31bbd2013-10-13 10:44:14 -07001102 bool CheckMagicAndVersion(std::string* error_msg) const;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001103
Andreas Gampe833a4852014-05-21 18:46:59 -07001104 // Check whether a location denotes a multidex dex file. This is a very simple check: returns
1105 // whether the string contains the separator character.
1106 static bool IsMultiDexLocation(const char* location);
1107
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001108 // The base address of the memory mapping.
Ian Rogers13735952014-10-08 12:43:28 -07001109 const uint8_t* const begin_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001110
1111 // The size of the underlying memory allocation in bytes.
Ian Rogers62d6c772013-02-27 08:32:07 -08001112 const size_t size_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001113
Elliott Hughes64bf5a32011-09-20 14:43:12 -07001114 // Typically the dex file name when available, alternatively some identifying string.
Brian Carlstroma663ea52011-08-19 23:33:41 -07001115 //
1116 // The ClassLinker will use this to match DexFiles the boot class
1117 // path to DexCache::GetLocation when loading from an image.
1118 const std::string location_;
1119
Brian Carlstrom5b332c82012-02-01 15:02:31 -08001120 const uint32_t location_checksum_;
1121
Brian Carlstrom33f741e2011-10-03 11:24:05 -07001122 // Manages the underlying memory allocation.
Ian Rogers700a4022014-05-19 16:49:03 -07001123 std::unique_ptr<MemMap> mem_map_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001124
1125 // Points to the header section.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001126 const Header* const header_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001127
1128 // Points to the base of the string identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001129 const StringId* const string_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001130
1131 // Points to the base of the type identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001132 const TypeId* const type_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001133
1134 // Points to the base of the field identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001135 const FieldId* const field_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001136
1137 // Points to the base of the method identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001138 const MethodId* const method_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001139
1140 // Points to the base of the prototype identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001141 const ProtoId* const proto_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001142
1143 // Points to the base of the class definition list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001144 const ClassDef* const class_defs_;
Ian Rogers68b56852014-08-29 20:19:11 -07001145
Richard Uhler07b3c232015-03-31 15:57:54 -07001146 // If this dex file was loaded from an oat file, oat_dex_file_ contains a
1147 // pointer to the OatDexFile it was loaded from. Otherwise oat_dex_file_ is
1148 // null.
Mathieu Chartier1b868492016-11-16 16:22:37 -08001149 mutable const OatDexFile* oat_dex_file_;
Andreas Gampee6215c02015-08-31 18:54:38 -07001150
1151 friend class DexFileVerifierTest;
Mathieu Chartier1b868492016-11-16 16:22:37 -08001152 friend class OatWriter;
Mathieu Chartier76172162016-01-26 14:54:06 -08001153 ART_FRIEND_TEST(ClassLinkerTest, RegisterDexFileName); // for constructor
Carl Shapiro1fb86202011-06-27 17:43:13 -07001154};
Mathieu Chartiere5f13e52015-02-24 09:37:21 -08001155
1156struct DexFileReference {
1157 DexFileReference(const DexFile* file, uint32_t idx) : dex_file(file), index(idx) { }
1158 const DexFile* dex_file;
1159 uint32_t index;
1160};
1161
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001162std::ostream& operator<<(std::ostream& os, const DexFile& dex_file);
Carl Shapiro1fb86202011-06-27 17:43:13 -07001163
Ian Rogers0571d352011-11-03 19:51:38 -07001164// Iterate over a dex file's ProtoId's paramters
1165class DexFileParameterIterator {
1166 public:
1167 DexFileParameterIterator(const DexFile& dex_file, const DexFile::ProtoId& proto_id)
1168 : dex_file_(dex_file), size_(0), pos_(0) {
1169 type_list_ = dex_file_.GetProtoParameters(proto_id);
Mathieu Chartier2cebb242015-04-21 16:50:40 -07001170 if (type_list_ != nullptr) {
Ian Rogers0571d352011-11-03 19:51:38 -07001171 size_ = type_list_->Size();
1172 }
1173 }
1174 bool HasNext() const { return pos_ < size_; }
David Srbeckyb06e28e2015-12-10 13:15:00 +00001175 size_t Size() const { return size_; }
Ian Rogers0571d352011-11-03 19:51:38 -07001176 void Next() { ++pos_; }
Andreas Gampea5b09a62016-11-17 15:21:22 -08001177 dex::TypeIndex GetTypeIdx() {
Ian Rogers0571d352011-11-03 19:51:38 -07001178 return type_list_->GetTypeItem(pos_).type_idx_;
1179 }
1180 const char* GetDescriptor() {
Andreas Gampea5b09a62016-11-17 15:21:22 -08001181 return dex_file_.StringByTypeIdx(dex::TypeIndex(GetTypeIdx()));
Ian Rogers0571d352011-11-03 19:51:38 -07001182 }
1183 private:
1184 const DexFile& dex_file_;
1185 const DexFile::TypeList* type_list_;
1186 uint32_t size_;
1187 uint32_t pos_;
1188 DISALLOW_IMPLICIT_CONSTRUCTORS(DexFileParameterIterator);
1189};
1190
Ian Rogersd91d6d62013-09-25 20:26:14 -07001191// Abstract the signature of a method.
Ian Rogers03b6eaf2014-10-28 09:34:57 -07001192class Signature : public ValueObject {
Ian Rogersd91d6d62013-09-25 20:26:14 -07001193 public:
1194 std::string ToString() const;
1195
1196 static Signature NoSignature() {
1197 return Signature();
1198 }
1199
Orion Hodson6c4921b2016-09-21 15:41:06 +01001200 bool IsVoid() const;
1201 uint32_t GetNumberOfParameters() const;
1202
Ian Rogersdfb325e2013-10-30 01:00:44 -07001203 bool operator==(const Signature& rhs) const;
Ian Rogersd91d6d62013-09-25 20:26:14 -07001204 bool operator!=(const Signature& rhs) const {
1205 return !(*this == rhs);
1206 }
1207
Vladimir Markod9cffea2013-11-25 15:08:02 +00001208 bool operator==(const StringPiece& rhs) const;
Ian Rogersd91d6d62013-09-25 20:26:14 -07001209
1210 private:
1211 Signature(const DexFile* dex, const DexFile::ProtoId& proto) : dex_file_(dex), proto_id_(&proto) {
1212 }
1213
1214 Signature() : dex_file_(nullptr), proto_id_(nullptr) {
1215 }
1216
1217 friend class DexFile;
1218
1219 const DexFile* const dex_file_;
1220 const DexFile::ProtoId* const proto_id_;
1221};
1222std::ostream& operator<<(std::ostream& os, const Signature& sig);
1223
Ian Rogers0571d352011-11-03 19:51:38 -07001224// Iterate and decode class_data_item
1225class ClassDataItemIterator {
1226 public:
Ian Rogers13735952014-10-08 12:43:28 -07001227 ClassDataItemIterator(const DexFile& dex_file, const uint8_t* raw_class_data_item)
Ian Rogers0571d352011-11-03 19:51:38 -07001228 : dex_file_(dex_file), pos_(0), ptr_pos_(raw_class_data_item), last_idx_(0) {
1229 ReadClassDataHeader();
1230 if (EndOfInstanceFieldsPos() > 0) {
1231 ReadClassDataField();
1232 } else if (EndOfVirtualMethodsPos() > 0) {
1233 ReadClassDataMethod();
1234 }
1235 }
1236 uint32_t NumStaticFields() const {
1237 return header_.static_fields_size_;
1238 }
1239 uint32_t NumInstanceFields() const {
1240 return header_.instance_fields_size_;
1241 }
1242 uint32_t NumDirectMethods() const {
1243 return header_.direct_methods_size_;
1244 }
1245 uint32_t NumVirtualMethods() const {
1246 return header_.virtual_methods_size_;
1247 }
1248 bool HasNextStaticField() const {
1249 return pos_ < EndOfStaticFieldsPos();
1250 }
1251 bool HasNextInstanceField() const {
1252 return pos_ >= EndOfStaticFieldsPos() && pos_ < EndOfInstanceFieldsPos();
1253 }
1254 bool HasNextDirectMethod() const {
1255 return pos_ >= EndOfInstanceFieldsPos() && pos_ < EndOfDirectMethodsPos();
1256 }
1257 bool HasNextVirtualMethod() const {
1258 return pos_ >= EndOfDirectMethodsPos() && pos_ < EndOfVirtualMethodsPos();
1259 }
1260 bool HasNext() const {
1261 return pos_ < EndOfVirtualMethodsPos();
1262 }
Ian Rogers637c65b2013-05-31 11:46:00 -07001263 inline void Next() {
Ian Rogers0571d352011-11-03 19:51:38 -07001264 pos_++;
1265 if (pos_ < EndOfStaticFieldsPos()) {
1266 last_idx_ = GetMemberIndex();
1267 ReadClassDataField();
1268 } else if (pos_ == EndOfStaticFieldsPos() && NumInstanceFields() > 0) {
1269 last_idx_ = 0; // transition to next array, reset last index
1270 ReadClassDataField();
1271 } else if (pos_ < EndOfInstanceFieldsPos()) {
1272 last_idx_ = GetMemberIndex();
1273 ReadClassDataField();
1274 } else if (pos_ == EndOfInstanceFieldsPos() && NumDirectMethods() > 0) {
1275 last_idx_ = 0; // transition to next array, reset last index
1276 ReadClassDataMethod();
1277 } else if (pos_ < EndOfDirectMethodsPos()) {
1278 last_idx_ = GetMemberIndex();
1279 ReadClassDataMethod();
1280 } else if (pos_ == EndOfDirectMethodsPos() && NumVirtualMethods() > 0) {
1281 last_idx_ = 0; // transition to next array, reset last index
1282 ReadClassDataMethod();
1283 } else if (pos_ < EndOfVirtualMethodsPos()) {
1284 last_idx_ = GetMemberIndex();
1285 ReadClassDataMethod();
1286 } else {
1287 DCHECK(!HasNext());
1288 }
1289 }
1290 uint32_t GetMemberIndex() const {
1291 if (pos_ < EndOfInstanceFieldsPos()) {
1292 return last_idx_ + field_.field_idx_delta_;
1293 } else {
Sebastien Hertzb24bd992013-08-02 15:19:09 +02001294 DCHECK_LT(pos_, EndOfVirtualMethodsPos());
Ian Rogers0571d352011-11-03 19:51:38 -07001295 return last_idx_ + method_.method_idx_delta_;
1296 }
1297 }
Andreas Gampe51829322014-08-25 15:05:04 -07001298 uint32_t GetRawMemberAccessFlags() const {
Ian Rogers0571d352011-11-03 19:51:38 -07001299 if (pos_ < EndOfInstanceFieldsPos()) {
1300 return field_.access_flags_;
1301 } else {
Sebastien Hertzb24bd992013-08-02 15:19:09 +02001302 DCHECK_LT(pos_, EndOfVirtualMethodsPos());
Ian Rogers0571d352011-11-03 19:51:38 -07001303 return method_.access_flags_;
1304 }
1305 }
Andreas Gampe51829322014-08-25 15:05:04 -07001306 uint32_t GetFieldAccessFlags() const {
1307 return GetRawMemberAccessFlags() & kAccValidFieldFlags;
1308 }
1309 uint32_t GetMethodAccessFlags() const {
1310 return GetRawMemberAccessFlags() & kAccValidMethodFlags;
1311 }
1312 bool MemberIsNative() const {
1313 return GetRawMemberAccessFlags() & kAccNative;
1314 }
1315 bool MemberIsFinal() const {
1316 return GetRawMemberAccessFlags() & kAccFinal;
1317 }
Ian Rogers08f753d2012-08-24 14:35:25 -07001318 InvokeType GetMethodInvokeType(const DexFile::ClassDef& class_def) const {
1319 if (HasNextDirectMethod()) {
Andreas Gampe51829322014-08-25 15:05:04 -07001320 if ((GetRawMemberAccessFlags() & kAccStatic) != 0) {
Ian Rogers08f753d2012-08-24 14:35:25 -07001321 return kStatic;
1322 } else {
1323 return kDirect;
1324 }
1325 } else {
Andreas Gampe51829322014-08-25 15:05:04 -07001326 DCHECK_EQ(GetRawMemberAccessFlags() & kAccStatic, 0U);
Ian Rogers08f753d2012-08-24 14:35:25 -07001327 if ((class_def.access_flags_ & kAccInterface) != 0) {
1328 return kInterface;
Andreas Gampe51829322014-08-25 15:05:04 -07001329 } else if ((GetRawMemberAccessFlags() & kAccConstructor) != 0) {
Ian Rogers08f753d2012-08-24 14:35:25 -07001330 return kSuper;
1331 } else {
1332 return kVirtual;
1333 }
1334 }
1335 }
Ian Rogers0571d352011-11-03 19:51:38 -07001336 const DexFile::CodeItem* GetMethodCodeItem() const {
1337 return dex_file_.GetCodeItem(method_.code_off_);
1338 }
1339 uint32_t GetMethodCodeItemOffset() const {
1340 return method_.code_off_;
1341 }
Andreas Gampee6215c02015-08-31 18:54:38 -07001342 const uint8_t* DataPointer() const {
1343 return ptr_pos_;
1344 }
Ian Rogers13735952014-10-08 12:43:28 -07001345 const uint8_t* EndDataPointer() const {
jeffhao10037c82012-01-23 15:06:23 -08001346 CHECK(!HasNext());
1347 return ptr_pos_;
1348 }
Elliott Hughesa21039c2012-06-21 12:09:25 -07001349
Ian Rogers0571d352011-11-03 19:51:38 -07001350 private:
1351 // A dex file's class_data_item is leb128 encoded, this structure holds a decoded form of the
1352 // header for a class_data_item
1353 struct ClassDataHeader {
1354 uint32_t static_fields_size_; // the number of static fields
1355 uint32_t instance_fields_size_; // the number of instance fields
1356 uint32_t direct_methods_size_; // the number of direct methods
1357 uint32_t virtual_methods_size_; // the number of virtual methods
1358 } header_;
1359
1360 // Read and decode header from a class_data_item stream into header
1361 void ReadClassDataHeader();
1362
1363 uint32_t EndOfStaticFieldsPos() const {
1364 return header_.static_fields_size_;
1365 }
1366 uint32_t EndOfInstanceFieldsPos() const {
1367 return EndOfStaticFieldsPos() + header_.instance_fields_size_;
1368 }
1369 uint32_t EndOfDirectMethodsPos() const {
1370 return EndOfInstanceFieldsPos() + header_.direct_methods_size_;
1371 }
1372 uint32_t EndOfVirtualMethodsPos() const {
1373 return EndOfDirectMethodsPos() + header_.virtual_methods_size_;
1374 }
1375
1376 // A decoded version of the field of a class_data_item
1377 struct ClassDataField {
1378 uint32_t field_idx_delta_; // delta of index into the field_ids array for FieldId
1379 uint32_t access_flags_; // access flags for the field
1380 ClassDataField() : field_idx_delta_(0), access_flags_(0) {}
Elliott Hughesa21039c2012-06-21 12:09:25 -07001381
Ian Rogers0571d352011-11-03 19:51:38 -07001382 private:
1383 DISALLOW_COPY_AND_ASSIGN(ClassDataField);
Elliott Hughesee0fa762012-03-26 17:12:41 -07001384 };
1385 ClassDataField field_;
Ian Rogers0571d352011-11-03 19:51:38 -07001386
1387 // Read and decode a field from a class_data_item stream into field
1388 void ReadClassDataField();
1389
1390 // A decoded version of the method of a class_data_item
1391 struct ClassDataMethod {
1392 uint32_t method_idx_delta_; // delta of index into the method_ids array for MethodId
1393 uint32_t access_flags_;
1394 uint32_t code_off_;
1395 ClassDataMethod() : method_idx_delta_(0), access_flags_(0), code_off_(0) {}
Elliott Hughesa21039c2012-06-21 12:09:25 -07001396
Ian Rogers0571d352011-11-03 19:51:38 -07001397 private:
1398 DISALLOW_COPY_AND_ASSIGN(ClassDataMethod);
Elliott Hughesee0fa762012-03-26 17:12:41 -07001399 };
1400 ClassDataMethod method_;
Ian Rogers0571d352011-11-03 19:51:38 -07001401
1402 // Read and decode a method from a class_data_item stream into method
1403 void ReadClassDataMethod();
1404
1405 const DexFile& dex_file_;
1406 size_t pos_; // integral number of items passed
Ian Rogers13735952014-10-08 12:43:28 -07001407 const uint8_t* ptr_pos_; // pointer into stream of class_data_item
Ian Rogers0571d352011-11-03 19:51:38 -07001408 uint32_t last_idx_; // last read field or method index to apply delta to
1409 DISALLOW_IMPLICIT_CONSTRUCTORS(ClassDataItemIterator);
1410};
1411
Ian Rogers0571d352011-11-03 19:51:38 -07001412class EncodedStaticFieldValueIterator {
1413 public:
Shinichiro Hamaji82863f02015-11-05 16:51:33 +09001414 EncodedStaticFieldValueIterator(const DexFile& dex_file,
1415 const DexFile::ClassDef& class_def);
1416
Ian Rogers6a3c1fc2014-10-31 00:33:20 -07001417 bool HasNext() const { return pos_ < array_size_; }
Ian Rogers0571d352011-11-03 19:51:38 -07001418
1419 void Next();
Elliott Hughesa21039c2012-06-21 12:09:25 -07001420
Ian Rogers0571d352011-11-03 19:51:38 -07001421 enum ValueType {
1422 kByte = 0x00,
1423 kShort = 0x02,
1424 kChar = 0x03,
1425 kInt = 0x04,
1426 kLong = 0x06,
1427 kFloat = 0x10,
1428 kDouble = 0x11,
1429 kString = 0x17,
1430 kType = 0x18,
1431 kField = 0x19,
1432 kMethod = 0x1a,
1433 kEnum = 0x1b,
1434 kArray = 0x1c,
1435 kAnnotation = 0x1d,
1436 kNull = 0x1e,
1437 kBoolean = 0x1f
1438 };
1439
Shinichiro Hamaji82863f02015-11-05 16:51:33 +09001440 ValueType GetValueType() const { return type_; }
1441 const jvalue& GetJavaValue() const { return jval_; }
1442
David Sehr9323e6e2016-09-13 08:58:35 -07001443 protected:
Ian Rogers13735952014-10-08 12:43:28 -07001444 static constexpr uint8_t kEncodedValueTypeMask = 0x1f; // 0b11111
1445 static constexpr uint8_t kEncodedValueArgShift = 5;
Ian Rogers0571d352011-11-03 19:51:38 -07001446
1447 const DexFile& dex_file_;
Ian Rogers2dd0e2c2013-01-24 12:42:14 -08001448 size_t array_size_; // Size of array.
1449 size_t pos_; // Current position.
Ian Rogers13735952014-10-08 12:43:28 -07001450 const uint8_t* ptr_; // Pointer into encoded data array.
Ian Rogers2dd0e2c2013-01-24 12:42:14 -08001451 ValueType type_; // Type of current encoded value.
1452 jvalue jval_; // Value of current encoded value.
David Sehr9323e6e2016-09-13 08:58:35 -07001453
1454 private:
Ian Rogers0571d352011-11-03 19:51:38 -07001455 DISALLOW_IMPLICIT_CONSTRUCTORS(EncodedStaticFieldValueIterator);
1456};
Brian Carlstrom88f36542012-10-16 23:24:21 -07001457std::ostream& operator<<(std::ostream& os, const EncodedStaticFieldValueIterator::ValueType& code);
Ian Rogers0571d352011-11-03 19:51:38 -07001458
1459class CatchHandlerIterator {
1460 public:
1461 CatchHandlerIterator(const DexFile::CodeItem& code_item, uint32_t address);
Logan Chien736df022012-04-27 16:25:57 +08001462
1463 CatchHandlerIterator(const DexFile::CodeItem& code_item,
1464 const DexFile::TryItem& try_item);
1465
Ian Rogers13735952014-10-08 12:43:28 -07001466 explicit CatchHandlerIterator(const uint8_t* handler_data) {
Ian Rogers0571d352011-11-03 19:51:38 -07001467 Init(handler_data);
1468 }
1469
Andreas Gampea5b09a62016-11-17 15:21:22 -08001470 dex::TypeIndex GetHandlerTypeIndex() const {
Ian Rogers0571d352011-11-03 19:51:38 -07001471 return handler_.type_idx_;
1472 }
1473 uint32_t GetHandlerAddress() const {
1474 return handler_.address_;
1475 }
1476 void Next();
1477 bool HasNext() const {
1478 return remaining_count_ != -1 || catch_all_;
1479 }
1480 // End of this set of catch blocks, convenience method to locate next set of catch blocks
Ian Rogers13735952014-10-08 12:43:28 -07001481 const uint8_t* EndDataPointer() const {
Ian Rogers0571d352011-11-03 19:51:38 -07001482 CHECK(!HasNext());
1483 return current_data_;
1484 }
Elliott Hughesa21039c2012-06-21 12:09:25 -07001485
Ian Rogers0571d352011-11-03 19:51:38 -07001486 private:
Logan Chien736df022012-04-27 16:25:57 +08001487 void Init(const DexFile::CodeItem& code_item, int32_t offset);
Ian Rogers13735952014-10-08 12:43:28 -07001488 void Init(const uint8_t* handler_data);
Ian Rogers0571d352011-11-03 19:51:38 -07001489
1490 struct CatchHandlerItem {
Andreas Gampea5b09a62016-11-17 15:21:22 -08001491 dex::TypeIndex type_idx_; // type index of the caught exception type
Ian Rogers0571d352011-11-03 19:51:38 -07001492 uint32_t address_; // handler address
1493 } handler_;
Ian Rogers13735952014-10-08 12:43:28 -07001494 const uint8_t* current_data_; // the current handler in dex file.
Ian Rogers0571d352011-11-03 19:51:38 -07001495 int32_t remaining_count_; // number of handlers not read.
1496 bool catch_all_; // is there a handler that will catch all exceptions in case
1497 // that all typed handler does not match.
1498};
1499
Carl Shapiro1fb86202011-06-27 17:43:13 -07001500} // namespace art
1501
Brian Carlstromfc0e3212013-07-17 14:40:12 -07001502#endif // ART_RUNTIME_DEX_FILE_H_