blob: 0ae36f78b52afd492bcd4d44e5d0c1b672bae7e2 [file] [log] [blame]
Elliott Hughes2faa5f12012-01-30 14:42:07 -08001/*
2 * Copyright (C) 2011 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
Carl Shapiro1fb86202011-06-27 17:43:13 -070016
Brian Carlstromfc0e3212013-07-17 14:40:12 -070017#ifndef ART_RUNTIME_DEX_FILE_H_
18#define ART_RUNTIME_DEX_FILE_H_
Carl Shapiro1fb86202011-06-27 17:43:13 -070019
Ian Rogers700a4022014-05-19 16:49:03 -070020#include <memory>
Elliott Hughes0c424cb2011-08-26 10:16:25 -070021#include <string>
Brian Carlstrom74eb46a2011-08-02 20:10:14 -070022#include <vector>
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070023
Elliott Hughes07ed66b2012-12-12 18:34:25 -080024#include "base/logging.h"
Ian Rogersb0fa5dc2014-04-28 16:47:08 -070025#include "base/mutex.h" // For Locks::mutator_lock_.
Ian Rogers03b6eaf2014-10-28 09:34:57 -070026#include "base/value_object.h"
Brian Carlstrom578bbdc2011-07-21 14:07:47 -070027#include "globals.h"
Ian Rogers08f753d2012-08-24 14:35:25 -070028#include "invoke_type.h"
Jesse Wilson6bf19152011-09-29 13:12:33 -040029#include "jni.h"
Ian Rogers08f753d2012-08-24 14:35:25 -070030#include "modifiers.h"
Ian Rogers68b56852014-08-29 20:19:11 -070031#include "utf.h"
Carl Shapiro1fb86202011-06-27 17:43:13 -070032
33namespace art {
34
Ian Rogers576ca0c2014-06-06 15:58:22 -070035class MemMap;
Richard Uhler07b3c232015-03-31 15:57:54 -070036class OatDexFile;
Ian Rogersd91d6d62013-09-25 20:26:14 -070037class Signature;
Ian Rogersfc0e94b2013-09-23 23:51:32 -070038class StringPiece;
Artem Udovichenkod9786b02015-10-14 16:36:55 +030039class TypeLookupTable;
Brian Carlstroma6cc8932012-01-04 14:44:07 -080040class ZipArchive;
41
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070042// TODO: move all of the macro functionality into the DexCache class.
Brian Carlstromf615a612011-07-23 12:50:34 -070043class DexFile {
Carl Shapiro1fb86202011-06-27 17:43:13 -070044 public:
Roland Levillain621b5ea2016-05-18 11:41:33 +010045 // First Dex format version supporting default methods.
Alex Lightb55f1ac2016-04-12 15:50:55 -070046 static const uint32_t kDefaultMethodsVersion = 37;
Roland Levillain621b5ea2016-05-18 11:41:33 +010047 // First Dex format version enforcing class definition ordering rules.
48 static const uint32_t kClassDefinitionOrderEnforcedVersion = 37;
49
Ian Rogers13735952014-10-08 12:43:28 -070050 static const uint8_t kDexMagic[];
Narayan Kamath52e66502016-08-01 14:20:31 +010051 static constexpr size_t kNumDexVersions = 3;
Alex Lightc4961812016-03-23 10:20:41 -070052 static constexpr size_t kDexVersionLen = 4;
53 static const uint8_t kDexMagicVersions[kNumDexVersions][kDexVersionLen];
54
Ian Rogers13735952014-10-08 12:43:28 -070055 static constexpr size_t kSha1DigestSize = 20;
56 static constexpr uint32_t kDexEndianConstant = 0x12345678;
Carl Shapiro80d4dde2011-06-28 16:24:07 -070057
Brian Carlstromb7bbba42011-10-13 14:58:47 -070058 // name of the DexFile entry within a zip archive
59 static const char* kClassesDex;
60
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070061 // The value of an invalid index.
62 static const uint32_t kDexNoIndex = 0xFFFFFFFF;
63
Ian Rogers0571d352011-11-03 19:51:38 -070064 // The value of an invalid index.
65 static const uint16_t kDexNoIndex16 = 0xFFFF;
Carl Shapiro1fb86202011-06-27 17:43:13 -070066
Alex Lightc4961812016-03-23 10:20:41 -070067 // The separator character in MultiDex locations.
Andreas Gampe833a4852014-05-21 18:46:59 -070068 static constexpr char kMultiDexSeparator = ':';
69
70 // A string version of the previous. This is a define so that we can merge string literals in the
71 // preprocessor.
72 #define kMultiDexSeparatorString ":"
73
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070074 // Raw header_item.
75 struct Header {
76 uint8_t magic_[8];
Brian Carlstrom7934ac22013-07-26 10:54:15 -070077 uint32_t checksum_; // See also location_checksum_
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070078 uint8_t signature_[kSha1DigestSize];
jeffhaof6174e82012-01-31 16:14:17 -080079 uint32_t file_size_; // size of entire file
Brian Carlstrom7e49dca2011-07-22 18:07:34 -070080 uint32_t header_size_; // offset to start of next section
81 uint32_t endian_tag_;
Ian Rogers0571d352011-11-03 19:51:38 -070082 uint32_t link_size_; // unused
83 uint32_t link_off_; // unused
84 uint32_t map_off_; // unused
85 uint32_t string_ids_size_; // number of StringIds
86 uint32_t string_ids_off_; // file offset of StringIds array
87 uint32_t type_ids_size_; // number of TypeIds, we don't support more than 65535
88 uint32_t type_ids_off_; // file offset of TypeIds array
89 uint32_t proto_ids_size_; // number of ProtoIds, we don't support more than 65535
90 uint32_t proto_ids_off_; // file offset of ProtoIds array
91 uint32_t field_ids_size_; // number of FieldIds
92 uint32_t field_ids_off_; // file offset of FieldIds array
93 uint32_t method_ids_size_; // number of MethodIds
94 uint32_t method_ids_off_; // file offset of MethodIds array
95 uint32_t class_defs_size_; // number of ClassDefs
96 uint32_t class_defs_off_; // file offset of ClassDef array
97 uint32_t data_size_; // unused
98 uint32_t data_off_; // unused
Elliott Hughesa21039c2012-06-21 12:09:25 -070099
Andreas Gampe76ed99d2016-03-28 18:31:29 -0700100 // Decode the dex magic version
101 uint32_t GetVersion() const;
102
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700103 private:
104 DISALLOW_COPY_AND_ASSIGN(Header);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700105 };
Carl Shapiro1fb86202011-06-27 17:43:13 -0700106
// Type codes stored in MapItem::type_.
enum {
  // Fixed-size id/def sections.
  kDexTypeHeaderItem               = 0x0000,
  kDexTypeStringIdItem             = 0x0001,
  kDexTypeTypeIdItem               = 0x0002,
  kDexTypeProtoIdItem              = 0x0003,
  kDexTypeFieldIdItem              = 0x0004,
  kDexTypeMethodIdItem             = 0x0005,
  kDexTypeClassDefItem             = 0x0006,
  // List items.
  kDexTypeMapList                  = 0x1000,
  kDexTypeTypeList                 = 0x1001,
  kDexTypeAnnotationSetRefList     = 0x1002,
  kDexTypeAnnotationSetItem        = 0x1003,
  // Data items.
  kDexTypeClassDataItem            = 0x2000,
  kDexTypeCodeItem                 = 0x2001,
  kDexTypeStringDataItem           = 0x2002,
  kDexTypeDebugInfoItem            = 0x2003,
  kDexTypeAnnotationItem           = 0x2004,
  kDexTypeEncodedArrayItem         = 0x2005,
  kDexTypeAnnotationsDirectoryItem = 0x2006,
};
128
129 struct MapItem {
130 uint16_t type_;
131 uint16_t unused_;
132 uint32_t size_;
133 uint32_t offset_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700134
jeffhao10037c82012-01-23 15:06:23 -0800135 private:
136 DISALLOW_COPY_AND_ASSIGN(MapItem);
137 };
138
139 struct MapList {
140 uint32_t size_;
141 MapItem list_[1];
Elliott Hughesa21039c2012-06-21 12:09:25 -0700142
jeffhao10037c82012-01-23 15:06:23 -0800143 private:
144 DISALLOW_COPY_AND_ASSIGN(MapList);
145 };
146
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700147 // Raw string_id_item.
148 struct StringId {
149 uint32_t string_data_off_; // offset in bytes from the base address
Elliott Hughesa21039c2012-06-21 12:09:25 -0700150
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700151 private:
152 DISALLOW_COPY_AND_ASSIGN(StringId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700153 };
154
155 // Raw type_id_item.
156 struct TypeId {
157 uint32_t descriptor_idx_; // index into string_ids
Elliott Hughesa21039c2012-06-21 12:09:25 -0700158
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700159 private:
160 DISALLOW_COPY_AND_ASSIGN(TypeId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700161 };
162
163 // Raw field_id_item.
164 struct FieldId {
Ian Rogers0571d352011-11-03 19:51:38 -0700165 uint16_t class_idx_; // index into type_ids_ array for defining class
166 uint16_t type_idx_; // index into type_ids_ array for field type
167 uint32_t name_idx_; // index into string_ids_ array for field name
Elliott Hughesa21039c2012-06-21 12:09:25 -0700168
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700169 private:
170 DISALLOW_COPY_AND_ASSIGN(FieldId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700171 };
172
173 // Raw method_id_item.
174 struct MethodId {
Ian Rogers0571d352011-11-03 19:51:38 -0700175 uint16_t class_idx_; // index into type_ids_ array for defining class
176 uint16_t proto_idx_; // index into proto_ids_ array for method prototype
177 uint32_t name_idx_; // index into string_ids_ array for method name
Elliott Hughesa21039c2012-06-21 12:09:25 -0700178
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700179 private:
180 DISALLOW_COPY_AND_ASSIGN(MethodId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700181 };
182
183 // Raw proto_id_item.
184 struct ProtoId {
Ian Rogers0571d352011-11-03 19:51:38 -0700185 uint32_t shorty_idx_; // index into string_ids array for shorty descriptor
186 uint16_t return_type_idx_; // index into type_ids array for return type
187 uint16_t pad_; // padding = 0
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700188 uint32_t parameters_off_; // file offset to type_list for parameter types
Elliott Hughesa21039c2012-06-21 12:09:25 -0700189
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700190 private:
191 DISALLOW_COPY_AND_ASSIGN(ProtoId);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700192 };
193
194 // Raw class_def_item.
195 struct ClassDef {
Ian Rogers0571d352011-11-03 19:51:38 -0700196 uint16_t class_idx_; // index into type_ids_ array for this class
197 uint16_t pad1_; // padding = 0
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700198 uint32_t access_flags_;
Ian Rogers0571d352011-11-03 19:51:38 -0700199 uint16_t superclass_idx_; // index into type_ids_ array for superclass
200 uint16_t pad2_; // padding = 0
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700201 uint32_t interfaces_off_; // file offset to TypeList
Brian Carlstrom4a96b602011-07-26 16:40:23 -0700202 uint32_t source_file_idx_; // index into string_ids_ for source file name
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700203 uint32_t annotations_off_; // file offset to annotations_directory_item
204 uint32_t class_data_off_; // file offset to class_data_item
205 uint32_t static_values_off_; // file offset to EncodedArray
Elliott Hughesa21039c2012-06-21 12:09:25 -0700206
Andreas Gampe51829322014-08-25 15:05:04 -0700207 // Returns the valid access flags, that is, Java modifier bits relevant to the ClassDef type
208 // (class or interface). These are all in the lower 16b and do not contain runtime flags.
209 uint32_t GetJavaAccessFlags() const {
210 // Make sure that none of our runtime-only flags are set.
Andreas Gampe575e78c2014-11-03 23:41:03 -0800211 static_assert((kAccValidClassFlags & kAccJavaFlagsMask) == kAccValidClassFlags,
212 "Valid class flags not a subset of Java flags");
213 static_assert((kAccValidInterfaceFlags & kAccJavaFlagsMask) == kAccValidInterfaceFlags,
214 "Valid interface flags not a subset of Java flags");
Andreas Gampe51829322014-08-25 15:05:04 -0700215
216 if ((access_flags_ & kAccInterface) != 0) {
217 // Interface.
218 return access_flags_ & kAccValidInterfaceFlags;
219 } else {
220 // Class.
221 return access_flags_ & kAccValidClassFlags;
222 }
223 }
224
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700225 private:
226 DISALLOW_COPY_AND_ASSIGN(ClassDef);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700227 };
228
229 // Raw type_item.
230 struct TypeItem {
231 uint16_t type_idx_; // index into type_ids section
Elliott Hughesa21039c2012-06-21 12:09:25 -0700232
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700233 private:
234 DISALLOW_COPY_AND_ASSIGN(TypeItem);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700235 };
236
237 // Raw type_list.
238 class TypeList {
239 public:
240 uint32_t Size() const {
241 return size_;
242 }
243
244 const TypeItem& GetTypeItem(uint32_t idx) const {
Sebastien Hertzb24bd992013-08-02 15:19:09 +0200245 DCHECK_LT(idx, this->size_);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700246 return this->list_[idx];
247 }
248
Andreas Gampe31a7a0c2014-08-29 16:07:49 -0700249 // Size in bytes of the part of the list that is common.
250 static constexpr size_t GetHeaderSize() {
251 return 4U;
252 }
253
254 // Size in bytes of the whole type list including all the stored elements.
255 static constexpr size_t GetListSize(size_t count) {
256 return GetHeaderSize() + sizeof(TypeItem) * count;
257 }
258
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700259 private:
260 uint32_t size_; // size of the list, in entries
261 TypeItem list_[1]; // elements of the list
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700262 DISALLOW_COPY_AND_ASSIGN(TypeList);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700263 };
264
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700265 // Raw code_item.
266 struct CodeItem {
Igor Murashkinc449e8b2015-06-10 15:56:42 -0700267 uint16_t registers_size_; // the number of registers used by this code
268 // (locals + parameters)
269 uint16_t ins_size_; // the number of words of incoming arguments to the method
270 // that this code is for
271 uint16_t outs_size_; // the number of words of outgoing argument space required
272 // by this code for method invocation
273 uint16_t tries_size_; // the number of try_items for this instance. If non-zero,
274 // then these appear as the tries array just after the
275 // insns in this instance.
276 uint32_t debug_info_off_; // file offset to debug info stream
Ian Rogersd81871c2011-10-03 13:57:23 -0700277 uint32_t insns_size_in_code_units_; // size of the insns array, in 2 byte code units
Igor Murashkinc449e8b2015-06-10 15:56:42 -0700278 uint16_t insns_[1]; // actual array of bytecode.
Elliott Hughesa21039c2012-06-21 12:09:25 -0700279
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700280 private:
281 DISALLOW_COPY_AND_ASSIGN(CodeItem);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700282 };
283
Carl Shapiro2eaa9682011-08-04 19:26:11 -0700284 // Raw try_item.
285 struct TryItem {
286 uint32_t start_addr_;
287 uint16_t insn_count_;
288 uint16_t handler_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700289
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700290 private:
291 DISALLOW_COPY_AND_ASSIGN(TryItem);
Carl Shapiro2eaa9682011-08-04 19:26:11 -0700292 };
293
// Annotation constants.
enum {
  // Annotation visibility.
  kDexVisibilityBuild         = 0x00,
  kDexVisibilityRuntime       = 0x01,
  kDexVisibilitySystem        = 0x02,

  // Annotation value type codes.
  kDexAnnotationByte          = 0x00,
  kDexAnnotationShort         = 0x02,
  kDexAnnotationChar          = 0x03,
  kDexAnnotationInt           = 0x04,
  kDexAnnotationLong          = 0x06,
  kDexAnnotationFloat         = 0x10,
  kDexAnnotationDouble        = 0x11,
  kDexAnnotationString        = 0x17,
  kDexAnnotationType          = 0x18,
  kDexAnnotationField         = 0x19,
  kDexAnnotationMethod        = 0x1a,
  kDexAnnotationEnum          = 0x1b,
  kDexAnnotationArray         = 0x1c,
  kDexAnnotationAnnotation    = 0x1d,
  kDexAnnotationNull          = 0x1e,
  kDexAnnotationBoolean       = 0x1f,

  // The value type lives in the low 5 bits; the value argument starts above them.
  kDexAnnotationValueTypeMask = 0x1f,
  kDexAnnotationValueArgShift = 5,
};
320
321 struct AnnotationsDirectoryItem {
322 uint32_t class_annotations_off_;
323 uint32_t fields_size_;
324 uint32_t methods_size_;
325 uint32_t parameters_size_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700326
jeffhao10037c82012-01-23 15:06:23 -0800327 private:
328 DISALLOW_COPY_AND_ASSIGN(AnnotationsDirectoryItem);
329 };
330
331 struct FieldAnnotationsItem {
332 uint32_t field_idx_;
333 uint32_t annotations_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700334
jeffhao10037c82012-01-23 15:06:23 -0800335 private:
336 DISALLOW_COPY_AND_ASSIGN(FieldAnnotationsItem);
337 };
338
339 struct MethodAnnotationsItem {
340 uint32_t method_idx_;
341 uint32_t annotations_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700342
jeffhao10037c82012-01-23 15:06:23 -0800343 private:
344 DISALLOW_COPY_AND_ASSIGN(MethodAnnotationsItem);
345 };
346
347 struct ParameterAnnotationsItem {
348 uint32_t method_idx_;
349 uint32_t annotations_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700350
jeffhao10037c82012-01-23 15:06:23 -0800351 private:
352 DISALLOW_COPY_AND_ASSIGN(ParameterAnnotationsItem);
353 };
354
355 struct AnnotationSetRefItem {
356 uint32_t annotations_off_;
Elliott Hughesa21039c2012-06-21 12:09:25 -0700357
jeffhao10037c82012-01-23 15:06:23 -0800358 private:
359 DISALLOW_COPY_AND_ASSIGN(AnnotationSetRefItem);
360 };
361
362 struct AnnotationSetRefList {
363 uint32_t size_;
364 AnnotationSetRefItem list_[1];
Elliott Hughesa21039c2012-06-21 12:09:25 -0700365
jeffhao10037c82012-01-23 15:06:23 -0800366 private:
367 DISALLOW_COPY_AND_ASSIGN(AnnotationSetRefList);
368 };
369
370 struct AnnotationSetItem {
371 uint32_t size_;
372 uint32_t entries_[1];
Elliott Hughesa21039c2012-06-21 12:09:25 -0700373
jeffhao10037c82012-01-23 15:06:23 -0800374 private:
375 DISALLOW_COPY_AND_ASSIGN(AnnotationSetItem);
376 };
377
378 struct AnnotationItem {
379 uint8_t visibility_;
380 uint8_t annotation_[1];
Elliott Hughesa21039c2012-06-21 12:09:25 -0700381
jeffhao10037c82012-01-23 15:06:23 -0800382 private:
383 DISALLOW_COPY_AND_ASSIGN(AnnotationItem);
384 };
385
// Annotation result styles. Marked "private" by the original author even though it is declared
// in the public section.
enum AnnotationResultStyle {
  kAllObjects,
  kPrimitivesOrObjects,
  kAllRaw
};
391
David Sehr9323e6e2016-09-13 08:58:35 -0700392 struct AnnotationValue;
393
Brian Carlstrom5b332c82012-02-01 15:02:31 -0800394 // Returns the checksum of a file for comparison with GetLocationChecksum().
395 // For .dex files, this is the header checksum.
396 // For zip files, this is the classes.dex zip entry CRC32 checksum.
397 // Return true if the checksum could be found, false otherwise.
Ian Rogers8d31bbd2013-10-13 10:44:14 -0700398 static bool GetChecksum(const char* filename, uint32_t* checksum, std::string* error_msg);
Brian Carlstrom78128a62011-09-15 17:21:19 -0700399
Andreas Gampe833a4852014-05-21 18:46:59 -0700400 // Opens .dex files found in the container, guessing the container format based on file extension.
Aart Bik37d6a3b2016-06-21 18:30:10 -0700401 static bool Open(const char* filename,
402 const char* location,
403 bool verify_checksum,
404 std::string* error_msg,
Richard Uhlerfbef44d2014-12-23 09:48:51 -0800405 std::vector<std::unique_ptr<const DexFile>>* dex_files);
jeffhao262bf462011-10-20 18:36:32 -0700406
Brian Carlstrom89521892011-12-07 22:05:07 -0800407 // Opens .dex file, backed by existing memory
Richard Uhlerfbef44d2014-12-23 09:48:51 -0800408 static std::unique_ptr<const DexFile> Open(const uint8_t* base, size_t size,
409 const std::string& location,
410 uint32_t location_checksum,
Richard Uhler07b3c232015-03-31 15:57:54 -0700411 const OatDexFile* oat_dex_file,
Andreas Gampe3a2bd292016-01-26 17:23:47 -0800412 bool verify,
Aart Bik37d6a3b2016-06-21 18:30:10 -0700413 bool verify_checksum,
Andreas Gampe3a2bd292016-01-26 17:23:47 -0800414 std::string* error_msg);
Brian Carlstrom89521892011-12-07 22:05:07 -0800415
Orion Hodsona4c2a052016-08-17 10:51:42 +0100416 // Opens .dex file that has been memory-mapped by the caller.
417 static std::unique_ptr<const DexFile> Open(const std::string& location,
418 uint32_t location_checkum,
419 std::unique_ptr<MemMap> mem_map,
420 bool verify,
421 bool verify_checksum,
422 std::string* error_msg);
423
424 // Checks whether the given file has the dex magic, or is a zip file with a classes.dex entry.
425 // If this function returns false, Open will not succeed. The inverse is not true, however.
426 static bool MaybeDex(const char* filename);
427
Andreas Gampe833a4852014-05-21 18:46:59 -0700428 // Open all classesXXX.dex files from a zip archive.
Aart Bik37d6a3b2016-06-21 18:30:10 -0700429 static bool OpenFromZip(const ZipArchive& zip_archive,
430 const std::string& location,
431 bool verify_checksum,
Richard Uhlerfbef44d2014-12-23 09:48:51 -0800432 std::string* error_msg,
433 std::vector<std::unique_ptr<const DexFile>>* dex_files);
Brian Carlstroma6cc8932012-01-04 14:44:07 -0800434
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700435 // Closes a .dex file.
Brian Carlstromf615a612011-07-23 12:50:34 -0700436 virtual ~DexFile();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700437
Brian Carlstroma663ea52011-08-19 23:33:41 -0700438 const std::string& GetLocation() const {
439 return location_;
440 }
441
Andreas Gampecb8f9e82014-07-24 15:35:50 -0700442 // For normal dex files, location and base location coincide. If a dex file is part of a multidex
443 // archive, the base location is the name of the originating jar/apk, stripped of any internal
444 // classes*.dex path.
Vladimir Markoaa4497d2014-09-05 14:01:17 +0100445 static std::string GetBaseLocation(const char* location) {
446 const char* pos = strrchr(location, kMultiDexSeparator);
447 if (pos == nullptr) {
448 return location;
Andreas Gampecb8f9e82014-07-24 15:35:50 -0700449 } else {
Vladimir Markoaa4497d2014-09-05 14:01:17 +0100450 return std::string(location, pos - location);
451 }
452 }
453
// std::string convenience overload; defers to the C-string version.
static std::string GetBaseLocation(const std::string& location) {
  const char* const raw_location = location.c_str();
  return GetBaseLocation(raw_location);
}
457
458 // Returns the ':classes*.dex' part of the dex location. Returns an empty
459 // string if there is no multidex suffix for the given location.
460 // The kMultiDexSeparator is included in the returned suffix.
461 static std::string GetMultiDexSuffix(const std::string& location) {
462 size_t pos = location.rfind(kMultiDexSeparator);
Vladimir Markoaa4497d2014-09-05 14:01:17 +0100463 if (pos == std::string::npos) {
Richard Uhlere5fed032015-03-18 08:21:11 -0700464 return "";
Vladimir Markoaa4497d2014-09-05 14:01:17 +0100465 } else {
Richard Uhlere5fed032015-03-18 08:21:11 -0700466 return location.substr(pos);
Andreas Gampecb8f9e82014-07-24 15:35:50 -0700467 }
468 }
469
Richard Uhlere5fed032015-03-18 08:21:11 -0700470 std::string GetBaseLocation() const {
471 return GetBaseLocation(location_);
472 }
473
Brian Carlstrom5b332c82012-02-01 15:02:31 -0800474 // For DexFiles directly from .dex files, this is the checksum from the DexFile::Header.
475 // For DexFiles opened from a zip files, this will be the ZipEntry CRC32 of classes.dex.
476 uint32_t GetLocationChecksum() const {
477 return location_checksum_;
478 }
479
Brian Carlstroma663ea52011-08-19 23:33:41 -0700480 const Header& GetHeader() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700481 DCHECK(header_ != nullptr) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700482 return *header_;
Carl Shapiro1fb86202011-06-27 17:43:13 -0700483 }
484
Ian Rogers0571d352011-11-03 19:51:38 -0700485 // Decode the dex magic version
Andreas Gampe76ed99d2016-03-28 18:31:29 -0700486 uint32_t GetVersion() const {
487 return GetHeader().GetVersion();
488 }
Ian Rogersd81871c2011-10-03 13:57:23 -0700489
// Returns true if |magic| points to the dex magic value.
static bool IsMagicValid(const uint8_t* magic);

// Returns true if the bytes following the magic hold a valid version value.
static bool IsVersionValid(const uint8_t* magic);
Brian Carlstrom6e3b1d92012-01-11 01:36:32 -0800495
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700496 // Returns the number of string identifiers in the .dex file.
497 size_t NumStringIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700498 DCHECK(header_ != nullptr) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700499 return header_->string_ids_size_;
Carl Shapiro0e5d75d2011-07-06 18:28:37 -0700500 }
501
Ian Rogers0571d352011-11-03 19:51:38 -0700502 // Returns the StringId at the specified index.
503 const StringId& GetStringId(uint32_t idx) const {
Ian Rogers4f6ad8a2013-03-18 15:27:28 -0700504 DCHECK_LT(idx, NumStringIds()) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700505 return string_ids_[idx];
506 }
507
508 uint32_t GetIndexForStringId(const StringId& string_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800509 CHECK_GE(&string_id, string_ids_) << GetLocation();
510 CHECK_LT(&string_id, string_ids_ + header_->string_ids_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700511 return &string_id - string_ids_;
512 }
513
514 int32_t GetStringLength(const StringId& string_id) const;
515
Ian Rogersdfb325e2013-10-30 01:00:44 -0700516 // Returns a pointer to the UTF-8 string data referred to by the given string_id as well as the
517 // length of the string when decoded as a UTF-16 string. Note the UTF-16 length is not the same
518 // as the string length of the string data.
519 const char* GetStringDataAndUtf16Length(const StringId& string_id, uint32_t* utf16_length) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700520
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100521 const char* GetStringData(const StringId& string_id) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700522
Ian Rogersdfb325e2013-10-30 01:00:44 -0700523 // Index version of GetStringDataAndUtf16Length.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100524 const char* StringDataAndUtf16LengthByIdx(uint32_t idx, uint32_t* utf16_length) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700525
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100526 const char* StringDataByIdx(uint32_t idx) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700527
Ian Rogers637c65b2013-05-31 11:46:00 -0700528 // Looks up a string id for a given modified utf8 string.
529 const StringId* FindStringId(const char* string) const;
530
Artem Udovichenkod9786b02015-10-14 16:36:55 +0300531 const TypeId* FindTypeId(const char* string) const;
532
Ian Rogers637c65b2013-05-31 11:46:00 -0700533 // Looks up a string id for a given utf16 string.
Vladimir Markoa48aef42014-12-03 17:53:53 +0000534 const StringId* FindStringId(const uint16_t* string, size_t length) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700535
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700536 // Returns the number of type identifiers in the .dex file.
Ian Rogers68b56852014-08-29 20:19:11 -0700537 uint32_t NumTypeIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700538 DCHECK(header_ != nullptr) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700539 return header_->type_ids_size_;
Carl Shapiro5fafe2b2011-07-09 15:34:41 -0700540 }
541
Ian Rogers0571d352011-11-03 19:51:38 -0700542 // Returns the TypeId at the specified index.
543 const TypeId& GetTypeId(uint32_t idx) const {
Ian Rogers4f6ad8a2013-03-18 15:27:28 -0700544 DCHECK_LT(idx, NumTypeIds()) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700545 return type_ids_[idx];
Carl Shapiro5fafe2b2011-07-09 15:34:41 -0700546 }
547
Ian Rogers0571d352011-11-03 19:51:38 -0700548 uint16_t GetIndexForTypeId(const TypeId& type_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800549 CHECK_GE(&type_id, type_ids_) << GetLocation();
550 CHECK_LT(&type_id, type_ids_ + header_->type_ids_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700551 size_t result = &type_id - type_ids_;
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800552 DCHECK_LT(result, 65536U) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700553 return static_cast<uint16_t>(result);
554 }
555
556 // Get the descriptor string associated with a given type index.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100557 const char* StringByTypeIdx(uint32_t idx, uint32_t* unicode_length) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700558
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100559 const char* StringByTypeIdx(uint32_t idx) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700560
561 // Returns the type descriptor string of a type id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100562 const char* GetTypeDescriptor(const TypeId& type_id) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700563
564 // Looks up a type for the given string index
565 const TypeId* FindTypeId(uint32_t string_idx) const;
566
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700567 // Returns the number of field identifiers in the .dex file.
568 size_t NumFieldIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700569 DCHECK(header_ != nullptr) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700570 return header_->field_ids_size_;
Carl Shapiro0e5d75d2011-07-06 18:28:37 -0700571 }
572
Ian Rogers0571d352011-11-03 19:51:38 -0700573 // Returns the FieldId at the specified index.
574 const FieldId& GetFieldId(uint32_t idx) const {
Sebastien Hertzb24bd992013-08-02 15:19:09 +0200575 DCHECK_LT(idx, NumFieldIds()) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700576 return field_ids_[idx];
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700577 }
578
Ian Rogers9b1a4f42011-11-14 18:35:10 -0800579 uint32_t GetIndexForFieldId(const FieldId& field_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800580 CHECK_GE(&field_id, field_ids_) << GetLocation();
581 CHECK_LT(&field_id, field_ids_ + header_->field_ids_size_) << GetLocation();
Ian Rogers9b1a4f42011-11-14 18:35:10 -0800582 return &field_id - field_ids_;
583 }
584
585 // Looks up a field by its declaring class, name and type
586 const FieldId* FindFieldId(const DexFile::TypeId& declaring_klass,
587 const DexFile::StringId& name,
588 const DexFile::TypeId& type) const;
589
Brian Carlstrom6b4ef022011-10-23 14:59:04 -0700590 // Returns the declaring class descriptor string of a field id.
591 const char* GetFieldDeclaringClassDescriptor(const FieldId& field_id) const {
Brian Carlstromb9edb842011-08-28 16:31:06 -0700592 const DexFile::TypeId& type_id = GetTypeId(field_id.class_idx_);
593 return GetTypeDescriptor(type_id);
594 }
595
Brian Carlstrom6b4ef022011-10-23 14:59:04 -0700596 // Returns the class descriptor string of a field id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100597 const char* GetFieldTypeDescriptor(const FieldId& field_id) const;
Brian Carlstrom6b4ef022011-10-23 14:59:04 -0700598
Brian Carlstromb9edb842011-08-28 16:31:06 -0700599 // Returns the name of a field id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100600 const char* GetFieldName(const FieldId& field_id) const;
Brian Carlstromb9edb842011-08-28 16:31:06 -0700601
Ian Rogers0571d352011-11-03 19:51:38 -0700602 // Returns the number of method identifiers in the .dex file.
603 size_t NumMethodIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700604 DCHECK(header_ != nullptr) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700605 return header_->method_ids_size_;
606 }
607
608 // Returns the MethodId at the specified index.
609 const MethodId& GetMethodId(uint32_t idx) const {
Ian Rogers4f6ad8a2013-03-18 15:27:28 -0700610 DCHECK_LT(idx, NumMethodIds()) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700611 return method_ids_[idx];
612 }
613
614 uint32_t GetIndexForMethodId(const MethodId& method_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800615 CHECK_GE(&method_id, method_ids_) << GetLocation();
616 CHECK_LT(&method_id, method_ids_ + header_->method_ids_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700617 return &method_id - method_ids_;
618 }
619
Ian Rogers9b1a4f42011-11-14 18:35:10 -0800620 // Looks up a method by its declaring class, name and proto_id
621 const MethodId* FindMethodId(const DexFile::TypeId& declaring_klass,
622 const DexFile::StringId& name,
Ian Rogers0571d352011-11-03 19:51:38 -0700623 const DexFile::ProtoId& signature) const;
624
Brian Carlstrom6b4ef022011-10-23 14:59:04 -0700625 // Returns the declaring class descriptor string of a method id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100626 const char* GetMethodDeclaringClassDescriptor(const MethodId& method_id) const;
Brian Carlstrom7540ff42011-09-04 16:38:46 -0700627
jeffhao98eacac2011-09-14 16:11:53 -0700628 // Returns the prototype of a method id.
Brian Carlstromaded5f72011-10-07 17:15:04 -0700629 const ProtoId& GetMethodPrototype(const MethodId& method_id) const {
630 return GetProtoId(method_id.proto_idx_);
631 }
632
Ian Rogersd91d6d62013-09-25 20:26:14 -0700633 // Returns a representation of the signature of a method id.
634 const Signature GetMethodSignature(const MethodId& method_id) const;
jeffhao98eacac2011-09-14 16:11:53 -0700635
Brian Carlstrom7540ff42011-09-04 16:38:46 -0700636 // Returns the name of a method id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100637 const char* GetMethodName(const MethodId& method_id) const;
Brian Carlstrom7540ff42011-09-04 16:38:46 -0700638
Calin Juravle68ad6492015-08-18 17:08:12 +0100639 // Returns the shorty of a method by its index.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100640 const char* GetMethodShorty(uint32_t idx) const;
Calin Juravle68ad6492015-08-18 17:08:12 +0100641
Ian Rogers0571d352011-11-03 19:51:38 -0700642 // Returns the shorty of a method id.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100643 const char* GetMethodShorty(const MethodId& method_id) const;
644 const char* GetMethodShorty(const MethodId& method_id, uint32_t* length) const;
645
Ian Rogers0571d352011-11-03 19:51:38 -0700646 // Returns the number of class definitions in the .dex file.
Ian Rogers68b56852014-08-29 20:19:11 -0700647 uint32_t NumClassDefs() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700648 DCHECK(header_ != nullptr) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700649 return header_->class_defs_size_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700650 }
651
652 // Returns the ClassDef at the specified index.
Ian Rogers8b2c0b92013-09-19 02:56:49 -0700653 const ClassDef& GetClassDef(uint16_t idx) const {
Sebastien Hertzb24bd992013-08-02 15:19:09 +0200654 DCHECK_LT(idx, NumClassDefs()) << GetLocation();
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700655 return class_defs_[idx];
656 }
657
Ian Rogers8b2c0b92013-09-19 02:56:49 -0700658 uint16_t GetIndexForClassDef(const ClassDef& class_def) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800659 CHECK_GE(&class_def, class_defs_) << GetLocation();
660 CHECK_LT(&class_def, class_defs_ + header_->class_defs_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700661 return &class_def - class_defs_;
662 }
663
664 // Returns the class descriptor string of a class definition.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100665 const char* GetClassDescriptor(const ClassDef& class_def) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700666
Mathieu Chartiere7c9a8c2014-11-06 16:35:45 -0800667 // Looks up a class definition by its class descriptor. Hash must be
668 // ComputeModifiedUtf8Hash(descriptor).
669 const ClassDef* FindClassDef(const char* descriptor, size_t hash) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700670
Ian Rogers8b2c0b92013-09-19 02:56:49 -0700671 // Looks up a class definition by its type index.
672 const ClassDef* FindClassDef(uint16_t type_idx) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700673
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700674 const TypeList* GetInterfacesList(const ClassDef& class_def) const {
675 if (class_def.interfaces_off_ == 0) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700676 return nullptr;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700677 } else {
Ian Rogers13735952014-10-08 12:43:28 -0700678 const uint8_t* addr = begin_ + class_def.interfaces_off_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700679 return reinterpret_cast<const TypeList*>(addr);
680 }
681 }
682
Ian Rogers0571d352011-11-03 19:51:38 -0700683 // Returns a pointer to the raw memory mapped class_data_item
Ian Rogers13735952014-10-08 12:43:28 -0700684 const uint8_t* GetClassData(const ClassDef& class_def) const {
Ian Rogers0571d352011-11-03 19:51:38 -0700685 if (class_def.class_data_off_ == 0) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700686 return nullptr;
Ian Rogers0571d352011-11-03 19:51:38 -0700687 } else {
Ian Rogers30fab402012-01-23 15:43:46 -0800688 return begin_ + class_def.class_data_off_;
Ian Rogers0571d352011-11-03 19:51:38 -0700689 }
Shih-wei Liao2fb97532011-08-11 16:17:23 -0700690 }
691
Ian Rogers0571d352011-11-03 19:51:38 -0700692 //
Ian Rogers6d4d9fc2011-11-30 16:24:48 -0800693 const CodeItem* GetCodeItem(const uint32_t code_off) const {
Alex Light9139e002015-10-09 15:59:48 -0700694 DCHECK_LT(code_off, size_) << "Code item offset larger then maximum allowed offset";
Ian Rogers6d4d9fc2011-11-30 16:24:48 -0800695 if (code_off == 0) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700696 return nullptr; // native or abstract method
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700697 } else {
Ian Rogers13735952014-10-08 12:43:28 -0700698 const uint8_t* addr = begin_ + code_off;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700699 return reinterpret_cast<const CodeItem*>(addr);
700 }
701 }
702
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100703 const char* GetReturnTypeDescriptor(const ProtoId& proto_id) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700704
705 // Returns the number of prototype identifiers in the .dex file.
706 size_t NumProtoIds() const {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700707 DCHECK(header_ != nullptr) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700708 return header_->proto_ids_size_;
709 }
710
711 // Returns the ProtoId at the specified index.
712 const ProtoId& GetProtoId(uint32_t idx) const {
Ian Rogers4f6ad8a2013-03-18 15:27:28 -0700713 DCHECK_LT(idx, NumProtoIds()) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700714 return proto_ids_[idx];
715 }
716
717 uint16_t GetIndexForProtoId(const ProtoId& proto_id) const {
Brian Carlstrom61e513c2011-12-09 15:30:06 -0800718 CHECK_GE(&proto_id, proto_ids_) << GetLocation();
719 CHECK_LT(&proto_id, proto_ids_ + header_->proto_ids_size_) << GetLocation();
Ian Rogers0571d352011-11-03 19:51:38 -0700720 return &proto_id - proto_ids_;
721 }
722
723 // Looks up a proto id for a given return type and signature type list
Ian Rogersd91d6d62013-09-25 20:26:14 -0700724 const ProtoId* FindProtoId(uint16_t return_type_idx,
Vladimir Marko5c96e6b2013-11-14 15:34:17 +0000725 const uint16_t* signature_type_idxs, uint32_t signature_length) const;
726 const ProtoId* FindProtoId(uint16_t return_type_idx,
727 const std::vector<uint16_t>& signature_type_idxs) const {
728 return FindProtoId(return_type_idx, &signature_type_idxs[0], signature_type_idxs.size());
729 }
Ian Rogers0571d352011-11-03 19:51:38 -0700730
731 // Given a signature place the type ids into the given vector, returns true on success
Ian Rogersd91d6d62013-09-25 20:26:14 -0700732 bool CreateTypeList(const StringPiece& signature, uint16_t* return_type_idx,
733 std::vector<uint16_t>* param_type_idxs) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700734
Ian Rogersd91d6d62013-09-25 20:26:14 -0700735 // Create a Signature from the given string signature or return Signature::NoSignature if not
736 // possible.
737 const Signature CreateSignature(const StringPiece& signature) const;
Ian Rogers0571d352011-11-03 19:51:38 -0700738
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700739 // Returns the short form method descriptor for the given prototype.
Vladimir Marko5c6a5872016-06-27 13:50:16 +0100740 const char* GetShorty(uint32_t proto_idx) const;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700741
742 const TypeList* GetProtoParameters(const ProtoId& proto_id) const {
743 if (proto_id.parameters_off_ == 0) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700744 return nullptr;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700745 } else {
Ian Rogers13735952014-10-08 12:43:28 -0700746 const uint8_t* addr = begin_ + proto_id.parameters_off_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700747 return reinterpret_cast<const TypeList*>(addr);
748 }
749 }
750
Ian Rogers13735952014-10-08 12:43:28 -0700751 const uint8_t* GetEncodedStaticFieldValuesArray(const ClassDef& class_def) const {
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700752 if (class_def.static_values_off_ == 0) {
753 return 0;
754 } else {
Ian Rogers30fab402012-01-23 15:43:46 -0800755 return begin_ + class_def.static_values_off_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700756 }
757 }
758
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800759 static const TryItem* GetTryItems(const CodeItem& code_item, uint32_t offset);
Shih-wei Liao2fb97532011-08-11 16:17:23 -0700760
761 // Get the base of the encoded data for the given DexCode.
Ian Rogers13735952014-10-08 12:43:28 -0700762 static const uint8_t* GetCatchHandlerData(const CodeItem& code_item, uint32_t offset) {
763 const uint8_t* handler_data =
764 reinterpret_cast<const uint8_t*>(GetTryItems(code_item, code_item.tries_size_));
Shih-wei Liao2fb97532011-08-11 16:17:23 -0700765 return handler_data + offset;
766 }
767
Ian Rogersdbbc99d2013-04-18 16:51:54 -0700768 // Find which try region is associated with the given address (ie dex pc). Returns -1 if none.
769 static int32_t FindTryItem(const CodeItem &code_item, uint32_t address);
770
771 // Find the handler offset associated with the given address (ie dex pc). Returns -1 if none.
772 static int32_t FindCatchHandlerOffset(const CodeItem &code_item, uint32_t address);
Shih-wei Liao2fb97532011-08-11 16:17:23 -0700773
Shih-wei Liao195487c2011-08-20 13:29:04 -0700774 // Get the pointer to the start of the debugging data
Ian Rogers13735952014-10-08 12:43:28 -0700775 const uint8_t* GetDebugInfoStream(const CodeItem* code_item) const {
David Srbecky68529422015-07-07 19:13:29 +0100776 // Check that the offset is in bounds.
777 // Note that although the specification says that 0 should be used if there
778 // is no debug information, some applications incorrectly use 0xFFFFFFFF.
779 if (code_item->debug_info_off_ == 0 || code_item->debug_info_off_ >= size_) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700780 return nullptr;
Shih-wei Liao195487c2011-08-20 13:29:04 -0700781 } else {
Ian Rogers30fab402012-01-23 15:43:46 -0800782 return begin_ + code_item->debug_info_off_;
Shih-wei Liao195487c2011-08-20 13:29:04 -0700783 }
784 }
785
// One position table entry as passed to DexDebugNewPositionCb. A default
// constructed entry has every field zero / null / false.
struct PositionInfo {
  PositionInfo() {}

  uint32_t address_ = 0;                // In 16-bit code units.
  uint32_t line_ = 0;                   // Source code line number starting at 1.
  const char* source_file_ = nullptr;   // nullptr if the file from ClassDef still applies.
  bool prologue_end_ = false;
  bool epilogue_begin_ = false;
};
801
Shih-wei Liao195487c2011-08-20 13:29:04 -0700802 // Callback for "new position table entry".
803 // Returning true causes the decoder to stop early.
David Srbeckyb06e28e2015-12-10 13:15:00 +0000804 typedef bool (*DexDebugNewPositionCb)(void* context, const PositionInfo& entry);
Shih-wei Liao195487c2011-08-20 13:29:04 -0700805
// One locals table entry as passed to DexDebugNewLocalCb. A default
// constructed entry has every field zero / null / false.
struct LocalInfo {
  LocalInfo() {}

  const char* name_ = nullptr;        // E.g., list.  It can be nullptr if unknown.
  const char* descriptor_ = nullptr;  // E.g., Ljava/util/LinkedList;
  const char* signature_ = nullptr;   // E.g., java.util.LinkedList<java.lang.Integer>
  uint32_t start_address_ = 0;        // PC location where the local is first defined.
  uint32_t end_address_ = 0;          // PC location where the local is no longer defined.
  uint16_t reg_ = 0;                  // Dex register which stores the values.
  bool is_live_ = false;              // Is the local defined and live.
};
825
826 // Callback for "new locals table entry".
827 typedef void (*DexDebugNewLocalCb)(void* context, const LocalInfo& entry);
828
829 static bool LineNumForPcCb(void* context, const PositionInfo& entry);
Shih-wei Liao195487c2011-08-20 13:29:04 -0700830
Jeff Hao13e748b2015-08-25 20:44:19 +0000831 const AnnotationsDirectoryItem* GetAnnotationsDirectory(const ClassDef& class_def) const {
832 if (class_def.annotations_off_ == 0) {
833 return nullptr;
834 } else {
835 return reinterpret_cast<const AnnotationsDirectoryItem*>(begin_ + class_def.annotations_off_);
836 }
837 }
838
839 const AnnotationSetItem* GetClassAnnotationSet(const AnnotationsDirectoryItem* anno_dir) const {
840 if (anno_dir->class_annotations_off_ == 0) {
841 return nullptr;
842 } else {
843 return reinterpret_cast<const AnnotationSetItem*>(begin_ + anno_dir->class_annotations_off_);
844 }
845 }
846
847 const FieldAnnotationsItem* GetFieldAnnotations(const AnnotationsDirectoryItem* anno_dir) const {
848 if (anno_dir->fields_size_ == 0) {
849 return nullptr;
850 } else {
851 return reinterpret_cast<const FieldAnnotationsItem*>(&anno_dir[1]);
852 }
853 }
854
855 const MethodAnnotationsItem* GetMethodAnnotations(const AnnotationsDirectoryItem* anno_dir)
856 const {
857 if (anno_dir->methods_size_ == 0) {
858 return nullptr;
859 } else {
860 // Skip past the header and field annotations.
861 const uint8_t* addr = reinterpret_cast<const uint8_t*>(&anno_dir[1]);
862 addr += anno_dir->fields_size_ * sizeof(FieldAnnotationsItem);
863 return reinterpret_cast<const MethodAnnotationsItem*>(addr);
864 }
865 }
866
867 const ParameterAnnotationsItem* GetParameterAnnotations(const AnnotationsDirectoryItem* anno_dir)
868 const {
869 if (anno_dir->parameters_size_ == 0) {
870 return nullptr;
871 } else {
872 // Skip past the header, field annotations, and method annotations.
873 const uint8_t* addr = reinterpret_cast<const uint8_t*>(&anno_dir[1]);
874 addr += anno_dir->fields_size_ * sizeof(FieldAnnotationsItem);
875 addr += anno_dir->methods_size_ * sizeof(MethodAnnotationsItem);
876 return reinterpret_cast<const ParameterAnnotationsItem*>(addr);
877 }
878 }
879
880 const AnnotationSetItem* GetFieldAnnotationSetItem(const FieldAnnotationsItem& anno_item) const {
881 uint32_t offset = anno_item.annotations_off_;
882 if (offset == 0) {
883 return nullptr;
884 } else {
885 return reinterpret_cast<const AnnotationSetItem*>(begin_ + offset);
886 }
887 }
888
889 const AnnotationSetItem* GetMethodAnnotationSetItem(const MethodAnnotationsItem& anno_item)
890 const {
891 uint32_t offset = anno_item.annotations_off_;
892 if (offset == 0) {
893 return nullptr;
894 } else {
895 return reinterpret_cast<const AnnotationSetItem*>(begin_ + offset);
896 }
897 }
898
899 const AnnotationSetRefList* GetParameterAnnotationSetRefList(
900 const ParameterAnnotationsItem* anno_item) const {
901 uint32_t offset = anno_item->annotations_off_;
902 if (offset == 0) {
903 return nullptr;
904 }
905 return reinterpret_cast<const AnnotationSetRefList*>(begin_ + offset);
906 }
907
908 const AnnotationItem* GetAnnotationItem(const AnnotationSetItem* set_item, uint32_t index) const {
909 DCHECK_LE(index, set_item->size_);
910 uint32_t offset = set_item->entries_[index];
911 if (offset == 0) {
912 return nullptr;
913 } else {
914 return reinterpret_cast<const AnnotationItem*>(begin_ + offset);
915 }
916 }
917
918 const AnnotationSetItem* GetSetRefItemItem(const AnnotationSetRefItem* anno_item) const {
919 uint32_t offset = anno_item->annotations_off_;
920 if (offset == 0) {
921 return nullptr;
922 }
923 return reinterpret_cast<const AnnotationSetItem*>(begin_ + offset);
924 }
925
// Debug info opcodes and constants.
enum {
  // Opcodes.
  DBG_END_SEQUENCE         = 0x00,
  DBG_ADVANCE_PC           = 0x01,
  DBG_ADVANCE_LINE         = 0x02,
  DBG_START_LOCAL          = 0x03,
  DBG_START_LOCAL_EXTENDED = 0x04,
  DBG_END_LOCAL            = 0x05,
  DBG_RESTART_LOCAL        = 0x06,
  DBG_SET_PROLOGUE_END     = 0x07,
  DBG_SET_EPILOGUE_BEGIN   = 0x08,
  DBG_SET_FILE             = 0x09,
  DBG_FIRST_SPECIAL        = 0x0a,

  // Constants.
  DBG_LINE_BASE            = -4,
  DBG_LINE_RANGE           = 15,
};
942
Shih-wei Liao195487c2011-08-20 13:29:04 -0700943 struct LineNumFromPcContext {
Ian Rogersca190662012-06-26 15:45:57 -0700944 LineNumFromPcContext(uint32_t address, uint32_t line_num)
945 : address_(address), line_num_(line_num) {}
Shih-wei Liao195487c2011-08-20 13:29:04 -0700946 uint32_t address_;
947 uint32_t line_num_;
Brian Carlstromd2fbb2b2011-08-23 11:57:08 -0700948 private:
949 DISALLOW_COPY_AND_ASSIGN(LineNumFromPcContext);
Shih-wei Liao195487c2011-08-20 13:29:04 -0700950 };
951
Roland Levillain91d65e02016-01-19 15:59:16 +0000952 // Returns false if there is no debugging information or if it cannot be decoded.
David Srbeckyb06e28e2015-12-10 13:15:00 +0000953 bool DecodeDebugLocalInfo(const CodeItem* code_item, bool is_static, uint32_t method_idx,
954 DexDebugNewLocalCb local_cb, void* context) const;
955
Roland Levillain91d65e02016-01-19 15:59:16 +0000956 // Returns false if there is no debugging information or if it cannot be decoded.
David Srbeckyb06e28e2015-12-10 13:15:00 +0000957 bool DecodeDebugPositionInfo(const CodeItem* code_item, DexDebugNewPositionCb position_cb,
958 void* context) const;
Shih-wei Liao195487c2011-08-20 13:29:04 -0700959
Ian Rogers0571d352011-11-03 19:51:38 -0700960 const char* GetSourceFile(const ClassDef& class_def) const {
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700961 if (class_def.source_file_idx_ == 0xffffffff) {
Mathieu Chartier2cebb242015-04-21 16:50:40 -0700962 return nullptr;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700963 } else {
Ian Rogers0571d352011-11-03 19:51:38 -0700964 return StringDataByIdx(class_def.source_file_idx_);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -0700965 }
Carl Shapiro0e5d75d2011-07-06 18:28:37 -0700966 }
967
Ian Rogers2dd0e2c2013-01-24 12:42:14 -0800968 int GetPermissions() const;
Ian Rogers1c849e52012-06-28 14:00:33 -0700969
Sebastien Hertz2d6ba512013-05-17 11:31:37 +0200970 bool IsReadOnly() const;
971
Brian Carlstrome0948e12013-08-29 09:36:15 -0700972 bool EnableWrite() const;
Sebastien Hertz2d6ba512013-05-17 11:31:37 +0200973
Brian Carlstrome0948e12013-08-29 09:36:15 -0700974 bool DisableWrite() const;
Sebastien Hertz2d6ba512013-05-17 11:31:37 +0200975
Ian Rogers13735952014-10-08 12:43:28 -0700976 const uint8_t* Begin() const {
Ian Rogers8b2c0b92013-09-19 02:56:49 -0700977 return begin_;
978 }
979
980 size_t Size() const {
981 return size_;
982 }
983
Andreas Gampe90e34042015-04-27 20:01:52 -0700984 // Return the name of the index-th classes.dex in a multidex zip file. This is classes.dex for
985 // index == 0, and classes{index + 1}.dex else.
986 static std::string GetMultiDexClassesDexName(size_t index);
987
988 // Return the (possibly synthetic) dex location for a multidex entry. This is dex_location for
989 // index == 0, and dex_location + multi-dex-separator + GetMultiDexClassesDexName(index) else.
990 static std::string GetMultiDexLocation(size_t index, const char* dex_location);
Calin Juravle4e1d5792014-07-15 23:56:47 +0100991
992 // Returns the canonical form of the given dex location.
993 //
994 // There are different flavors of "dex locations" as follows:
995 // the file name of a dex file:
996 // The actual file path that the dex file has on disk.
997 // dex_location:
998 // This acts as a key for the class linker to know which dex file to load.
999 // It may correspond to either an old odex file or a particular dex file
1000 // inside an oat file. In the first case it will also match the file name
1001 // of the dex file. In the second case (oat) it will include the file name
1002 // and possibly some multidex annotation to uniquely identify it.
1003 // canonical_dex_location:
1004 // the dex_location where its file name part has been made canonical.
1005 static std::string GetDexCanonicalLocation(const char* dex_location);
1006
Richard Uhler07b3c232015-03-31 15:57:54 -07001007 const OatDexFile* GetOatDexFile() const {
1008 return oat_dex_file_;
Andreas Gampefd9eb392014-11-06 16:52:58 -08001009 }
1010
Artem Udovichenkod9786b02015-10-14 16:36:55 +03001011 TypeLookupTable* GetTypeLookupTable() const {
1012 return lookup_table_.get();
1013 }
1014
Vladimir Marko9bdf1082016-01-21 12:15:52 +00001015 void CreateTypeLookupTable(uint8_t* storage = nullptr) const;
Artem Udovichenkod9786b02015-10-14 16:36:55 +03001016
David Sehr9323e6e2016-09-13 08:58:35 -07001017 // Utility methods for reading integral values from a buffer.
1018 static int32_t ReadSignedInt(const uint8_t* ptr, int zwidth);
1019 static uint32_t ReadUnsignedInt(const uint8_t* ptr, int zwidth, bool fill_on_right);
1020 static int64_t ReadSignedLong(const uint8_t* ptr, int zwidth);
1021 static uint64_t ReadUnsignedLong(const uint8_t* ptr, int zwidth, bool fill_on_right);
1022
Carl Shapiro1fb86202011-06-27 17:43:13 -07001023 private:
Brian Carlstrom58ae9412011-10-04 00:56:06 -07001024 // Opens a .dex file
Aart Bik37d6a3b2016-06-21 18:30:10 -07001025 static std::unique_ptr<const DexFile> OpenFile(int fd,
1026 const char* location,
1027 bool verify,
1028 bool verify_checksum,
1029 std::string* error_msg);
Brian Carlstrom58ae9412011-10-04 00:56:06 -07001030
Andreas Gampe833a4852014-05-21 18:46:59 -07001031 // Opens dex files from within a .jar, .zip, or .apk file
Aart Bik37d6a3b2016-06-21 18:30:10 -07001032 static bool OpenZip(int fd,
1033 const std::string& location,
1034 bool verify_checksum,
1035 std::string* error_msg,
Richard Uhlerfbef44d2014-12-23 09:48:51 -08001036 std::vector<std::unique_ptr<const DexFile>>* dex_files);
Andreas Gampe833a4852014-05-21 18:46:59 -07001037
// Result codes reported through the error_code out-parameter of the
// zip-archive Open() overload.
enum class ZipOpenErrorCode {  // private
  kNoError,
  kEntryNotFound,
  kExtractToMemoryError,
  kDexFileError,
  kMakeReadOnlyError,
  kVerifyError,
};
1046
Mathieu Chartier2cebb242015-04-21 16:50:40 -07001047 // Opens .dex file from the entry_name in a zip archive. error_code is undefined when non-null
Andreas Gampe833a4852014-05-21 18:46:59 -07001048 // return.
Aart Bik37d6a3b2016-06-21 18:30:10 -07001049 static std::unique_ptr<const DexFile> Open(const ZipArchive& zip_archive,
1050 const char* entry_name,
1051 const std::string& location,
1052 bool verify_checksum,
1053 std::string* error_msg,
Richard Uhlerfbef44d2014-12-23 09:48:51 -08001054 ZipOpenErrorCode* error_code);
Brian Carlstrom58ae9412011-10-04 00:56:06 -07001055
Brian Carlstrom89521892011-12-07 22:05:07 -08001056 // Opens a .dex file at the given address backed by a MemMap
Richard Uhlerfbef44d2014-12-23 09:48:51 -08001057 static std::unique_ptr<const DexFile> OpenMemory(const std::string& location,
1058 uint32_t location_checksum,
Orion Hodsona4c2a052016-08-17 10:51:42 +01001059 std::unique_ptr<MemMap> mem_map,
Richard Uhlerfbef44d2014-12-23 09:48:51 -08001060 std::string* error_msg);
Brian Carlstrom89521892011-12-07 22:05:07 -08001061
1062 // Opens a .dex file at the given address, optionally backed by a MemMap
Richard Uhlerfbef44d2014-12-23 09:48:51 -08001063 static std::unique_ptr<const DexFile> OpenMemory(const uint8_t* dex_file,
1064 size_t size,
1065 const std::string& location,
1066 uint32_t location_checksum,
Orion Hodsona4c2a052016-08-17 10:51:42 +01001067 std::unique_ptr<MemMap> mem_map,
Richard Uhler07b3c232015-03-31 15:57:54 -07001068 const OatDexFile* oat_dex_file,
Richard Uhlerfbef44d2014-12-23 09:48:51 -08001069 std::string* error_msg);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001070
Ian Rogers13735952014-10-08 12:43:28 -07001071 DexFile(const uint8_t* base, size_t size,
Brian Carlstrom28db0122012-10-18 16:20:41 -07001072 const std::string& location,
1073 uint32_t location_checksum,
Orion Hodsona4c2a052016-08-17 10:51:42 +01001074 std::unique_ptr<MemMap> mem_map,
Richard Uhler07b3c232015-03-31 15:57:54 -07001075 const OatDexFile* oat_dex_file);
jeffhaof6174e82012-01-31 16:14:17 -08001076
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001077 // Top-level initializer that calls other Init methods.
Ian Rogers8d31bbd2013-10-13 10:44:14 -07001078 bool Init(std::string* error_msg);
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001079
Brian Carlstrom6e3b1d92012-01-11 01:36:32 -08001080 // Returns true if the header magic and version numbers are of the expected values.
Ian Rogers8d31bbd2013-10-13 10:44:14 -07001081 bool CheckMagicAndVersion(std::string* error_msg) const;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001082
Andreas Gampe833a4852014-05-21 18:46:59 -07001083 // Check whether a location denotes a multidex dex file. This is a very simple check: returns
1084 // whether the string contains the separator character.
1085 static bool IsMultiDexLocation(const char* location);
1086
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001087 // The base address of the memory mapping.
Ian Rogers13735952014-10-08 12:43:28 -07001088 const uint8_t* const begin_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001089
1090 // The size of the underlying memory allocation in bytes.
Ian Rogers62d6c772013-02-27 08:32:07 -08001091 const size_t size_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001092
Elliott Hughes64bf5a32011-09-20 14:43:12 -07001093 // Typically the dex file name when available, alternatively some identifying string.
Brian Carlstroma663ea52011-08-19 23:33:41 -07001094 //
1095 // The ClassLinker will use this to match DexFiles the boot class
1096 // path to DexCache::GetLocation when loading from an image.
1097 const std::string location_;
1098
Brian Carlstrom5b332c82012-02-01 15:02:31 -08001099 const uint32_t location_checksum_;
1100
Brian Carlstrom33f741e2011-10-03 11:24:05 -07001101 // Manages the underlying memory allocation.
Ian Rogers700a4022014-05-19 16:49:03 -07001102 std::unique_ptr<MemMap> mem_map_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001103
1104 // Points to the header section.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001105 const Header* const header_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001106
1107 // Points to the base of the string identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001108 const StringId* const string_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001109
1110 // Points to the base of the type identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001111 const TypeId* const type_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001112
1113 // Points to the base of the field identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001114 const FieldId* const field_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001115
1116 // Points to the base of the method identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001117 const MethodId* const method_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001118
1119 // Points to the base of the prototype identifier list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001120 const ProtoId* const proto_ids_;
Brian Carlstrom7e49dca2011-07-22 18:07:34 -07001121
1122 // Points to the base of the class definition list.
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001123 const ClassDef* const class_defs_;
Ian Rogers68b56852014-08-29 20:19:11 -07001124
Richard Uhler07b3c232015-03-31 15:57:54 -07001125 // If this dex file was loaded from an oat file, oat_dex_file_ contains a
1126 // pointer to the OatDexFile it was loaded from. Otherwise oat_dex_file_ is
1127 // null.
1128 const OatDexFile* oat_dex_file_;
Artem Udovichenkod9786b02015-10-14 16:36:55 +03001129 mutable std::unique_ptr<TypeLookupTable> lookup_table_;
Andreas Gampee6215c02015-08-31 18:54:38 -07001130
1131 friend class DexFileVerifierTest;
Mathieu Chartier76172162016-01-26 14:54:06 -08001132 ART_FRIEND_TEST(ClassLinkerTest, RegisterDexFileName); // for constructor
Carl Shapiro1fb86202011-06-27 17:43:13 -07001133};
Mathieu Chartiere5f13e52015-02-24 09:37:21 -08001134
1135struct DexFileReference {
1136 DexFileReference(const DexFile* file, uint32_t idx) : dex_file(file), index(idx) { }
1137 const DexFile* dex_file;
1138 uint32_t index;
1139};
1140
Brian Carlstrom0d6adac2014-02-05 17:39:16 -08001141std::ostream& operator<<(std::ostream& os, const DexFile& dex_file);
Carl Shapiro1fb86202011-06-27 17:43:13 -07001142
Ian Rogers0571d352011-11-03 19:51:38 -07001143// Iterate over a dex file's ProtoId's paramters
1144class DexFileParameterIterator {
1145 public:
1146 DexFileParameterIterator(const DexFile& dex_file, const DexFile::ProtoId& proto_id)
1147 : dex_file_(dex_file), size_(0), pos_(0) {
1148 type_list_ = dex_file_.GetProtoParameters(proto_id);
Mathieu Chartier2cebb242015-04-21 16:50:40 -07001149 if (type_list_ != nullptr) {
Ian Rogers0571d352011-11-03 19:51:38 -07001150 size_ = type_list_->Size();
1151 }
1152 }
1153 bool HasNext() const { return pos_ < size_; }
David Srbeckyb06e28e2015-12-10 13:15:00 +00001154 size_t Size() const { return size_; }
Ian Rogers0571d352011-11-03 19:51:38 -07001155 void Next() { ++pos_; }
Ian Rogers6d4d9fc2011-11-30 16:24:48 -08001156 uint16_t GetTypeIdx() {
Ian Rogers0571d352011-11-03 19:51:38 -07001157 return type_list_->GetTypeItem(pos_).type_idx_;
1158 }
1159 const char* GetDescriptor() {
Ian Rogers6d4d9fc2011-11-30 16:24:48 -08001160 return dex_file_.StringByTypeIdx(GetTypeIdx());
Ian Rogers0571d352011-11-03 19:51:38 -07001161 }
1162 private:
1163 const DexFile& dex_file_;
1164 const DexFile::TypeList* type_list_;
1165 uint32_t size_;
1166 uint32_t pos_;
1167 DISALLOW_IMPLICIT_CONSTRUCTORS(DexFileParameterIterator);
1168};
1169
Ian Rogersd91d6d62013-09-25 20:26:14 -07001170// Abstract the signature of a method.
Ian Rogers03b6eaf2014-10-28 09:34:57 -07001171class Signature : public ValueObject {
Ian Rogersd91d6d62013-09-25 20:26:14 -07001172 public:
1173 std::string ToString() const;
1174
1175 static Signature NoSignature() {
1176 return Signature();
1177 }
1178
Ian Rogersdfb325e2013-10-30 01:00:44 -07001179 bool operator==(const Signature& rhs) const;
Ian Rogersd91d6d62013-09-25 20:26:14 -07001180 bool operator!=(const Signature& rhs) const {
1181 return !(*this == rhs);
1182 }
1183
Vladimir Markod9cffea2013-11-25 15:08:02 +00001184 bool operator==(const StringPiece& rhs) const;
Ian Rogersd91d6d62013-09-25 20:26:14 -07001185
1186 private:
1187 Signature(const DexFile* dex, const DexFile::ProtoId& proto) : dex_file_(dex), proto_id_(&proto) {
1188 }
1189
1190 Signature() : dex_file_(nullptr), proto_id_(nullptr) {
1191 }
1192
1193 friend class DexFile;
1194
1195 const DexFile* const dex_file_;
1196 const DexFile::ProtoId* const proto_id_;
1197};
1198std::ostream& operator<<(std::ostream& os, const Signature& sig);
1199
Ian Rogers0571d352011-11-03 19:51:38 -07001200// Iterate and decode class_data_item
1201class ClassDataItemIterator {
1202 public:
Ian Rogers13735952014-10-08 12:43:28 -07001203 ClassDataItemIterator(const DexFile& dex_file, const uint8_t* raw_class_data_item)
Ian Rogers0571d352011-11-03 19:51:38 -07001204 : dex_file_(dex_file), pos_(0), ptr_pos_(raw_class_data_item), last_idx_(0) {
1205 ReadClassDataHeader();
1206 if (EndOfInstanceFieldsPos() > 0) {
1207 ReadClassDataField();
1208 } else if (EndOfVirtualMethodsPos() > 0) {
1209 ReadClassDataMethod();
1210 }
1211 }
1212 uint32_t NumStaticFields() const {
1213 return header_.static_fields_size_;
1214 }
1215 uint32_t NumInstanceFields() const {
1216 return header_.instance_fields_size_;
1217 }
1218 uint32_t NumDirectMethods() const {
1219 return header_.direct_methods_size_;
1220 }
1221 uint32_t NumVirtualMethods() const {
1222 return header_.virtual_methods_size_;
1223 }
1224 bool HasNextStaticField() const {
1225 return pos_ < EndOfStaticFieldsPos();
1226 }
1227 bool HasNextInstanceField() const {
1228 return pos_ >= EndOfStaticFieldsPos() && pos_ < EndOfInstanceFieldsPos();
1229 }
1230 bool HasNextDirectMethod() const {
1231 return pos_ >= EndOfInstanceFieldsPos() && pos_ < EndOfDirectMethodsPos();
1232 }
1233 bool HasNextVirtualMethod() const {
1234 return pos_ >= EndOfDirectMethodsPos() && pos_ < EndOfVirtualMethodsPos();
1235 }
1236 bool HasNext() const {
1237 return pos_ < EndOfVirtualMethodsPos();
1238 }
Ian Rogers637c65b2013-05-31 11:46:00 -07001239 inline void Next() {
Ian Rogers0571d352011-11-03 19:51:38 -07001240 pos_++;
1241 if (pos_ < EndOfStaticFieldsPos()) {
1242 last_idx_ = GetMemberIndex();
1243 ReadClassDataField();
1244 } else if (pos_ == EndOfStaticFieldsPos() && NumInstanceFields() > 0) {
1245 last_idx_ = 0; // transition to next array, reset last index
1246 ReadClassDataField();
1247 } else if (pos_ < EndOfInstanceFieldsPos()) {
1248 last_idx_ = GetMemberIndex();
1249 ReadClassDataField();
1250 } else if (pos_ == EndOfInstanceFieldsPos() && NumDirectMethods() > 0) {
1251 last_idx_ = 0; // transition to next array, reset last index
1252 ReadClassDataMethod();
1253 } else if (pos_ < EndOfDirectMethodsPos()) {
1254 last_idx_ = GetMemberIndex();
1255 ReadClassDataMethod();
1256 } else if (pos_ == EndOfDirectMethodsPos() && NumVirtualMethods() > 0) {
1257 last_idx_ = 0; // transition to next array, reset last index
1258 ReadClassDataMethod();
1259 } else if (pos_ < EndOfVirtualMethodsPos()) {
1260 last_idx_ = GetMemberIndex();
1261 ReadClassDataMethod();
1262 } else {
1263 DCHECK(!HasNext());
1264 }
1265 }
1266 uint32_t GetMemberIndex() const {
1267 if (pos_ < EndOfInstanceFieldsPos()) {
1268 return last_idx_ + field_.field_idx_delta_;
1269 } else {
Sebastien Hertzb24bd992013-08-02 15:19:09 +02001270 DCHECK_LT(pos_, EndOfVirtualMethodsPos());
Ian Rogers0571d352011-11-03 19:51:38 -07001271 return last_idx_ + method_.method_idx_delta_;
1272 }
1273 }
Andreas Gampe51829322014-08-25 15:05:04 -07001274 uint32_t GetRawMemberAccessFlags() const {
Ian Rogers0571d352011-11-03 19:51:38 -07001275 if (pos_ < EndOfInstanceFieldsPos()) {
1276 return field_.access_flags_;
1277 } else {
Sebastien Hertzb24bd992013-08-02 15:19:09 +02001278 DCHECK_LT(pos_, EndOfVirtualMethodsPos());
Ian Rogers0571d352011-11-03 19:51:38 -07001279 return method_.access_flags_;
1280 }
1281 }
Andreas Gampe51829322014-08-25 15:05:04 -07001282 uint32_t GetFieldAccessFlags() const {
1283 return GetRawMemberAccessFlags() & kAccValidFieldFlags;
1284 }
1285 uint32_t GetMethodAccessFlags() const {
1286 return GetRawMemberAccessFlags() & kAccValidMethodFlags;
1287 }
1288 bool MemberIsNative() const {
1289 return GetRawMemberAccessFlags() & kAccNative;
1290 }
1291 bool MemberIsFinal() const {
1292 return GetRawMemberAccessFlags() & kAccFinal;
1293 }
Ian Rogers08f753d2012-08-24 14:35:25 -07001294 InvokeType GetMethodInvokeType(const DexFile::ClassDef& class_def) const {
1295 if (HasNextDirectMethod()) {
Andreas Gampe51829322014-08-25 15:05:04 -07001296 if ((GetRawMemberAccessFlags() & kAccStatic) != 0) {
Ian Rogers08f753d2012-08-24 14:35:25 -07001297 return kStatic;
1298 } else {
1299 return kDirect;
1300 }
1301 } else {
Andreas Gampe51829322014-08-25 15:05:04 -07001302 DCHECK_EQ(GetRawMemberAccessFlags() & kAccStatic, 0U);
Ian Rogers08f753d2012-08-24 14:35:25 -07001303 if ((class_def.access_flags_ & kAccInterface) != 0) {
1304 return kInterface;
Andreas Gampe51829322014-08-25 15:05:04 -07001305 } else if ((GetRawMemberAccessFlags() & kAccConstructor) != 0) {
Ian Rogers08f753d2012-08-24 14:35:25 -07001306 return kSuper;
1307 } else {
1308 return kVirtual;
1309 }
1310 }
1311 }
Ian Rogers0571d352011-11-03 19:51:38 -07001312 const DexFile::CodeItem* GetMethodCodeItem() const {
1313 return dex_file_.GetCodeItem(method_.code_off_);
1314 }
1315 uint32_t GetMethodCodeItemOffset() const {
1316 return method_.code_off_;
1317 }
Andreas Gampee6215c02015-08-31 18:54:38 -07001318 const uint8_t* DataPointer() const {
1319 return ptr_pos_;
1320 }
Ian Rogers13735952014-10-08 12:43:28 -07001321 const uint8_t* EndDataPointer() const {
jeffhao10037c82012-01-23 15:06:23 -08001322 CHECK(!HasNext());
1323 return ptr_pos_;
1324 }
Elliott Hughesa21039c2012-06-21 12:09:25 -07001325
Ian Rogers0571d352011-11-03 19:51:38 -07001326 private:
1327 // A dex file's class_data_item is leb128 encoded, this structure holds a decoded form of the
1328 // header for a class_data_item
1329 struct ClassDataHeader {
1330 uint32_t static_fields_size_; // the number of static fields
1331 uint32_t instance_fields_size_; // the number of instance fields
1332 uint32_t direct_methods_size_; // the number of direct methods
1333 uint32_t virtual_methods_size_; // the number of virtual methods
1334 } header_;
1335
1336 // Read and decode header from a class_data_item stream into header
1337 void ReadClassDataHeader();
1338
1339 uint32_t EndOfStaticFieldsPos() const {
1340 return header_.static_fields_size_;
1341 }
1342 uint32_t EndOfInstanceFieldsPos() const {
1343 return EndOfStaticFieldsPos() + header_.instance_fields_size_;
1344 }
1345 uint32_t EndOfDirectMethodsPos() const {
1346 return EndOfInstanceFieldsPos() + header_.direct_methods_size_;
1347 }
1348 uint32_t EndOfVirtualMethodsPos() const {
1349 return EndOfDirectMethodsPos() + header_.virtual_methods_size_;
1350 }
1351
1352 // A decoded version of the field of a class_data_item
1353 struct ClassDataField {
1354 uint32_t field_idx_delta_; // delta of index into the field_ids array for FieldId
1355 uint32_t access_flags_; // access flags for the field
1356 ClassDataField() : field_idx_delta_(0), access_flags_(0) {}
Elliott Hughesa21039c2012-06-21 12:09:25 -07001357
Ian Rogers0571d352011-11-03 19:51:38 -07001358 private:
1359 DISALLOW_COPY_AND_ASSIGN(ClassDataField);
Elliott Hughesee0fa762012-03-26 17:12:41 -07001360 };
1361 ClassDataField field_;
Ian Rogers0571d352011-11-03 19:51:38 -07001362
1363 // Read and decode a field from a class_data_item stream into field
1364 void ReadClassDataField();
1365
1366 // A decoded version of the method of a class_data_item
1367 struct ClassDataMethod {
1368 uint32_t method_idx_delta_; // delta of index into the method_ids array for MethodId
1369 uint32_t access_flags_;
1370 uint32_t code_off_;
1371 ClassDataMethod() : method_idx_delta_(0), access_flags_(0), code_off_(0) {}
Elliott Hughesa21039c2012-06-21 12:09:25 -07001372
Ian Rogers0571d352011-11-03 19:51:38 -07001373 private:
1374 DISALLOW_COPY_AND_ASSIGN(ClassDataMethod);
Elliott Hughesee0fa762012-03-26 17:12:41 -07001375 };
1376 ClassDataMethod method_;
Ian Rogers0571d352011-11-03 19:51:38 -07001377
1378 // Read and decode a method from a class_data_item stream into method
1379 void ReadClassDataMethod();
1380
1381 const DexFile& dex_file_;
1382 size_t pos_; // integral number of items passed
Ian Rogers13735952014-10-08 12:43:28 -07001383 const uint8_t* ptr_pos_; // pointer into stream of class_data_item
Ian Rogers0571d352011-11-03 19:51:38 -07001384 uint32_t last_idx_; // last read field or method index to apply delta to
1385 DISALLOW_IMPLICIT_CONSTRUCTORS(ClassDataItemIterator);
1386};
1387
Ian Rogers0571d352011-11-03 19:51:38 -07001388class EncodedStaticFieldValueIterator {
1389 public:
Shinichiro Hamaji82863f02015-11-05 16:51:33 +09001390 EncodedStaticFieldValueIterator(const DexFile& dex_file,
1391 const DexFile::ClassDef& class_def);
1392
Ian Rogers6a3c1fc2014-10-31 00:33:20 -07001393 bool HasNext() const { return pos_ < array_size_; }
Ian Rogers0571d352011-11-03 19:51:38 -07001394
1395 void Next();
Elliott Hughesa21039c2012-06-21 12:09:25 -07001396
Ian Rogers0571d352011-11-03 19:51:38 -07001397 enum ValueType {
1398 kByte = 0x00,
1399 kShort = 0x02,
1400 kChar = 0x03,
1401 kInt = 0x04,
1402 kLong = 0x06,
1403 kFloat = 0x10,
1404 kDouble = 0x11,
1405 kString = 0x17,
1406 kType = 0x18,
1407 kField = 0x19,
1408 kMethod = 0x1a,
1409 kEnum = 0x1b,
1410 kArray = 0x1c,
1411 kAnnotation = 0x1d,
1412 kNull = 0x1e,
1413 kBoolean = 0x1f
1414 };
1415
Shinichiro Hamaji82863f02015-11-05 16:51:33 +09001416 ValueType GetValueType() const { return type_; }
1417 const jvalue& GetJavaValue() const { return jval_; }
1418
David Sehr9323e6e2016-09-13 08:58:35 -07001419 protected:
Ian Rogers13735952014-10-08 12:43:28 -07001420 static constexpr uint8_t kEncodedValueTypeMask = 0x1f; // 0b11111
1421 static constexpr uint8_t kEncodedValueArgShift = 5;
Ian Rogers0571d352011-11-03 19:51:38 -07001422
1423 const DexFile& dex_file_;
Ian Rogers2dd0e2c2013-01-24 12:42:14 -08001424 size_t array_size_; // Size of array.
1425 size_t pos_; // Current position.
Ian Rogers13735952014-10-08 12:43:28 -07001426 const uint8_t* ptr_; // Pointer into encoded data array.
Ian Rogers2dd0e2c2013-01-24 12:42:14 -08001427 ValueType type_; // Type of current encoded value.
1428 jvalue jval_; // Value of current encoded value.
David Sehr9323e6e2016-09-13 08:58:35 -07001429
1430 private:
Ian Rogers0571d352011-11-03 19:51:38 -07001431 DISALLOW_IMPLICIT_CONSTRUCTORS(EncodedStaticFieldValueIterator);
1432};
Brian Carlstrom88f36542012-10-16 23:24:21 -07001433std::ostream& operator<<(std::ostream& os, const EncodedStaticFieldValueIterator::ValueType& code);
Ian Rogers0571d352011-11-03 19:51:38 -07001434
1435class CatchHandlerIterator {
1436 public:
1437 CatchHandlerIterator(const DexFile::CodeItem& code_item, uint32_t address);
Logan Chien736df022012-04-27 16:25:57 +08001438
1439 CatchHandlerIterator(const DexFile::CodeItem& code_item,
1440 const DexFile::TryItem& try_item);
1441
Ian Rogers13735952014-10-08 12:43:28 -07001442 explicit CatchHandlerIterator(const uint8_t* handler_data) {
Ian Rogers0571d352011-11-03 19:51:38 -07001443 Init(handler_data);
1444 }
1445
1446 uint16_t GetHandlerTypeIndex() const {
1447 return handler_.type_idx_;
1448 }
1449 uint32_t GetHandlerAddress() const {
1450 return handler_.address_;
1451 }
1452 void Next();
1453 bool HasNext() const {
1454 return remaining_count_ != -1 || catch_all_;
1455 }
1456 // End of this set of catch blocks, convenience method to locate next set of catch blocks
Ian Rogers13735952014-10-08 12:43:28 -07001457 const uint8_t* EndDataPointer() const {
Ian Rogers0571d352011-11-03 19:51:38 -07001458 CHECK(!HasNext());
1459 return current_data_;
1460 }
Elliott Hughesa21039c2012-06-21 12:09:25 -07001461
Ian Rogers0571d352011-11-03 19:51:38 -07001462 private:
Logan Chien736df022012-04-27 16:25:57 +08001463 void Init(const DexFile::CodeItem& code_item, int32_t offset);
Ian Rogers13735952014-10-08 12:43:28 -07001464 void Init(const uint8_t* handler_data);
Ian Rogers0571d352011-11-03 19:51:38 -07001465
1466 struct CatchHandlerItem {
1467 uint16_t type_idx_; // type index of the caught exception type
1468 uint32_t address_; // handler address
1469 } handler_;
Ian Rogers13735952014-10-08 12:43:28 -07001470 const uint8_t* current_data_; // the current handler in dex file.
Ian Rogers0571d352011-11-03 19:51:38 -07001471 int32_t remaining_count_; // number of handlers not read.
1472 bool catch_all_; // is there a handler that will catch all exceptions in case
1473 // that all typed handler does not match.
1474};
1475
Carl Shapiro1fb86202011-06-27 17:43:13 -07001476} // namespace art
1477
Brian Carlstromfc0e3212013-07-17 14:40:12 -07001478#endif // ART_RUNTIME_DEX_FILE_H_