blob: 3c8393f90cd164cf817e6f4154f6ddc5739036cd [file] [log] [blame]
Yabin Cuiec12ed92015-06-08 10:38:10 -07001/*
2 * Copyright (C) 2015 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "dso.h"
18
Yabin Cuib3783552015-06-11 11:15:42 -070019#include <stdlib.h>
Yabin Cuicc2e59e2015-08-21 14:23:43 -070020#include <string.h>
Yabin Cuic8485602015-08-20 15:04:39 -070021
Yabin Cuicc2e59e2015-08-21 14:23:43 -070022#include <algorithm>
Yabin Cuic8485602015-08-20 15:04:39 -070023#include <limits>
Yabin Cuidd401b32018-04-11 11:17:06 -070024#include <memory>
Yabin Cui7078c672020-11-10 16:24:12 -080025#include <optional>
Yabin Cui9ba4d942020-09-08 16:12:46 -070026#include <string_view>
Yabin Cuicc2e59e2015-08-21 14:23:43 -070027#include <vector>
Yabin Cuic8485602015-08-20 15:04:39 -070028
Yabin Cuib4212972016-05-25 14:08:05 -070029#include <android-base/file.h>
Elliott Hughes66dd09e2015-12-04 14:00:57 -080030#include <android-base/logging.h>
Yabin Cui40b70ff2018-04-09 14:06:08 -070031#include <android-base/strings.h>
Yabin Cuic8485602015-08-20 15:04:39 -070032
Yabin Cui075dd182020-08-05 19:51:36 +000033#include "JITDebugReader.h"
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +020034#include "environment.h"
ThiƩbaud Weksteene7e750e2020-11-19 15:07:46 +010035#include "kallsyms.h"
Yabin Cuib1a885b2016-02-14 19:18:02 -080036#include "read_apk.h"
Yabin Cui516a87c2018-03-26 17:34:00 -070037#include "read_dex_file.h"
Yabin Cuiec12ed92015-06-08 10:38:10 -070038#include "read_elf.h"
Yabin Cuib3783552015-06-11 11:15:42 -070039#include "utils.h"
Yabin Cuiec12ed92015-06-08 10:38:10 -070040
Yabin Cuifaa7b922021-01-11 17:35:57 -080041namespace simpleperf {
42
Yabin Cui075dd182020-08-05 19:51:36 +000043using android::base::EndsWith;
Yabin Cui9ba4d942020-09-08 16:12:46 -070044using android::base::StartsWith;
Yabin Cui3a880452020-06-29 16:37:31 -070045
Yabin Cui40b70ff2018-04-09 14:06:08 -070046namespace simpleperf_dso_impl {
47
Yabin Cui1b9b1c12018-10-29 14:23:48 -070048std::string RemovePathSeparatorSuffix(const std::string& path) {
49 // Don't remove path separator suffix for '/'.
Yabin Cui075dd182020-08-05 19:51:36 +000050 if (EndsWith(path, OS_PATH_SEPARATOR) && path.size() > 1u) {
Yabin Cui1b9b1c12018-10-29 14:23:48 -070051 return path.substr(0, path.size() - 1);
52 }
53 return path;
54}
55
Yabin Cui40b70ff2018-04-09 14:06:08 -070056void DebugElfFileFinder::Reset() {
Yabin Cui0bf695b2024-08-22 15:41:29 -070057 allow_mismatched_build_id_ = false;
Yabin Cui40b70ff2018-04-09 14:06:08 -070058 vdso_64bit_.clear();
59 vdso_32bit_.clear();
60 symfs_dir_.clear();
61 build_id_to_file_map_.clear();
62}
63
64bool DebugElfFileFinder::SetSymFsDir(const std::string& symfs_dir) {
Yabin Cui1b9b1c12018-10-29 14:23:48 -070065 symfs_dir_ = RemovePathSeparatorSuffix(symfs_dir);
66 if (!IsDir(symfs_dir_)) {
67 LOG(ERROR) << "Invalid symfs_dir '" << symfs_dir_ << "'";
68 return false;
Yabin Cui40b70ff2018-04-09 14:06:08 -070069 }
Yabin Cui1b9b1c12018-10-29 14:23:48 -070070 std::string build_id_list_file = symfs_dir_ + OS_PATH_SEPARATOR + "build_id_list";
Yabin Cui40b70ff2018-04-09 14:06:08 -070071 std::string build_id_list;
72 if (android::base::ReadFileToString(build_id_list_file, &build_id_list)) {
73 for (auto& line : android::base::Split(build_id_list, "\n")) {
Yabin Cui2969a9e2018-04-19 17:06:24 -070074 std::vector<std::string> items = android::base::Split(line, "=");
Yabin Cui40b70ff2018-04-09 14:06:08 -070075 if (items.size() == 2u) {
Yabin Cui1b9b1c12018-10-29 14:23:48 -070076 build_id_to_file_map_[items[0]] = symfs_dir_ + OS_PATH_SEPARATOR + items[1];
Yabin Cui40b70ff2018-04-09 14:06:08 -070077 }
78 }
79 }
80 return true;
81}
82
Yabin Cui3939b9d2018-07-20 17:12:13 -070083bool DebugElfFileFinder::AddSymbolDir(const std::string& symbol_dir) {
84 if (!IsDir(symbol_dir)) {
85 LOG(ERROR) << "Invalid symbol dir " << symbol_dir;
86 return false;
87 }
Yabin Cui1b9b1c12018-10-29 14:23:48 -070088 std::string dir = RemovePathSeparatorSuffix(symbol_dir);
Yabin Cui3939b9d2018-07-20 17:12:13 -070089 CollectBuildIdInDir(dir);
90 return true;
91}
92
93void DebugElfFileFinder::CollectBuildIdInDir(const std::string& dir) {
94 for (const std::string& entry : GetEntriesInDir(dir)) {
Yabin Cui1b9b1c12018-10-29 14:23:48 -070095 std::string path = dir + OS_PATH_SEPARATOR + entry;
Yabin Cui3939b9d2018-07-20 17:12:13 -070096 if (IsDir(path)) {
97 CollectBuildIdInDir(path);
98 } else {
99 BuildId build_id;
Yabin Cui3a880452020-06-29 16:37:31 -0700100 ElfStatus status;
101 auto elf = ElfFile::Open(path, &status);
Yabin Cuiab9cb232024-09-05 14:45:54 -0700102 if (status == ElfStatus::NO_ERROR) {
103 if (elf->GetBuildId(&build_id) == ElfStatus::NO_ERROR) {
104 build_id_to_file_map_[build_id.ToString()] = path;
105 } else {
106 no_build_id_files_.emplace_back(std::move(path));
107 }
Yabin Cui3939b9d2018-07-20 17:12:13 -0700108 }
109 }
110 }
111}
112
Yabin Cui40b70ff2018-04-09 14:06:08 -0700113void DebugElfFileFinder::SetVdsoFile(const std::string& vdso_file, bool is_64bit) {
114 if (is_64bit) {
115 vdso_64bit_ = vdso_file;
116 } else {
117 vdso_32bit_ = vdso_file;
118 }
119}
120
Yabin Cui0bf695b2024-08-22 15:41:29 -0700121bool DebugElfFileFinder::CheckDebugFilePath(const std::string& path, BuildId& build_id,
122 bool report_build_id_mismatch) {
Yabin Cui991477b2020-07-17 16:12:15 -0700123 ElfStatus status;
124 auto elf = ElfFile::Open(path, &status);
125 if (!elf) {
126 return false;
127 }
128 BuildId debug_build_id;
129 status = elf->GetBuildId(&debug_build_id);
130 if (status != ElfStatus::NO_ERROR && status != ElfStatus::NO_BUILD_ID) {
131 return false;
132 }
133
Yabin Cui0bf695b2024-08-22 15:41:29 -0700134 if (allow_mismatched_build_id_) {
135 return true;
136 }
137
Yabin Cui991477b2020-07-17 16:12:15 -0700138 // Native libraries in apks and kernel modules may not have build ids.
139 // So build_id and debug_build_id can either be empty, or have the same value.
140 bool match = build_id == debug_build_id;
141 if (!match && report_build_id_mismatch) {
142 LOG(WARNING) << path << " isn't used because of build id mismatch: expected " << build_id
143 << ", real " << debug_build_id;
144 }
145 return match;
146}
147
Yabin Cui40b70ff2018-04-09 14:06:08 -0700148std::string DebugElfFileFinder::FindDebugFile(const std::string& dso_path, bool force_64bit,
149 BuildId& build_id) {
150 if (dso_path == "[vdso]") {
151 if (force_64bit && !vdso_64bit_.empty()) {
152 return vdso_64bit_;
153 } else if (!force_64bit && !vdso_32bit_.empty()) {
154 return vdso_32bit_;
155 }
Yabin Cui3939b9d2018-07-20 17:12:13 -0700156 }
Yabin Cuid347bb42019-11-14 15:24:07 -0800157 if (build_id.IsEmpty()) {
158 // Try reading build id from file if we don't already have one.
159 GetBuildIdFromDsoPath(dso_path, &build_id);
160 }
Yabin Cui3939b9d2018-07-20 17:12:13 -0700161
Yabin Cui5d269c72019-05-31 15:30:17 -0700162 // 1. Try build_id_to_file_map.
163 if (!build_id_to_file_map_.empty()) {
Yabin Cui0bf695b2024-08-22 15:41:29 -0700164 if (!build_id.IsEmpty()) {
Yabin Cui5d269c72019-05-31 15:30:17 -0700165 auto it = build_id_to_file_map_.find(build_id.ToString());
Yabin Cui991477b2020-07-17 16:12:15 -0700166 if (it != build_id_to_file_map_.end() && CheckDebugFilePath(it->second, build_id, false)) {
Yabin Cui5d269c72019-05-31 15:30:17 -0700167 return it->second;
168 }
169 }
Yabin Cuiab9cb232024-09-05 14:45:54 -0700170 }
171 if (allow_mismatched_build_id_) {
172 std::optional<std::string> s = SearchFileMapByPath(dso_path);
173 if (s.has_value()) {
174 return s.value();
Yabin Cui0bf695b2024-08-22 15:41:29 -0700175 }
Yabin Cui5d269c72019-05-31 15:30:17 -0700176 }
Yabin Cui1b9b1c12018-10-29 14:23:48 -0700177 if (!symfs_dir_.empty()) {
Yabin Cuia4496ad2019-11-18 16:40:28 -0800178 // 2. Try concatenating symfs_dir and dso_path.
Yabin Cui1b9b1c12018-10-29 14:23:48 -0700179 std::string path = GetPathInSymFsDir(dso_path);
Yabin Cui991477b2020-07-17 16:12:15 -0700180 if (CheckDebugFilePath(path, build_id, true)) {
Yabin Cui1b9b1c12018-10-29 14:23:48 -0700181 return path;
182 }
Christopher Ferris56a3fa12021-10-12 17:23:30 -0700183 if (EndsWith(dso_path, ".apk") && IsRegularFile(path)) {
184 return path;
185 }
Yabin Cuia4496ad2019-11-18 16:40:28 -0800186 // 3. Try concatenating symfs_dir and basename of dso_path.
187 path = symfs_dir_ + OS_PATH_SEPARATOR + android::base::Basename(dso_path);
Yabin Cui991477b2020-07-17 16:12:15 -0700188 if (CheckDebugFilePath(path, build_id, false)) {
Yabin Cuia4496ad2019-11-18 16:40:28 -0800189 return path;
190 }
Yabin Cui3939b9d2018-07-20 17:12:13 -0700191 }
Yabin Cuia4496ad2019-11-18 16:40:28 -0800192 // 4. Try concatenating /usr/lib/debug and dso_path.
Yabin Cui3939b9d2018-07-20 17:12:13 -0700193 // Linux host can store debug shared libraries in /usr/lib/debug.
Yabin Cui991477b2020-07-17 16:12:15 -0700194 if (CheckDebugFilePath("/usr/lib/debug" + dso_path, build_id, false)) {
Yabin Cui3939b9d2018-07-20 17:12:13 -0700195 return "/usr/lib/debug" + dso_path;
196 }
Yabin Cui40b70ff2018-04-09 14:06:08 -0700197 return dso_path;
198}
Yabin Cui1b9b1c12018-10-29 14:23:48 -0700199
200std::string DebugElfFileFinder::GetPathInSymFsDir(const std::string& path) {
201 auto add_symfs_prefix = [&](const std::string& path) {
Yabin Cui9ba4d942020-09-08 16:12:46 -0700202 if (StartsWith(path, OS_PATH_SEPARATOR)) {
Yabin Cui1b9b1c12018-10-29 14:23:48 -0700203 return symfs_dir_ + path;
204 }
205 return symfs_dir_ + OS_PATH_SEPARATOR + path;
206 };
207 if (OS_PATH_SEPARATOR == '/') {
208 return add_symfs_prefix(path);
209 }
210 // Paths in recorded perf.data uses '/' as path separator. When reporting on Windows, it needs
211 // to be converted to '\\'.
212 auto tuple = SplitUrlInApk(path);
213 if (std::get<0>(tuple)) {
214 std::string apk_path = std::get<1>(tuple);
215 std::string entry_path = std::get<2>(tuple);
216 std::replace(apk_path.begin(), apk_path.end(), '/', OS_PATH_SEPARATOR);
217 return GetUrlInApk(add_symfs_prefix(apk_path), entry_path);
218 }
219 std::string elf_path = path;
220 std::replace(elf_path.begin(), elf_path.end(), '/', OS_PATH_SEPARATOR);
221 return add_symfs_prefix(elf_path);
222}
Yabin Cui0bf695b2024-08-22 15:41:29 -0700223
224std::optional<std::string> DebugElfFileFinder::SearchFileMapByPath(const std::string& path) {
225 std::string filename;
226 if (size_t pos = path.rfind('/'); pos != std::string::npos) {
227 filename = path.substr(pos + 1);
228 } else {
229 filename = path;
230 }
231 std::string best_elf_file;
232 size_t best_match_length = 0;
Yabin Cuiab9cb232024-09-05 14:45:54 -0700233 auto check_file = [&](const std::string& elf_file) {
Yabin Cui0bf695b2024-08-22 15:41:29 -0700234 if (EndsWith(elf_file, filename)) {
235 size_t i = elf_file.size();
236 size_t j = path.size();
237 while (i > 0 && j > 0 && elf_file[i - 1] == path[j - 1]) {
238 i--;
239 j--;
240 }
241 size_t match_length = elf_file.size() - i;
242 if (match_length > best_match_length) {
243 best_elf_file = elf_file;
244 best_match_length = match_length;
245 }
246 }
Yabin Cuiab9cb232024-09-05 14:45:54 -0700247 };
248
249 for (const auto& p : build_id_to_file_map_) {
250 check_file(p.second);
251 }
252 for (const auto& elf_file : no_build_id_files_) {
253 check_file(elf_file);
Yabin Cui0bf695b2024-08-22 15:41:29 -0700254 }
255 if (!best_elf_file.empty()) {
256 LOG(INFO) << "Found " << best_elf_file << " for " << path << " by filename";
257 return best_elf_file;
258 }
259 return std::nullopt;
260}
261
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200262} // namespace simpleperf_dso_impl
Yabin Cui40b70ff2018-04-09 14:06:08 -0700263
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700264static OneTimeFreeAllocator symbol_name_allocator;
265
Martin Stjernholm7c27cc22018-11-28 00:46:00 +0000266Symbol::Symbol(std::string_view name, uint64_t addr, uint64_t len)
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700267 : addr(addr),
268 len(len),
269 name_(symbol_name_allocator.AllocateString(name)),
Yabin Cui767dd172016-06-02 21:02:43 -0700270 demangled_name_(nullptr),
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200271 dump_id_(UINT_MAX) {}
Yabin Cuib10a8fb2015-08-18 16:32:18 -0700272
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700273const char* Symbol::DemangledName() const {
274 if (demangled_name_ == nullptr) {
275 const std::string s = Dso::Demangle(name_);
Yabin Cui40eef9e2021-04-13 13:08:31 -0700276 SetDemangledName(s);
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700277 }
278 return demangled_name_;
Yabin Cuiec12ed92015-06-08 10:38:10 -0700279}
280
Yabin Cui40eef9e2021-04-13 13:08:31 -0700281void Symbol::SetDemangledName(std::string_view name) const {
282 if (name == name_) {
283 demangled_name_ = name_;
284 } else {
285 demangled_name_ = symbol_name_allocator.AllocateString(name);
286 }
287}
288
Yabin Cuifef95142021-08-19 10:51:00 -0700289std::string_view Symbol::FunctionName() const {
Yabin Cui1e16b202021-08-16 13:37:35 -0700290 // Name with signature is like "void ctep.v(cteo, ctgc, ctbn)".
291 std::string_view name = DemangledName();
292 auto brace_pos = name.find('(');
293 if (brace_pos != name.npos) {
294 name = name.substr(0, brace_pos);
295 auto space_pos = name.rfind(' ');
296 if (space_pos != name.npos) {
297 name = name.substr(space_pos + 1);
298 }
299 }
300 return name;
301}
302
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800303static bool CompareSymbolToAddr(const Symbol& s, uint64_t addr) {
304 return s.addr < addr;
305}
306
307static bool CompareAddrToSymbol(uint64_t addr, const Symbol& s) {
308 return addr < s.addr;
309}
310
Yabin Cuic8485602015-08-20 15:04:39 -0700311bool Dso::demangle_ = true;
Yabin Cuic8485602015-08-20 15:04:39 -0700312std::string Dso::vmlinux_;
Yabin Cuib4212972016-05-25 14:08:05 -0700313std::string Dso::kallsyms_;
Yabin Cuic8485602015-08-20 15:04:39 -0700314std::unordered_map<std::string, BuildId> Dso::build_id_map_;
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700315size_t Dso::dso_count_;
Yabin Cui16501ff2016-10-19 15:06:29 -0700316uint32_t Dso::g_dump_id_;
Yabin Cui40b70ff2018-04-09 14:06:08 -0700317simpleperf_dso_impl::DebugElfFileFinder Dso::debug_elf_file_finder_;
Yabin Cuiba50c4b2015-07-21 11:24:48 -0700318
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200319void Dso::SetDemangle(bool demangle) {
320 demangle_ = demangle;
321}
Yabin Cuib3783552015-06-11 11:15:42 -0700322
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200323extern "C" char* __cxa_demangle(const char* mangled_name, char* buf, size_t* n, int* status);
Yabin Cui4d8137f2023-02-14 17:00:25 -0800324#if defined(__linux__) || defined(__darwin__)
325extern "C" char* rustc_demangle(const char* mangled, char* out, size_t* len, int* status);
326#endif
Yabin Cuib10a8fb2015-08-18 16:32:18 -0700327
Yabin Cuic8485602015-08-20 15:04:39 -0700328std::string Dso::Demangle(const std::string& name) {
Yabin Cuib10a8fb2015-08-18 16:32:18 -0700329 if (!demangle_) {
330 return name;
331 }
332 int status;
333 bool is_linker_symbol = (name.find(linker_prefix) == 0);
334 const char* mangled_str = name.c_str();
335 if (is_linker_symbol) {
336 mangled_str += linker_prefix.size();
337 }
Yabin Cui4d8137f2023-02-14 17:00:25 -0800338
339 if (mangled_str[0] == '_') {
340 char* demangled_name = nullptr;
341 int status = -2; // -2 means name didn't demangle.
342 if (mangled_str[1] == 'Z') {
343 demangled_name = __cxa_demangle(mangled_str, nullptr, nullptr, &status);
344#if defined(__linux__) || defined(__darwin__)
345 } else if (mangled_str[1] == 'R') {
346 demangled_name = rustc_demangle(mangled_str, nullptr, nullptr, &status);
347#endif
Yabin Cuib10a8fb2015-08-18 16:32:18 -0700348 }
Yabin Cui4d8137f2023-02-14 17:00:25 -0800349 if (status == 0) {
350 // demangled successfully
351 std::string result;
352 if (is_linker_symbol) {
353 result = std::string("[linker]") + demangled_name;
354 } else {
355 result = demangled_name;
356 }
357 free(demangled_name);
358 return result;
359 }
Yabin Cuib10a8fb2015-08-18 16:32:18 -0700360 }
Yabin Cui4d8137f2023-02-14 17:00:25 -0800361
362 // failed to demangle
363 if (is_linker_symbol) {
364 return std::string("[linker]") + mangled_str;
365 }
366 return name;
Yabin Cuib10a8fb2015-08-18 16:32:18 -0700367}
368
Yabin Cuic8485602015-08-20 15:04:39 -0700369bool Dso::SetSymFsDir(const std::string& symfs_dir) {
Yabin Cui40b70ff2018-04-09 14:06:08 -0700370 return debug_elf_file_finder_.SetSymFsDir(symfs_dir);
Yabin Cuic8485602015-08-20 15:04:39 -0700371}
372
Yabin Cui3939b9d2018-07-20 17:12:13 -0700373bool Dso::AddSymbolDir(const std::string& symbol_dir) {
374 return debug_elf_file_finder_.AddSymbolDir(symbol_dir);
375}
376
Yabin Cui0bf695b2024-08-22 15:41:29 -0700377void Dso::AllowMismatchedBuildId() {
378 return debug_elf_file_finder_.AllowMismatchedBuildId();
379}
380
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200381void Dso::SetVmlinux(const std::string& vmlinux) {
382 vmlinux_ = vmlinux;
383}
Yabin Cuic8485602015-08-20 15:04:39 -0700384
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200385void Dso::SetBuildIds(const std::vector<std::pair<std::string, BuildId>>& build_ids) {
Yabin Cuic8485602015-08-20 15:04:39 -0700386 std::unordered_map<std::string, BuildId> map;
387 for (auto& pair : build_ids) {
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200388 LOG(DEBUG) << "build_id_map: " << pair.first << ", " << pair.second.ToString();
Yabin Cuic8485602015-08-20 15:04:39 -0700389 map.insert(pair);
390 }
391 build_id_map_ = std::move(map);
392}
393
Yabin Cuic68e66d2018-03-07 15:47:15 -0800394void Dso::SetVdsoFile(const std::string& vdso_file, bool is_64bit) {
Yabin Cui40b70ff2018-04-09 14:06:08 -0700395 debug_elf_file_finder_.SetVdsoFile(vdso_file, is_64bit);
Yabin Cui63a1c3d2017-05-19 12:57:44 -0700396}
397
Yabin Cui52c63692016-11-28 17:28:08 -0800398BuildId Dso::FindExpectedBuildIdForPath(const std::string& path) {
399 auto it = build_id_map_.find(path);
Yabin Cuic8485602015-08-20 15:04:39 -0700400 if (it != build_id_map_.end()) {
401 return it->second;
402 }
403 return BuildId();
404}
405
Yabin Cui11424c42022-03-10 16:04:04 -0800406BuildId Dso::GetExpectedBuildId() const {
Yabin Cui52c63692016-11-28 17:28:08 -0800407 return FindExpectedBuildIdForPath(path_);
408}
409
Yabin Cui11424c42022-03-10 16:04:04 -0800410Dso::Dso(DsoType type, const std::string& path)
Yabin Cui767dd172016-06-02 21:02:43 -0700411 : type_(type),
Yabin Cui767dd172016-06-02 21:02:43 -0700412 path_(path),
Yabin Cui767dd172016-06-02 21:02:43 -0700413 is_loaded_(false),
Yabin Cui16501ff2016-10-19 15:06:29 -0700414 dump_id_(UINT_MAX),
Yabin Cuie466d4d2017-08-11 17:03:07 -0700415 symbol_dump_id_(0),
416 symbol_warning_loglevel_(android::base::WARNING) {
Yabin Cui15475e62016-07-14 13:26:19 -0700417 size_t pos = path.find_last_of("/\\");
418 if (pos != std::string::npos) {
419 file_name_ = path.substr(pos + 1);
420 } else {
421 file_name_ = path;
422 }
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700423 dso_count_++;
Yabin Cuic8485602015-08-20 15:04:39 -0700424}
425
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700426Dso::~Dso() {
427 if (--dso_count_ == 0) {
Yabin Cuib4212972016-05-25 14:08:05 -0700428 // Clean up global variables when no longer used.
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700429 symbol_name_allocator.Clear();
Yabin Cuib4212972016-05-25 14:08:05 -0700430 demangle_ = true;
Yabin Cuib4212972016-05-25 14:08:05 -0700431 vmlinux_.clear();
432 kallsyms_.clear();
433 build_id_map_.clear();
Yabin Cui16501ff2016-10-19 15:06:29 -0700434 g_dump_id_ = 0;
Yabin Cui40b70ff2018-04-09 14:06:08 -0700435 debug_elf_file_finder_.Reset();
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700436 }
437}
438
Yabin Cui16501ff2016-10-19 15:06:29 -0700439uint32_t Dso::CreateDumpId() {
440 CHECK(!HasDumpId());
441 return dump_id_ = g_dump_id_++;
442}
443
444uint32_t Dso::CreateSymbolDumpId(const Symbol* symbol) {
445 CHECK(!symbol->HasDumpId());
446 symbol->dump_id_ = symbol_dump_id_++;
447 return symbol->dump_id_;
448}
449
Yabin Cui7078c672020-11-10 16:24:12 -0800450std::optional<uint64_t> Dso::IpToFileOffset(uint64_t ip, uint64_t map_start, uint64_t map_pgoff) {
451 return ip - map_start + map_pgoff;
452}
453
Yabin Cui547c60e2015-10-12 16:56:05 -0700454const Symbol* Dso::FindSymbol(uint64_t vaddr_in_dso) {
Yabin Cuic8485602015-08-20 15:04:39 -0700455 if (!is_loaded_) {
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800456 LoadSymbols();
Yabin Cuic5b4a312016-10-24 13:38:38 -0700457 }
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800458 auto it = std::upper_bound(symbols_.begin(), symbols_.end(), vaddr_in_dso, CompareAddrToSymbol);
Yabin Cui516a87c2018-03-26 17:34:00 -0700459 if (it != symbols_.begin()) {
460 --it;
461 if (it->addr <= vaddr_in_dso && (it->addr + it->len > vaddr_in_dso)) {
462 return &*it;
Yabin Cuic8485602015-08-20 15:04:39 -0700463 }
464 }
Yabin Cuic5b4a312016-10-24 13:38:38 -0700465 if (!unknown_symbols_.empty()) {
466 auto it = unknown_symbols_.find(vaddr_in_dso);
467 if (it != unknown_symbols_.end()) {
468 return &it->second;
Yabin Cuic8485602015-08-20 15:04:39 -0700469 }
470 }
471 return nullptr;
472}
473
Yabin Cuic5b4a312016-10-24 13:38:38 -0700474void Dso::SetSymbols(std::vector<Symbol>* symbols) {
475 symbols_ = std::move(*symbols);
476 symbols->clear();
477}
478
479void Dso::AddUnknownSymbol(uint64_t vaddr_in_dso, const std::string& name) {
480 unknown_symbols_.insert(std::make_pair(vaddr_in_dso, Symbol(name, vaddr_in_dso, 1)));
481}
482
Yabin Cuiac4b2492020-12-09 16:27:57 -0800483bool Dso::IsForJavaMethod() const {
Yabin Cui10bbd842018-08-13 17:42:25 -0700484 if (type_ == DSO_DEX_FILE) {
485 return true;
486 }
487 if (type_ == DSO_ELF_FILE) {
Yabin Cui9ba4d942020-09-08 16:12:46 -0700488 if (JITDebugReader::IsPathInJITSymFile(path_)) {
Yabin Cuie32ed2b2020-07-23 15:30:14 -0700489 return true;
490 }
Yabin Cui9ba4d942020-09-08 16:12:46 -0700491 // JITDebugReader in old versions generates symfiles in 'TemporaryFile-XXXXXX'.
492 size_t pos = path_.rfind('/');
493 pos = (pos == std::string::npos) ? 0 : pos + 1;
494 return StartsWith(std::string_view(&path_[pos], path_.size() - pos), "TemporaryFile");
Yabin Cui10bbd842018-08-13 17:42:25 -0700495 }
496 return false;
497}
498
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800499void Dso::LoadSymbols() {
500 if (!is_loaded_) {
501 is_loaded_ = true;
502 std::vector<Symbol> symbols = LoadSymbolsImpl();
503 if (symbols_.empty()) {
504 symbols_ = std::move(symbols);
505 } else {
506 std::vector<Symbol> merged_symbols;
507 std::set_union(symbols_.begin(), symbols_.end(), symbols.begin(), symbols.end(),
508 std::back_inserter(merged_symbols), Symbol::CompareValueByAddr);
509 symbols_ = std::move(merged_symbols);
510 }
Yabin Cuic8485602015-08-20 15:04:39 -0700511 }
Yabin Cuiba50c4b2015-07-21 11:24:48 -0700512}
513
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200514static void ReportReadElfSymbolResult(
515 ElfStatus result, const std::string& path, const std::string& debug_file_path,
Yabin Cui516a87c2018-03-26 17:34:00 -0700516 android::base::LogSeverity warning_loglevel = android::base::WARNING) {
Yabin Cuidec43c12016-07-29 16:40:40 -0700517 if (result == ElfStatus::NO_ERROR) {
Yabin Cui516a87c2018-03-26 17:34:00 -0700518 LOG(VERBOSE) << "Read symbols from " << debug_file_path << " successfully";
Yabin Cuidec43c12016-07-29 16:40:40 -0700519 } else if (result == ElfStatus::NO_SYMBOL_TABLE) {
Yabin Cui516a87c2018-03-26 17:34:00 -0700520 if (path == "[vdso]") {
Yabin Cui63a1c3d2017-05-19 12:57:44 -0700521 // Vdso only contains dynamic symbol table, and we can't change that.
Yabin Cui516a87c2018-03-26 17:34:00 -0700522 return;
Yabin Cui63a1c3d2017-05-19 12:57:44 -0700523 }
Yabin Cuidec43c12016-07-29 16:40:40 -0700524 // Lacking symbol table isn't considered as an error but worth reporting.
Yabin Cui516a87c2018-03-26 17:34:00 -0700525 LOG(warning_loglevel) << debug_file_path << " doesn't contain symbol table";
Yabin Cuidec43c12016-07-29 16:40:40 -0700526 } else {
Yabin Cui516a87c2018-03-26 17:34:00 -0700527 LOG(warning_loglevel) << "failed to read symbols from " << debug_file_path << ": " << result;
Yabin Cuidec43c12016-07-29 16:40:40 -0700528 }
529}
530
Yabin Cui516a87c2018-03-26 17:34:00 -0700531static void SortAndFixSymbols(std::vector<Symbol>& symbols) {
532 std::sort(symbols.begin(), symbols.end(), Symbol::CompareValueByAddr);
Yabin Cuic8485602015-08-20 15:04:39 -0700533 Symbol* prev_symbol = nullptr;
Yabin Cui516a87c2018-03-26 17:34:00 -0700534 for (auto& symbol : symbols) {
Yabin Cuic8485602015-08-20 15:04:39 -0700535 if (prev_symbol != nullptr && prev_symbol->len == 0) {
Yabin Cuicc2e59e2015-08-21 14:23:43 -0700536 prev_symbol->len = symbol.addr - prev_symbol->addr;
Yabin Cuic8485602015-08-20 15:04:39 -0700537 }
Yabin Cui3d4aa262017-11-01 15:58:55 -0700538 prev_symbol = &symbol;
Yabin Cui638c5582015-07-01 16:16:57 -0700539 }
Yabin Cui516a87c2018-03-26 17:34:00 -0700540}
541
Yabin Cuidd401b32018-04-11 11:17:06 -0700542class DexFileDso : public Dso {
543 public:
Yabin Cui11424c42022-03-10 16:04:04 -0800544 DexFileDso(const std::string& path) : Dso(DSO_DEX_FILE, path) {}
Yabin Cuidd401b32018-04-11 11:17:06 -0700545
546 void AddDexFileOffset(uint64_t dex_file_offset) override {
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200547 auto it = std::lower_bound(dex_file_offsets_.begin(), dex_file_offsets_.end(), dex_file_offset);
Yabin Cuic8571d42018-06-06 11:20:39 -0700548 if (it != dex_file_offsets_.end() && *it == dex_file_offset) {
549 return;
550 }
551 dex_file_offsets_.insert(it, dex_file_offset);
Yabin Cuidd401b32018-04-11 11:17:06 -0700552 }
553
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200554 const std::vector<uint64_t>* DexFileOffsets() override { return &dex_file_offsets_; }
Yabin Cuidd401b32018-04-11 11:17:06 -0700555
Yabin Cuidb2c4932019-02-07 15:06:42 -0800556 uint64_t IpToVaddrInFile(uint64_t ip, uint64_t map_start, uint64_t map_pgoff) override {
557 return ip - map_start + map_pgoff;
558 }
559
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800560 std::vector<Symbol> LoadSymbolsImpl() override {
Yabin Cuidd401b32018-04-11 11:17:06 -0700561 std::vector<Symbol> symbols;
Yabin Cui8b8ed0f2023-10-24 16:18:38 -0700562 if (StartsWith(path_, kDexFileInMemoryPrefix)) {
563 // For dex file in memory, the symbols should already be set via SetSymbols().
564 return symbols;
565 }
566
Yabin Cui11424c42022-03-10 16:04:04 -0800567 const std::string& debug_file_path = GetDebugFilePath();
568 auto tuple = SplitUrlInApk(debug_file_path);
Yabin Cui83b0e122021-11-03 14:10:10 -0700569 // Symbols of dex files are collected on device. If the dex file doesn't exist, probably
570 // we are reporting on host, and there is no need to report warning of missing dex files.
Yabin Cui11424c42022-03-10 16:04:04 -0800571 if (!IsRegularFile(std::get<0>(tuple) ? std::get<1>(tuple) : debug_file_path)) {
572 LOG(DEBUG) << "skip reading symbols from non-exist dex_file " << debug_file_path;
Yabin Cui83b0e122021-11-03 14:10:10 -0700573 return symbols;
574 }
Yabin Cui2a53ff32018-05-21 17:37:00 -0700575 bool status = false;
David Srbecky6a296b62021-04-15 20:52:22 +0100576 auto symbol_callback = [&](DexFileSymbol* symbol) {
577 symbols.emplace_back(symbol->name, symbol->addr, symbol->size);
Yabin Cui710f3722021-03-23 17:45:39 -0700578 };
Yabin Cui2a53ff32018-05-21 17:37:00 -0700579 if (std::get<0>(tuple)) {
580 std::unique_ptr<ArchiveHelper> ahelper = ArchiveHelper::CreateInstance(std::get<1>(tuple));
581 ZipEntry entry;
582 std::vector<uint8_t> data;
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200583 if (ahelper && ahelper->FindEntry(std::get<2>(tuple), &entry) &&
584 ahelper->GetEntryData(entry, &data)) {
Yabin Cui11424c42022-03-10 16:04:04 -0800585 status = ReadSymbolsFromDexFileInMemory(data.data(), data.size(), debug_file_path,
Yabin Cui17769f22021-07-13 16:39:16 -0700586 dex_file_offsets_, symbol_callback);
Yabin Cui2a53ff32018-05-21 17:37:00 -0700587 }
588 } else {
Yabin Cui11424c42022-03-10 16:04:04 -0800589 status = ReadSymbolsFromDexFile(debug_file_path, dex_file_offsets_, symbol_callback);
Yabin Cui2a53ff32018-05-21 17:37:00 -0700590 }
591 if (!status) {
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +0200592 android::base::LogSeverity level =
593 symbols_.empty() ? android::base::WARNING : android::base::DEBUG;
Yabin Cui11424c42022-03-10 16:04:04 -0800594 LOG(level) << "Failed to read symbols from dex_file " << debug_file_path;
Yabin Cuidd401b32018-04-11 11:17:06 -0700595 return symbols;
596 }
Yabin Cui11424c42022-03-10 16:04:04 -0800597 LOG(VERBOSE) << "Read symbols from dex_file " << debug_file_path << " successfully";
Yabin Cuidd401b32018-04-11 11:17:06 -0700598 SortAndFixSymbols(symbols);
599 return symbols;
600 }
601
602 private:
603 std::vector<uint64_t> dex_file_offsets_;
604};
605
Yabin Cui516a87c2018-03-26 17:34:00 -0700606class ElfDso : public Dso {
607 public:
Yabin Cui11424c42022-03-10 16:04:04 -0800608 ElfDso(const std::string& path, bool force_64bit)
609 : Dso(DSO_ELF_FILE, path), force_64bit_(force_64bit) {}
Yabin Cui516a87c2018-03-26 17:34:00 -0700610
Yabin Cuie32ed2b2020-07-23 15:30:14 -0700611 std::string_view GetReportPath() const override {
Yabin Cui9ba4d942020-09-08 16:12:46 -0700612 if (JITDebugReader::IsPathInJITSymFile(path_)) {
613 if (path_.find(kJITAppCacheFile) != path_.npos) {
Yabin Cui075dd182020-08-05 19:51:36 +0000614 return "[JIT app cache]";
615 }
Yabin Cui9ba4d942020-09-08 16:12:46 -0700616 return "[JIT zygote cache]";
Yabin Cuie32ed2b2020-07-23 15:30:14 -0700617 }
618 return path_;
619 }
620
Yabin Cuidb2c4932019-02-07 15:06:42 -0800621 void SetMinExecutableVaddr(uint64_t min_vaddr, uint64_t file_offset) override {
622 min_vaddr_ = min_vaddr;
623 file_offset_of_min_vaddr_ = file_offset;
Yabin Cuic8485602015-08-20 15:04:39 -0700624 }
Yabin Cui516a87c2018-03-26 17:34:00 -0700625
Yabin Cuidb2c4932019-02-07 15:06:42 -0800626 void GetMinExecutableVaddr(uint64_t* min_vaddr, uint64_t* file_offset) override {
627 if (type_ == DSO_DEX_FILE) {
628 return dex_file_dso_->GetMinExecutableVaddr(min_vaddr, file_offset);
629 }
630 if (min_vaddr_ == uninitialized_value) {
631 min_vaddr_ = 0;
632 BuildId build_id = GetExpectedBuildId();
Yabin Cui90c3b302020-07-01 10:09:16 -0700633
634 ElfStatus status;
Yabin Cui11424c42022-03-10 16:04:04 -0800635 auto elf = ElfFile::Open(GetDebugFilePath(), &build_id, &status);
Yabin Cui90c3b302020-07-01 10:09:16 -0700636 if (elf) {
637 min_vaddr_ = elf->ReadMinExecutableVaddr(&file_offset_of_min_vaddr_);
Yabin Cuidb2c4932019-02-07 15:06:42 -0800638 } else {
Yabin Cuif376bf02023-04-18 13:22:49 -0700639 // This is likely to be a file wrongly thought of as an ELF file, due to stack unwinding.
640 // No need to report it by default.
641 LOG(DEBUG) << "failed to read min virtual address of " << GetDebugFilePath() << ": "
642 << status;
Yabin Cuidb2c4932019-02-07 15:06:42 -0800643 }
644 }
645 *min_vaddr = min_vaddr_;
646 *file_offset = file_offset_of_min_vaddr_;
647 }
648
649 uint64_t IpToVaddrInFile(uint64_t ip, uint64_t map_start, uint64_t map_pgoff) override {
650 if (type_ == DSO_DEX_FILE) {
651 return dex_file_dso_->IpToVaddrInFile(ip, map_start, map_pgoff);
652 }
653 uint64_t min_vaddr;
654 uint64_t file_offset_of_min_vaddr;
655 GetMinExecutableVaddr(&min_vaddr, &file_offset_of_min_vaddr);
656 if (file_offset_of_min_vaddr == uninitialized_value) {
657 return ip - map_start + min_vaddr;
658 }
659 // Apps may make part of the executable segment of a shared library writeable, which can
660 // generate multiple executable segments at runtime. So use map_pgoff to calculate
661 // vaddr_in_file.
662 return ip - map_start + map_pgoff - file_offset_of_min_vaddr + min_vaddr;
Yabin Cui516a87c2018-03-26 17:34:00 -0700663 }
664
Yabin Cuidd401b32018-04-11 11:17:06 -0700665 void AddDexFileOffset(uint64_t dex_file_offset) override {
666 if (type_ == DSO_ELF_FILE) {
667 // When simpleperf does unwinding while recording, it processes mmap records before reading
668 // dex file linked list (via JITDebugReader). To process mmap records, it creates Dso
669 // objects of type ELF_FILE. Then after reading dex file linked list, it realizes some
670 // ELF_FILE Dso objects should actually be DEX_FILE, because they have dex file offsets.
671 // So here converts ELF_FILE Dso into DEX_FILE Dso.
672 type_ = DSO_DEX_FILE;
Yabin Cui11424c42022-03-10 16:04:04 -0800673 dex_file_dso_.reset(new DexFileDso(path_));
Yabin Cuidd401b32018-04-11 11:17:06 -0700674 }
675 dex_file_dso_->AddDexFileOffset(dex_file_offset);
676 }
677
678 const std::vector<uint64_t>* DexFileOffsets() override {
679 return dex_file_dso_ ? dex_file_dso_->DexFileOffsets() : nullptr;
680 }
681
Yabin Cui516a87c2018-03-26 17:34:00 -0700682 protected:
Yabin Cui11424c42022-03-10 16:04:04 -0800683 std::string FindDebugFilePath() const override {
684 BuildId build_id = GetExpectedBuildId();
685 return debug_elf_file_finder_.FindDebugFile(path_, force_64bit_, build_id);
686 }
687
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800688 std::vector<Symbol> LoadSymbolsImpl() override {
Yabin Cuidd401b32018-04-11 11:17:06 -0700689 if (dex_file_dso_) {
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800690 return dex_file_dso_->LoadSymbolsImpl();
Yabin Cuidd401b32018-04-11 11:17:06 -0700691 }
Yabin Cui516a87c2018-03-26 17:34:00 -0700692 std::vector<Symbol> symbols;
693 BuildId build_id = GetExpectedBuildId();
694 auto symbol_callback = [&](const ElfFileSymbol& symbol) {
695 if (symbol.is_func || (symbol.is_label && symbol.is_in_text_section)) {
696 symbols.emplace_back(symbol.name, symbol.vaddr, symbol.len);
697 }
698 };
699 ElfStatus status;
Yabin Cui11424c42022-03-10 16:04:04 -0800700 auto elf = ElfFile::Open(GetDebugFilePath(), &build_id, &status);
Yabin Cui01947032020-06-30 14:36:46 -0700701 if (elf) {
702 status = elf->ParseSymbols(symbol_callback);
Yabin Cui516a87c2018-03-26 17:34:00 -0700703 }
Yabin Cui2315ff62022-11-14 11:52:18 -0800704 android::base::LogSeverity log_level = android::base::WARNING;
Yabin Cuif376bf02023-04-18 13:22:49 -0700705 if (!symbols_.empty() || !symbols.empty()) {
Yabin Cui2315ff62022-11-14 11:52:18 -0800706 // We already have some symbols when recording.
707 log_level = android::base::DEBUG;
708 }
709 if ((status == ElfStatus::FILE_NOT_FOUND || status == ElfStatus::FILE_MALFORMED) &&
710 build_id.IsEmpty()) {
Yabin Cuif376bf02023-04-18 13:22:49 -0700711 // This is likely to be a file wrongly thought of as an ELF file, due to stack unwinding.
Yabin Cui2315ff62022-11-14 11:52:18 -0800712 log_level = android::base::DEBUG;
713 }
714 ReportReadElfSymbolResult(status, path_, GetDebugFilePath(), log_level);
Yabin Cui516a87c2018-03-26 17:34:00 -0700715 SortAndFixSymbols(symbols);
716 return symbols;
717 }
718
719 private:
Yabin Cuidb2c4932019-02-07 15:06:42 -0800720 static constexpr uint64_t uninitialized_value = std::numeric_limits<uint64_t>::max();
721
Yabin Cui11424c42022-03-10 16:04:04 -0800722 bool force_64bit_;
Yabin Cuidb2c4932019-02-07 15:06:42 -0800723 uint64_t min_vaddr_ = uninitialized_value;
724 uint64_t file_offset_of_min_vaddr_ = uninitialized_value;
Yabin Cuidd401b32018-04-11 11:17:06 -0700725 std::unique_ptr<DexFileDso> dex_file_dso_;
Yabin Cui516a87c2018-03-26 17:34:00 -0700726};
727
728class KernelDso : public Dso {
729 public:
Yabin Cuic5184712023-10-13 14:10:17 -0700730 KernelDso(const std::string& path) : Dso(DSO_KERNEL, path) {}
Yabin Cui516a87c2018-03-26 17:34:00 -0700731
Yabin Cui7078c672020-11-10 16:24:12 -0800732 // IpToVaddrInFile() and LoadSymbols() must be consistent in fixing addresses changed by kernel
733 // address space layout randomization.
734 uint64_t IpToVaddrInFile(uint64_t ip, uint64_t map_start, uint64_t) override {
735 if (map_start != 0 && GetKernelStartAddr() != 0) {
736 // Fix kernel addresses changed by kernel address randomization.
737 fix_kernel_address_randomization_ = true;
738 return ip - map_start + GetKernelStartAddr();
739 }
740 return ip;
741 }
742
743 std::optional<uint64_t> IpToFileOffset(uint64_t ip, uint64_t map_start, uint64_t) override {
744 if (map_start != 0 && GetKernelStartOffset() != 0) {
745 return ip - map_start + GetKernelStartOffset();
746 }
747 return std::nullopt;
748 }
Yabin Cuidb2c4932019-02-07 15:06:42 -0800749
Yabin Cui516a87c2018-03-26 17:34:00 -0700750 protected:
Yabin Cui11424c42022-03-10 16:04:04 -0800751 std::string FindDebugFilePath() const override {
752 BuildId build_id = GetExpectedBuildId();
Yabin Cuic5184712023-10-13 14:10:17 -0700753 if (!vmlinux_.empty()) {
754 // Use vmlinux as the kernel debug file.
755 ElfStatus status;
756 if (ElfFile::Open(vmlinux_, &build_id, &status)) {
757 return vmlinux_;
758 }
759 }
Yabin Cui11424c42022-03-10 16:04:04 -0800760 return debug_elf_file_finder_.FindDebugFile(path_, false, build_id);
761 }
762
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800763 std::vector<Symbol> LoadSymbolsImpl() override {
Yabin Cui516a87c2018-03-26 17:34:00 -0700764 std::vector<Symbol> symbols;
Yabin Cuic7aed042022-09-09 15:54:45 -0700765 ReadSymbolsFromDebugFile(&symbols);
ThiƩbaud Weksteene7e750e2020-11-19 15:07:46 +0100766
Yabin Cui7078c672020-11-10 16:24:12 -0800767 if (symbols.empty() && !kallsyms_.empty()) {
768 ReadSymbolsFromKallsyms(kallsyms_, &symbols);
769 }
Yabin Cui36b57d92020-12-17 17:06:27 -0800770#if defined(__linux__)
Yabin Cui7078c672020-11-10 16:24:12 -0800771 if (symbols.empty()) {
772 ReadSymbolsFromProc(&symbols);
773 }
ThiƩbaud Weksteene7e750e2020-11-19 15:07:46 +0100774#endif // defined(__linux__)
Yabin Cui7078c672020-11-10 16:24:12 -0800775 SortAndFixSymbols(symbols);
Yabin Cuic5184712023-10-13 14:10:17 -0700776 if (!symbols.empty() && symbols.back().len == 0) {
Yabin Cui7078c672020-11-10 16:24:12 -0800777 symbols.back().len = std::numeric_limits<uint64_t>::max() - symbols.back().addr;
778 }
779 return symbols;
780 }
781
782 private:
783 void ReadSymbolsFromDebugFile(std::vector<Symbol>* symbols) {
Yabin Cuic7aed042022-09-09 15:54:45 -0700784 ElfStatus status;
785 auto elf = ElfFile::Open(GetDebugFilePath(), &status);
786 if (!elf) {
787 return;
788 }
789
Yabin Cui7078c672020-11-10 16:24:12 -0800790 if (!fix_kernel_address_randomization_) {
791 LOG(WARNING) << "Don't know how to fix addresses changed by kernel address randomization. So "
792 "symbols in "
Yabin Cui11424c42022-03-10 16:04:04 -0800793 << GetDebugFilePath() << " are not used";
Yabin Cui7078c672020-11-10 16:24:12 -0800794 return;
795 }
796 // symbols_ are kernel symbols got from /proc/kallsyms while recording. Those symbols are
797 // not fixed for kernel address randomization. So clear them to avoid mixing them with
798 // symbols in debug_file_path.
799 symbols_.clear();
800
801 auto symbol_callback = [&](const ElfFileSymbol& symbol) {
802 if (symbol.is_func) {
803 symbols->emplace_back(symbol.name, symbol.vaddr, symbol.len);
Yabin Cui01947032020-06-30 14:36:46 -0700804 }
Yabin Cui7078c672020-11-10 16:24:12 -0800805 };
Yabin Cuic7aed042022-09-09 15:54:45 -0700806 status = elf->ParseSymbols(symbol_callback);
Yabin Cui11424c42022-03-10 16:04:04 -0800807 ReportReadElfSymbolResult(status, path_, GetDebugFilePath());
Yabin Cui7078c672020-11-10 16:24:12 -0800808 }
809
810 void ReadSymbolsFromKallsyms(std::string& kallsyms, std::vector<Symbol>* symbols) {
811 auto symbol_callback = [&](const KernelSymbol& symbol) {
812 if (strchr("TtWw", symbol.type) && symbol.addr != 0u) {
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800813 if (symbol.module == nullptr) {
814 symbols->emplace_back(symbol.name, symbol.addr, 0);
815 } else {
816 std::string name = std::string(symbol.name) + " [" + symbol.module + "]";
817 symbols->emplace_back(name, symbol.addr, 0);
818 }
Yabin Cui7078c672020-11-10 16:24:12 -0800819 }
820 return false;
821 };
822 ProcessKernelSymbols(kallsyms, symbol_callback);
823 if (symbols->empty()) {
824 LOG(WARNING) << "Symbol addresses in /proc/kallsyms on device are all zero. "
825 "`echo 0 >/proc/sys/kernel/kptr_restrict` if possible.";
826 }
827 }
828
Yabin Cui36b57d92020-12-17 17:06:27 -0800829#if defined(__linux__)
Yabin Cui7078c672020-11-10 16:24:12 -0800830 void ReadSymbolsFromProc(std::vector<Symbol>* symbols) {
831 BuildId build_id = GetExpectedBuildId();
ThiƩbaud Weksteene7e750e2020-11-19 15:07:46 +0100832 if (!build_id.IsEmpty()) {
Yabin Cui516a87c2018-03-26 17:34:00 -0700833 // Try /proc/kallsyms only when asked to do so, or when build id matches.
834 // Otherwise, it is likely to use /proc/kallsyms on host for perf.data recorded on device.
835 bool can_read_kallsyms = true;
836 if (!build_id.IsEmpty()) {
837 BuildId real_build_id;
838 if (!GetKernelBuildId(&real_build_id) || build_id != real_build_id) {
839 LOG(DEBUG) << "failed to read symbols from /proc/kallsyms: Build id mismatch";
840 can_read_kallsyms = false;
841 }
842 }
843 if (can_read_kallsyms) {
844 std::string kallsyms;
ThiƩbaud Weksteene7e750e2020-11-19 15:07:46 +0100845 if (LoadKernelSymbols(&kallsyms)) {
Yabin Cui7078c672020-11-10 16:24:12 -0800846 ReadSymbolsFromKallsyms(kallsyms, symbols);
Yabin Cui516a87c2018-03-26 17:34:00 -0700847 }
848 }
849 }
Yabin Cui516a87c2018-03-26 17:34:00 -0700850 }
ThiƩbaud Weksteene7e750e2020-11-19 15:07:46 +0100851#endif // defined(__linux__)
Yabin Cui516a87c2018-03-26 17:34:00 -0700852
Yabin Cui7078c672020-11-10 16:24:12 -0800853 uint64_t GetKernelStartAddr() {
854 if (!kernel_start_addr_) {
855 ParseKernelStartAddr();
Yabin Cui516a87c2018-03-26 17:34:00 -0700856 }
Yabin Cui7078c672020-11-10 16:24:12 -0800857 return kernel_start_addr_.value();
Yabin Cui516a87c2018-03-26 17:34:00 -0700858 }
Yabin Cui7078c672020-11-10 16:24:12 -0800859
860 uint64_t GetKernelStartOffset() {
861 if (!kernel_start_file_offset_) {
862 ParseKernelStartAddr();
863 }
864 return kernel_start_file_offset_.value();
865 }
866
867 void ParseKernelStartAddr() {
868 kernel_start_addr_ = 0;
869 kernel_start_file_offset_ = 0;
Yabin Cuic7aed042022-09-09 15:54:45 -0700870 ElfStatus status;
871 if (auto elf = ElfFile::Open(GetDebugFilePath(), &status); elf) {
872 for (const auto& section : elf->GetSectionHeader()) {
873 if (section.name == ".text") {
874 kernel_start_addr_ = section.vaddr;
875 kernel_start_file_offset_ = section.file_offset;
876 break;
Yabin Cui7078c672020-11-10 16:24:12 -0800877 }
878 }
879 }
880 }
881
Yabin Cui7078c672020-11-10 16:24:12 -0800882 bool fix_kernel_address_randomization_ = false;
883 std::optional<uint64_t> kernel_start_addr_;
884 std::optional<uint64_t> kernel_start_file_offset_;
Yabin Cui516a87c2018-03-26 17:34:00 -0700885};
886
887class KernelModuleDso : public Dso {
888 public:
Yabin Cui11424c42022-03-10 16:04:04 -0800889 KernelModuleDso(const std::string& path, uint64_t memory_start, uint64_t memory_end,
890 Dso* kernel_dso)
891 : Dso(DSO_KERNEL_MODULE, path),
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800892 memory_start_(memory_start),
893 memory_end_(memory_end),
894 kernel_dso_(kernel_dso) {}
895
896 void SetMinExecutableVaddr(uint64_t min_vaddr, uint64_t memory_offset) override {
897 min_vaddr_ = min_vaddr;
898 memory_offset_of_min_vaddr_ = memory_offset;
899 }
900
901 void GetMinExecutableVaddr(uint64_t* min_vaddr, uint64_t* memory_offset) override {
902 if (!min_vaddr_) {
903 CalculateMinVaddr();
904 }
905 *min_vaddr = min_vaddr_.value();
906 *memory_offset = memory_offset_of_min_vaddr_.value();
907 }
Yabin Cui516a87c2018-03-26 17:34:00 -0700908
Yabin Cuidb2c4932019-02-07 15:06:42 -0800909 uint64_t IpToVaddrInFile(uint64_t ip, uint64_t map_start, uint64_t) override {
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800910 uint64_t min_vaddr;
911 uint64_t memory_offset;
912 GetMinExecutableVaddr(&min_vaddr, &memory_offset);
913 return ip - map_start - memory_offset + min_vaddr;
Yabin Cuidb2c4932019-02-07 15:06:42 -0800914 }
915
Yabin Cui516a87c2018-03-26 17:34:00 -0700916 protected:
Yabin Cui11424c42022-03-10 16:04:04 -0800917 std::string FindDebugFilePath() const override {
918 BuildId build_id = GetExpectedBuildId();
919 return debug_elf_file_finder_.FindDebugFile(path_, false, build_id);
920 }
921
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800922 std::vector<Symbol> LoadSymbolsImpl() override {
Yabin Cui516a87c2018-03-26 17:34:00 -0700923 std::vector<Symbol> symbols;
924 BuildId build_id = GetExpectedBuildId();
925 auto symbol_callback = [&](const ElfFileSymbol& symbol) {
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800926 // We only know how to map ip addrs to symbols in text section.
927 if (symbol.is_in_text_section && (symbol.is_label || symbol.is_func)) {
Yabin Cui516a87c2018-03-26 17:34:00 -0700928 symbols.emplace_back(symbol.name, symbol.vaddr, symbol.len);
929 }
930 };
Yabin Cui01947032020-06-30 14:36:46 -0700931 ElfStatus status;
Yabin Cui11424c42022-03-10 16:04:04 -0800932 auto elf = ElfFile::Open(GetDebugFilePath(), &build_id, &status);
Yabin Cui01947032020-06-30 14:36:46 -0700933 if (elf) {
934 status = elf->ParseSymbols(symbol_callback);
935 }
Yabin Cui2c928d62024-04-03 13:46:08 -0700936 // Don't warn when a kernel module is missing. As a backup, we read symbols from /proc/kallsyms.
937 ReportReadElfSymbolResult(status, path_, GetDebugFilePath(), android::base::DEBUG);
Yabin Cui516a87c2018-03-26 17:34:00 -0700938 SortAndFixSymbols(symbols);
939 return symbols;
940 }
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800941
942 private:
943 void CalculateMinVaddr() {
944 min_vaddr_ = 0;
945 memory_offset_of_min_vaddr_ = 0;
946
947 // min_vaddr and memory_offset are used to convert an ip addr of a kernel module to its
948 // vaddr_in_file, as shown in IpToVaddrInFile(). When the kernel loads a kernel module, it
949 // puts ALLOC sections (like .plt, .text.ftrace_trampoline, .text) in memory in order. The
950 // text section may not be at the start of the module memory. To do address conversion, we
951 // need to know its relative position in the module memory. There are two ways:
952 // 1. Read the kernel module file to calculate the relative position of .text section. It
953 // is relatively complex and depends on both PLT entries and the kernel version.
Yabin Cui4d8137f2023-02-14 17:00:25 -0800954 // 2. Find a module symbol in .text section, get its address in memory from /proc/kallsyms,
955 // and its vaddr_in_file from the kernel module file. Then other symbols in .text section can
956 // be mapped in the same way. Below we use the second method.
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800957
Yabin Cui2c928d62024-04-03 13:46:08 -0700958 if (!IsRegularFile(GetDebugFilePath())) {
959 return;
960 }
961
Yabin Cuif3da1ed2020-11-25 15:37:38 -0800962 // 1. Select a module symbol in /proc/kallsyms.
963 kernel_dso_->LoadSymbols();
964 const auto& kernel_symbols = kernel_dso_->GetSymbols();
965 auto it = std::lower_bound(kernel_symbols.begin(), kernel_symbols.end(), memory_start_,
966 CompareSymbolToAddr);
967 const Symbol* kernel_symbol = nullptr;
968 while (it != kernel_symbols.end() && it->addr < memory_end_) {
969 if (strlen(it->Name()) > 0 && it->Name()[0] != '$') {
970 kernel_symbol = &*it;
971 break;
972 }
973 ++it;
974 }
975 if (kernel_symbol == nullptr) {
976 return;
977 }
978
979 // 2. Find the symbol in .ko file.
980 std::string symbol_name = kernel_symbol->Name();
981 if (auto pos = symbol_name.rfind(' '); pos != std::string::npos) {
982 symbol_name.resize(pos);
983 }
984 LoadSymbols();
985 for (const auto& symbol : symbols_) {
986 if (symbol_name == symbol.Name()) {
987 min_vaddr_ = symbol.addr;
988 memory_offset_of_min_vaddr_ = kernel_symbol->addr - memory_start_;
989 return;
990 }
991 }
992 }
993
994 uint64_t memory_start_;
995 uint64_t memory_end_;
996 Dso* kernel_dso_;
997 std::optional<uint64_t> min_vaddr_;
998 std::optional<uint64_t> memory_offset_of_min_vaddr_;
Yabin Cui516a87c2018-03-26 17:34:00 -0700999};
1000
Evgeny Eltsin91dbae02020-08-27 15:46:09 +02001001class SymbolMapFileDso : public Dso {
1002 public:
Yabin Cui11424c42022-03-10 16:04:04 -08001003 SymbolMapFileDso(const std::string& path) : Dso(DSO_SYMBOL_MAP_FILE, path) {}
Evgeny Eltsin91dbae02020-08-27 15:46:09 +02001004
1005 uint64_t IpToVaddrInFile(uint64_t ip, uint64_t, uint64_t) override { return ip; }
1006
1007 protected:
Yabin Cuif3da1ed2020-11-25 15:37:38 -08001008 std::vector<Symbol> LoadSymbolsImpl() override { return {}; }
Evgeny Eltsin91dbae02020-08-27 15:46:09 +02001009};
1010
Yabin Cuic36ea8b2018-04-16 18:21:40 -07001011class UnknownDso : public Dso {
1012 public:
Yabin Cui11424c42022-03-10 16:04:04 -08001013 UnknownDso(const std::string& path) : Dso(DSO_UNKNOWN_FILE, path) {}
Yabin Cuic36ea8b2018-04-16 18:21:40 -07001014
ThiƩbaud Weksteen4848ee02020-10-23 16:06:59 +02001015 uint64_t IpToVaddrInFile(uint64_t ip, uint64_t, uint64_t) override { return ip; }
Yabin Cuidb2c4932019-02-07 15:06:42 -08001016
Yabin Cuic36ea8b2018-04-16 18:21:40 -07001017 protected:
Yabin Cuif3da1ed2020-11-25 15:37:38 -08001018 std::vector<Symbol> LoadSymbolsImpl() override { return std::vector<Symbol>(); }
Yabin Cuic36ea8b2018-04-16 18:21:40 -07001019};
1020
Yabin Cui516a87c2018-03-26 17:34:00 -07001021std::unique_ptr<Dso> Dso::CreateDso(DsoType dso_type, const std::string& dso_path,
1022 bool force_64bit) {
Yabin Cui516a87c2018-03-26 17:34:00 -07001023 switch (dso_type) {
Yabin Cui7078c672020-11-10 16:24:12 -08001024 case DSO_ELF_FILE:
Yabin Cui11424c42022-03-10 16:04:04 -08001025 return std::unique_ptr<Dso>(new ElfDso(dso_path, force_64bit));
Yabin Cui516a87c2018-03-26 17:34:00 -07001026 case DSO_KERNEL:
Yabin Cui11424c42022-03-10 16:04:04 -08001027 return std::unique_ptr<Dso>(new KernelDso(dso_path));
Yabin Cui516a87c2018-03-26 17:34:00 -07001028 case DSO_DEX_FILE:
Yabin Cui11424c42022-03-10 16:04:04 -08001029 return std::unique_ptr<Dso>(new DexFileDso(dso_path));
Evgeny Eltsin91dbae02020-08-27 15:46:09 +02001030 case DSO_SYMBOL_MAP_FILE:
1031 return std::unique_ptr<Dso>(new SymbolMapFileDso(dso_path));
Yabin Cuic36ea8b2018-04-16 18:21:40 -07001032 case DSO_UNKNOWN_FILE:
1033 return std::unique_ptr<Dso>(new UnknownDso(dso_path));
Yabin Cui516a87c2018-03-26 17:34:00 -07001034 default:
Yabin Cui90a547e2022-12-07 16:29:13 -08001035 LOG(ERROR) << "Unexpected dso_type " << static_cast<int>(dso_type);
1036 return nullptr;
Yabin Cui516a87c2018-03-26 17:34:00 -07001037 }
Yabin Cui516a87c2018-03-26 17:34:00 -07001038}
1039
Yabin Cui16f41ff2021-03-23 14:58:25 -07001040std::unique_ptr<Dso> Dso::CreateDsoWithBuildId(DsoType dso_type, const std::string& dso_path,
1041 BuildId& build_id) {
Yabin Cui11424c42022-03-10 16:04:04 -08001042 std::unique_ptr<Dso> dso;
Yabin Cui16f41ff2021-03-23 14:58:25 -07001043 switch (dso_type) {
1044 case DSO_ELF_FILE:
Yabin Cui11424c42022-03-10 16:04:04 -08001045 dso.reset(new ElfDso(dso_path, false));
1046 break;
Yabin Cui16f41ff2021-03-23 14:58:25 -07001047 case DSO_KERNEL:
Yabin Cui11424c42022-03-10 16:04:04 -08001048 dso.reset(new KernelDso(dso_path));
1049 break;
Yabin Cui16f41ff2021-03-23 14:58:25 -07001050 case DSO_KERNEL_MODULE:
Yabin Cui11424c42022-03-10 16:04:04 -08001051 dso.reset(new KernelModuleDso(dso_path, 0, 0, nullptr));
1052 break;
Yabin Cui16f41ff2021-03-23 14:58:25 -07001053 default:
Yabin Cui90a547e2022-12-07 16:29:13 -08001054 LOG(ERROR) << "Unexpected dso_type " << static_cast<int>(dso_type);
Yabin Cui11424c42022-03-10 16:04:04 -08001055 return nullptr;
Yabin Cui16f41ff2021-03-23 14:58:25 -07001056 }
Yabin Cui11424c42022-03-10 16:04:04 -08001057 dso->debug_file_path_ = debug_elf_file_finder_.FindDebugFile(dso_path, false, build_id);
1058 return dso;
Yabin Cui4ad10fb2020-04-01 15:45:48 -07001059}
1060
Yabin Cuif3da1ed2020-11-25 15:37:38 -08001061std::unique_ptr<Dso> Dso::CreateKernelModuleDso(const std::string& dso_path, uint64_t memory_start,
1062 uint64_t memory_end, Dso* kernel_dso) {
Yabin Cui11424c42022-03-10 16:04:04 -08001063 return std::unique_ptr<Dso>(new KernelModuleDso(dso_path, memory_start, memory_end, kernel_dso));
Yabin Cuif3da1ed2020-11-25 15:37:38 -08001064}
1065
Yabin Cui767dd172016-06-02 21:02:43 -07001066const char* DsoTypeToString(DsoType dso_type) {
1067 switch (dso_type) {
1068 case DSO_KERNEL:
1069 return "dso_kernel";
1070 case DSO_KERNEL_MODULE:
1071 return "dso_kernel_module";
1072 case DSO_ELF_FILE:
1073 return "dso_elf_file";
Yabin Cui516a87c2018-03-26 17:34:00 -07001074 case DSO_DEX_FILE:
1075 return "dso_dex_file";
Evgeny Eltsin91dbae02020-08-27 15:46:09 +02001076 case DSO_SYMBOL_MAP_FILE:
1077 return "dso_symbol_map_file";
Yabin Cui767dd172016-06-02 21:02:43 -07001078 default:
1079 return "unknown";
1080 }
1081}
Yabin Cui40b70ff2018-04-09 14:06:08 -07001082
1083bool GetBuildIdFromDsoPath(const std::string& dso_path, BuildId* build_id) {
Yabin Cui3a880452020-06-29 16:37:31 -07001084 ElfStatus status;
1085 auto elf = ElfFile::Open(dso_path, &status);
1086 if (status == ElfStatus::NO_ERROR && elf->GetBuildId(build_id) == ElfStatus::NO_ERROR) {
1087 return true;
Yabin Cui40b70ff2018-04-09 14:06:08 -07001088 }
Yabin Cui3a880452020-06-29 16:37:31 -07001089 return false;
Yabin Cui40b70ff2018-04-09 14:06:08 -07001090}
Yabin Cuifaa7b922021-01-11 17:35:57 -08001091
Yabin Cui290e9c42023-05-01 15:09:30 -07001092bool GetBuildId(const Dso& dso, BuildId& build_id) {
1093 if (dso.type() == DSO_KERNEL) {
1094 if (GetKernelBuildId(&build_id)) {
1095 return true;
1096 }
1097 } else if (dso.type() == DSO_KERNEL_MODULE) {
1098 bool has_build_id = false;
1099 if (android::base::EndsWith(dso.Path(), ".ko")) {
1100 return GetBuildIdFromDsoPath(dso.Path(), &build_id);
1101 }
1102 if (const std::string& path = dso.Path();
1103 path.size() > 2 && path[0] == '[' && path.back() == ']') {
1104 // For kernel modules that we can't find the corresponding file, read build id from /sysfs.
1105 return GetModuleBuildId(path.substr(1, path.size() - 2), &build_id);
1106 }
1107 } else if (dso.type() == DSO_ELF_FILE) {
1108 if (dso.Path() == DEFAULT_EXECNAME_FOR_THREAD_MMAP || dso.IsForJavaMethod()) {
1109 return false;
1110 }
1111 if (GetBuildIdFromDsoPath(dso.Path(), &build_id)) {
1112 return true;
1113 }
1114 }
1115 return false;
1116}
1117
Yabin Cuifaa7b922021-01-11 17:35:57 -08001118} // namespace simpleperf