DebugInfo.cpp 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457
  1. /*
  2. * Copyright (c) 2020-2021, Itamar S. <itamar8910@gmail.com>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include "DebugInfo.h"
  7. #include <AK/Debug.h>
  8. #include <AK/LexicalPath.h>
  9. #include <AK/MemoryStream.h>
  10. #include <AK/QuickSort.h>
  11. #include <LibDebug/Dwarf/CompilationUnit.h>
  12. #include <LibDebug/Dwarf/DwarfInfo.h>
  13. #include <LibDebug/Dwarf/Expression.h>
  14. namespace Debug {
  15. DebugInfo::DebugInfo(ELF::Image const& elf, String source_root, FlatPtr base_address)
  16. : m_elf(elf)
  17. , m_source_root(move(source_root))
  18. , m_base_address(base_address)
  19. , m_dwarf_info(m_elf)
  20. {
  21. prepare_variable_scopes();
  22. prepare_lines();
  23. }
  24. void DebugInfo::prepare_variable_scopes()
  25. {
  26. m_dwarf_info.for_each_compilation_unit([&](Dwarf::CompilationUnit const& unit) {
  27. auto root = unit.root_die();
  28. parse_scopes_impl(root);
  29. });
  30. }
  31. void DebugInfo::parse_scopes_impl(Dwarf::DIE const& die)
  32. {
  33. die.for_each_child([&](Dwarf::DIE const& child) {
  34. if (child.is_null())
  35. return;
  36. if (!(child.tag() == Dwarf::EntryTag::SubProgram || child.tag() == Dwarf::EntryTag::LexicalBlock))
  37. return;
  38. if (child.get_attribute(Dwarf::Attribute::Inline).has_value()) {
  39. dbgln_if(SPAM_DEBUG, "DWARF inlined functions are not supported");
  40. return;
  41. }
  42. if (child.get_attribute(Dwarf::Attribute::Ranges).has_value()) {
  43. dbgln_if(SPAM_DEBUG, "DWARF ranges are not supported");
  44. return;
  45. }
  46. auto name = child.get_attribute(Dwarf::Attribute::Name);
  47. VariablesScope scope {};
  48. scope.is_function = (child.tag() == Dwarf::EntryTag::SubProgram);
  49. if (name.has_value())
  50. scope.name = name.value().data.as_string;
  51. if (!child.get_attribute(Dwarf::Attribute::LowPc).has_value()) {
  52. dbgln_if(SPAM_DEBUG, "DWARF: Couldn't find attribute LowPc for scope");
  53. return;
  54. }
  55. scope.address_low = child.get_attribute(Dwarf::Attribute::LowPc).value().data.as_addr;
  56. // The attribute name HighPc is confusing. In this context, it seems to actually be a positive offset from LowPc
  57. scope.address_high = scope.address_low + child.get_attribute(Dwarf::Attribute::HighPc).value().data.as_addr;
  58. child.for_each_child([&](Dwarf::DIE const& variable_entry) {
  59. if (!(variable_entry.tag() == Dwarf::EntryTag::Variable
  60. || variable_entry.tag() == Dwarf::EntryTag::FormalParameter))
  61. return;
  62. scope.dies_of_variables.append(variable_entry);
  63. });
  64. m_scopes.append(scope);
  65. parse_scopes_impl(child);
  66. });
  67. }
  68. void DebugInfo::prepare_lines()
  69. {
  70. Vector<Dwarf::LineProgram::LineInfo> all_lines;
  71. m_dwarf_info.for_each_compilation_unit([&all_lines](Dwarf::CompilationUnit const& unit) {
  72. all_lines.extend(unit.line_program().lines());
  73. });
  74. HashMap<FlyString, Optional<String>> memoized_full_paths;
  75. auto compute_full_path = [&](FlyString const& file_path) -> Optional<String> {
  76. if (file_path.view().contains("Toolchain/"sv) || file_path.view().contains("libgcc"sv))
  77. return {};
  78. if (file_path.view().starts_with("./"sv) && !m_source_root.is_null())
  79. return LexicalPath::join(m_source_root, file_path).string();
  80. if (auto index_of_serenity_slash = file_path.view().find("serenity/"sv); index_of_serenity_slash.has_value()) {
  81. auto start_index = index_of_serenity_slash.value() + "serenity/"sv.length();
  82. return file_path.view().substring_view(start_index, file_path.length() - start_index);
  83. }
  84. return file_path;
  85. };
  86. m_sorted_lines.ensure_capacity(all_lines.size());
  87. for (auto const& line_info : all_lines) {
  88. auto maybe_full_path = memoized_full_paths.ensure(line_info.file, [&] { return compute_full_path(line_info.file); });
  89. if (!maybe_full_path.has_value())
  90. continue;
  91. m_sorted_lines.unchecked_append({ line_info.address, maybe_full_path.release_value(), line_info.line });
  92. }
  93. quick_sort(m_sorted_lines, [](auto& a, auto& b) {
  94. return a.address < b.address;
  95. });
  96. }
  97. Optional<DebugInfo::SourcePosition> DebugInfo::get_source_position(FlatPtr target_address) const
  98. {
  99. if (m_sorted_lines.is_empty())
  100. return {};
  101. if (target_address < m_sorted_lines[0].address)
  102. return {};
  103. // TODO: We can do a binary search here
  104. for (size_t i = 0; i < m_sorted_lines.size() - 1; ++i) {
  105. if (m_sorted_lines[i + 1].address > target_address) {
  106. return SourcePosition::from_line_info(m_sorted_lines[i]);
  107. }
  108. }
  109. return {};
  110. }
  111. Optional<DebugInfo::SourcePositionAndAddress> DebugInfo::get_address_from_source_position(String const& file, size_t line) const
  112. {
  113. String file_path = file;
  114. if (!file_path.starts_with("/"))
  115. file_path = String::formatted("/{}", file_path);
  116. constexpr char SERENITY_LIBS_PREFIX[] = "/usr/src/serenity";
  117. if (file.starts_with(SERENITY_LIBS_PREFIX)) {
  118. file_path = file.substring(sizeof(SERENITY_LIBS_PREFIX), file.length() - sizeof(SERENITY_LIBS_PREFIX));
  119. file_path = String::formatted("../{}", file_path);
  120. }
  121. Optional<SourcePositionAndAddress> result;
  122. for (const auto& line_entry : m_sorted_lines) {
  123. if (!line_entry.file.ends_with(file_path))
  124. continue;
  125. if (line_entry.line > line)
  126. continue;
  127. // We look for the source position that is closest to the desired position, and is not after it.
  128. // For example, get_address_of_source_position("main.cpp", 73) could return the address for an instruction whose location is ("main.cpp", 72)
  129. // as there might not be an instruction mapped for "main.cpp", 73.
  130. if (!result.has_value() || (line_entry.line > result.value().line)) {
  131. result = SourcePositionAndAddress { line_entry.file, line_entry.line, line_entry.address };
  132. }
  133. }
  134. return result;
  135. }
  136. NonnullOwnPtrVector<DebugInfo::VariableInfo> DebugInfo::get_variables_in_current_scope(const PtraceRegisters& regs) const
  137. {
  138. NonnullOwnPtrVector<DebugInfo::VariableInfo> variables;
  139. // TODO: We can store the scopes in a better data structure
  140. for (const auto& scope : m_scopes) {
  141. FlatPtr ip;
  142. #if ARCH(I386)
  143. ip = regs.eip;
  144. #else
  145. ip = regs.rip;
  146. #endif
  147. if (ip - m_base_address < scope.address_low || ip - m_base_address >= scope.address_high)
  148. continue;
  149. for (const auto& die_entry : scope.dies_of_variables) {
  150. auto variable_info = create_variable_info(die_entry, regs);
  151. if (!variable_info)
  152. continue;
  153. variables.append(variable_info.release_nonnull());
  154. }
  155. }
  156. return variables;
  157. }
  158. static Optional<Dwarf::DIE> parse_variable_type_die(Dwarf::DIE const& variable_die, DebugInfo::VariableInfo& variable_info)
  159. {
  160. auto type_die_offset = variable_die.get_attribute(Dwarf::Attribute::Type);
  161. if (!type_die_offset.has_value())
  162. return {};
  163. VERIFY(type_die_offset.value().type == Dwarf::AttributeValue::Type::DieReference);
  164. auto type_die = variable_die.compilation_unit().get_die_at_offset(type_die_offset.value().data.as_unsigned);
  165. auto type_name = type_die.get_attribute(Dwarf::Attribute::Name);
  166. if (type_name.has_value()) {
  167. variable_info.type_name = type_name.value().data.as_string;
  168. } else {
  169. dbgln("Unnamed DWARF type at offset: {}", type_die.offset());
  170. variable_info.type_name = "[Unnamed Type]";
  171. }
  172. return type_die;
  173. }
  174. static void parse_variable_location(Dwarf::DIE const& variable_die, DebugInfo::VariableInfo& variable_info, PtraceRegisters const& regs)
  175. {
  176. auto location_info = variable_die.get_attribute(Dwarf::Attribute::Location);
  177. if (!location_info.has_value()) {
  178. location_info = variable_die.get_attribute(Dwarf::Attribute::MemberLocation);
  179. }
  180. if (!location_info.has_value())
  181. return;
  182. switch (location_info.value().type) {
  183. case Dwarf::AttributeValue::Type::UnsignedNumber:
  184. variable_info.location_type = DebugInfo::VariableInfo::LocationType::Address;
  185. variable_info.location_data.address = location_info.value().data.as_addr;
  186. break;
  187. case Dwarf::AttributeValue::Type::DwarfExpression: {
  188. auto expression_bytes = ReadonlyBytes { location_info.value().data.as_raw_bytes.bytes, location_info.value().data.as_raw_bytes.length };
  189. auto value = Dwarf::Expression::evaluate(expression_bytes, regs);
  190. if (value.type != Dwarf::Expression::Type::None) {
  191. VERIFY(value.type == Dwarf::Expression::Type::UnsignedInteger);
  192. variable_info.location_type = DebugInfo::VariableInfo::LocationType::Address;
  193. variable_info.location_data.address = value.data.as_addr;
  194. }
  195. break;
  196. }
  197. default:
  198. dbgln("Warning: unhandled Dwarf location type: {}", (int)location_info.value().type);
  199. }
  200. }
  201. OwnPtr<DebugInfo::VariableInfo> DebugInfo::create_variable_info(Dwarf::DIE const& variable_die, PtraceRegisters const& regs, u32 address_offset) const
  202. {
  203. VERIFY(is_variable_tag_supported(variable_die.tag()));
  204. if (variable_die.tag() == Dwarf::EntryTag::FormalParameter
  205. && !variable_die.get_attribute(Dwarf::Attribute::Name).has_value()) {
  206. // We don't want to display info for unused parameters
  207. return {};
  208. }
  209. NonnullOwnPtr<VariableInfo> variable_info = make<VariableInfo>();
  210. auto name_attribute = variable_die.get_attribute(Dwarf::Attribute::Name);
  211. if (name_attribute.has_value())
  212. variable_info->name = name_attribute.value().data.as_string;
  213. auto type_die = parse_variable_type_die(variable_die, *variable_info);
  214. if (variable_die.tag() == Dwarf::EntryTag::Enumerator) {
  215. auto constant = variable_die.get_attribute(Dwarf::Attribute::ConstValue);
  216. VERIFY(constant.has_value());
  217. switch (constant.value().type) {
  218. case Dwarf::AttributeValue::Type::UnsignedNumber:
  219. variable_info->constant_data.as_u32 = constant.value().data.as_unsigned;
  220. break;
  221. case Dwarf::AttributeValue::Type::SignedNumber:
  222. variable_info->constant_data.as_i32 = constant.value().data.as_signed;
  223. break;
  224. case Dwarf::AttributeValue::Type::String:
  225. variable_info->constant_data.as_string = constant.value().data.as_string;
  226. break;
  227. default:
  228. VERIFY_NOT_REACHED();
  229. }
  230. } else {
  231. parse_variable_location(variable_die, *variable_info, regs);
  232. variable_info->location_data.address += address_offset;
  233. }
  234. if (type_die.has_value())
  235. add_type_info_to_variable(type_die.value(), regs, variable_info);
  236. return variable_info;
  237. }
  238. void DebugInfo::add_type_info_to_variable(Dwarf::DIE const& type_die, PtraceRegisters const& regs, DebugInfo::VariableInfo* parent_variable) const
  239. {
  240. OwnPtr<VariableInfo> type_info;
  241. auto is_array_type = type_die.tag() == Dwarf::EntryTag::ArrayType;
  242. if (type_die.tag() == Dwarf::EntryTag::EnumerationType
  243. || type_die.tag() == Dwarf::EntryTag::StructureType
  244. || is_array_type) {
  245. type_info = create_variable_info(type_die, regs);
  246. }
  247. type_die.for_each_child([&](Dwarf::DIE const& member) {
  248. if (member.is_null())
  249. return;
  250. if (is_array_type && member.tag() == Dwarf::EntryTag::SubRangeType) {
  251. auto upper_bound = member.get_attribute(Dwarf::Attribute::UpperBound);
  252. VERIFY(upper_bound.has_value());
  253. auto size = upper_bound.value().data.as_unsigned + 1;
  254. type_info->dimension_sizes.append(size);
  255. return;
  256. }
  257. if (!is_variable_tag_supported(member.tag()))
  258. return;
  259. auto member_variable = create_variable_info(member, regs, parent_variable->location_data.address);
  260. VERIFY(member_variable);
  261. if (type_die.tag() == Dwarf::EntryTag::EnumerationType) {
  262. member_variable->parent = type_info.ptr();
  263. type_info->members.append(member_variable.release_nonnull());
  264. } else {
  265. if (parent_variable->location_type != DebugInfo::VariableInfo::LocationType::Address)
  266. return;
  267. member_variable->parent = parent_variable;
  268. parent_variable->members.append(member_variable.release_nonnull());
  269. }
  270. });
  271. if (type_info) {
  272. if (is_array_type) {
  273. StringBuilder array_type_name;
  274. array_type_name.append(type_info->type_name);
  275. for (auto array_size : type_info->dimension_sizes) {
  276. array_type_name.append("[");
  277. array_type_name.append(String::formatted("{:d}", array_size));
  278. array_type_name.append("]");
  279. }
  280. parent_variable->type_name = array_type_name.to_string();
  281. }
  282. parent_variable->type = move(type_info);
  283. parent_variable->type->type_tag = type_die.tag();
  284. }
  285. }
  286. bool DebugInfo::is_variable_tag_supported(Dwarf::EntryTag const& tag)
  287. {
  288. return tag == Dwarf::EntryTag::Variable
  289. || tag == Dwarf::EntryTag::Member
  290. || tag == Dwarf::EntryTag::FormalParameter
  291. || tag == Dwarf::EntryTag::EnumerationType
  292. || tag == Dwarf::EntryTag::Enumerator
  293. || tag == Dwarf::EntryTag::StructureType
  294. || tag == Dwarf::EntryTag::ArrayType;
  295. }
  296. String DebugInfo::name_of_containing_function(FlatPtr address) const
  297. {
  298. auto function = get_containing_function(address);
  299. if (!function.has_value())
  300. return {};
  301. return function.value().name;
  302. }
  303. Optional<DebugInfo::VariablesScope> DebugInfo::get_containing_function(FlatPtr address) const
  304. {
  305. for (const auto& scope : m_scopes) {
  306. if (!scope.is_function || address < scope.address_low || address >= scope.address_high)
  307. continue;
  308. return scope;
  309. }
  310. return {};
  311. }
  312. Vector<DebugInfo::SourcePosition> DebugInfo::source_lines_in_scope(VariablesScope const& scope) const
  313. {
  314. Vector<DebugInfo::SourcePosition> source_lines;
  315. for (const auto& line : m_sorted_lines) {
  316. if (line.address < scope.address_low)
  317. continue;
  318. if (line.address >= scope.address_high)
  319. break;
  320. source_lines.append(SourcePosition::from_line_info(line));
  321. }
  322. return source_lines;
  323. }
  324. DebugInfo::SourcePosition DebugInfo::SourcePosition::from_line_info(Dwarf::LineProgram::LineInfo const& line)
  325. {
  326. return { line.file, line.line, line.address };
  327. }
  328. DebugInfo::SourcePositionWithInlines DebugInfo::get_source_position_with_inlines(FlatPtr address) const
  329. {
  330. // If the address is in an "inline chain", this is the inner-most inlined position.
  331. auto inner_source_position = get_source_position(address);
  332. auto die = m_dwarf_info.get_die_at_address(address);
  333. if (!die.has_value() || die->tag() == Dwarf::EntryTag::SubroutineType) {
  334. // Inline chain is empty
  335. return SourcePositionWithInlines { inner_source_position, {} };
  336. }
  337. Vector<SourcePosition> inline_chain;
  338. auto insert_to_chain = [&](Dwarf::DIE const& die) {
  339. auto caller_source_path = get_source_path_of_inline(die);
  340. auto caller_line = get_line_of_inline(die);
  341. if (!caller_source_path.has_value() || !caller_line.has_value()) {
  342. return;
  343. }
  344. inline_chain.append({ String::formatted("{}/{}", caller_source_path->directory, caller_source_path->filename), caller_line.value() });
  345. };
  346. while (die->tag() == Dwarf::EntryTag::InlinedSubroutine) {
  347. insert_to_chain(*die);
  348. if (!die->parent_offset().has_value()) {
  349. break;
  350. }
  351. auto parent = die->compilation_unit().dwarf_info().get_cached_die_at_offset(die->parent_offset().value());
  352. if (!parent.has_value()) {
  353. break;
  354. }
  355. die = *parent;
  356. }
  357. return SourcePositionWithInlines { inner_source_position, inline_chain };
  358. }
  359. Optional<Dwarf::LineProgram::DirectoryAndFile> DebugInfo::get_source_path_of_inline(Dwarf::DIE const& die) const
  360. {
  361. auto caller_file = die.get_attribute(Dwarf::Attribute::CallFile);
  362. if (caller_file.has_value()) {
  363. u32 file_index = 0;
  364. if (caller_file->type == Dwarf::AttributeValue::Type::UnsignedNumber) {
  365. file_index = caller_file->data.as_unsigned;
  366. } else if (caller_file->type == Dwarf::AttributeValue::Type::SignedNumber) {
  367. // For some reason, the file_index is sometimes stored as a signed number.
  368. VERIFY(caller_file->data.as_signed >= 0);
  369. file_index = (u32)caller_file->data.as_signed;
  370. } else {
  371. return {};
  372. }
  373. return die.compilation_unit().line_program().get_directory_and_file(file_index);
  374. }
  375. return {};
  376. }
  377. Optional<uint32_t> DebugInfo::get_line_of_inline(Dwarf::DIE const& die) const
  378. {
  379. auto caller_line = die.get_attribute(Dwarf::Attribute::CallLine);
  380. if (!caller_line.has_value())
  381. return {};
  382. if (caller_line->type != Dwarf::AttributeValue::Type::UnsignedNumber)
  383. return {};
  384. return caller_line.value().data.as_unsigned;
  385. }
  386. }