Reader.cpp 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352
  1. /*
  2. * Copyright (c) 2020, Itamar S. <itamar8910@gmail.com>
  3. * Copyright (c) 2022, the SerenityOS developers.
  4. *
  5. * SPDX-License-Identifier: BSD-2-Clause
  6. */
  7. #include <AK/ByteReader.h>
  8. #include <AK/HashTable.h>
  9. #include <AK/JsonObject.h>
  10. #include <AK/JsonValue.h>
  11. #include <AK/LexicalPath.h>
  12. #include <LibCompress/Gzip.h>
  13. #include <LibCore/File.h>
  14. #include <LibCoredump/Reader.h>
  15. #include <signal_numbers.h>
  16. #include <string.h>
  17. #include <unistd.h>
  18. namespace Coredump {
  19. OwnPtr<Reader> Reader::create(StringView path)
  20. {
  21. auto file_or_error = Core::MappedFile::map(path);
  22. if (file_or_error.is_error())
  23. return {};
  24. if (!Compress::GzipDecompressor::is_likely_compressed(file_or_error.value()->bytes())) {
  25. // It's an uncompressed coredump.
  26. return AK::adopt_own_if_nonnull(new (nothrow) Reader(file_or_error.release_value()));
  27. }
  28. auto decompressed_data = decompress_coredump(file_or_error.value()->bytes());
  29. if (!decompressed_data.has_value())
  30. return {};
  31. return adopt_own_if_nonnull(new (nothrow) Reader(decompressed_data.release_value()));
  32. }
  33. Reader::Reader(ByteBuffer buffer)
  34. : Reader(buffer.bytes())
  35. {
  36. m_coredump_buffer = move(buffer);
  37. }
  38. Reader::Reader(NonnullRefPtr<Core::MappedFile> file)
  39. : Reader(file->bytes())
  40. {
  41. m_mapped_file = move(file);
  42. }
  43. Reader::Reader(ReadonlyBytes coredump_bytes)
  44. : m_coredump_bytes(coredump_bytes)
  45. , m_coredump_image(m_coredump_bytes)
  46. {
  47. size_t index = 0;
  48. m_coredump_image.for_each_program_header([this, &index](auto pheader) {
  49. if (pheader.type() == PT_NOTE) {
  50. m_notes_segment_index = index;
  51. return IterationDecision::Break;
  52. }
  53. ++index;
  54. return IterationDecision::Continue;
  55. });
  56. VERIFY(m_notes_segment_index != -1);
  57. }
  58. Optional<ByteBuffer> Reader::decompress_coredump(ReadonlyBytes raw_coredump)
  59. {
  60. auto decompressed_coredump = Compress::GzipDecompressor::decompress_all(raw_coredump);
  61. if (decompressed_coredump.has_value())
  62. return decompressed_coredump;
  63. // If we didn't manage to decompress it, try and parse it as decompressed coredump
  64. auto bytebuffer = ByteBuffer::copy(raw_coredump);
  65. if (bytebuffer.is_error())
  66. return {};
  67. return bytebuffer.release_value();
  68. }
  69. Reader::NotesEntryIterator::NotesEntryIterator(const u8* notes_data)
  70. : m_current(bit_cast<const ELF::Core::NotesEntry*>(notes_data))
  71. , start(notes_data)
  72. {
  73. }
  74. ELF::Core::NotesEntryHeader::Type Reader::NotesEntryIterator::type() const
  75. {
  76. VERIFY(m_current->header.type == ELF::Core::NotesEntryHeader::Type::ProcessInfo
  77. || m_current->header.type == ELF::Core::NotesEntryHeader::Type::MemoryRegionInfo
  78. || m_current->header.type == ELF::Core::NotesEntryHeader::Type::ThreadInfo
  79. || m_current->header.type == ELF::Core::NotesEntryHeader::Type::Metadata
  80. || m_current->header.type == ELF::Core::NotesEntryHeader::Type::Null);
  81. return m_current->header.type;
  82. }
  83. const ELF::Core::NotesEntry* Reader::NotesEntryIterator::current() const
  84. {
  85. return m_current;
  86. }
  87. void Reader::NotesEntryIterator::next()
  88. {
  89. VERIFY(!at_end());
  90. switch (type()) {
  91. case ELF::Core::NotesEntryHeader::Type::ProcessInfo: {
  92. const auto* current = bit_cast<const ELF::Core::ProcessInfo*>(m_current);
  93. m_current = bit_cast<const ELF::Core::NotesEntry*>(current->json_data + strlen(current->json_data) + 1);
  94. break;
  95. }
  96. case ELF::Core::NotesEntryHeader::Type::ThreadInfo: {
  97. const auto* current = bit_cast<const ELF::Core::ThreadInfo*>(m_current);
  98. m_current = bit_cast<const ELF::Core::NotesEntry*>(current + 1);
  99. break;
  100. }
  101. case ELF::Core::NotesEntryHeader::Type::MemoryRegionInfo: {
  102. const auto* current = bit_cast<const ELF::Core::MemoryRegionInfo*>(m_current);
  103. m_current = bit_cast<const ELF::Core::NotesEntry*>(current->region_name + strlen(current->region_name) + 1);
  104. break;
  105. }
  106. case ELF::Core::NotesEntryHeader::Type::Metadata: {
  107. const auto* current = bit_cast<const ELF::Core::Metadata*>(m_current);
  108. m_current = bit_cast<const ELF::Core::NotesEntry*>(current->json_data + strlen(current->json_data) + 1);
  109. break;
  110. }
  111. default:
  112. VERIFY_NOT_REACHED();
  113. }
  114. }
  115. bool Reader::NotesEntryIterator::at_end() const
  116. {
  117. return type() == ELF::Core::NotesEntryHeader::Type::Null;
  118. }
  119. Optional<FlatPtr> Reader::peek_memory(FlatPtr address) const
  120. {
  121. auto region = region_containing(address);
  122. if (!region.has_value())
  123. return {};
  124. FlatPtr offset_in_region = address - region->region_start;
  125. auto* region_data = bit_cast<const u8*>(image().program_header(region->program_header_index).raw_data());
  126. FlatPtr value { 0 };
  127. ByteReader::load(region_data + offset_in_region, value);
  128. return value;
  129. }
  130. const JsonObject Reader::process_info() const
  131. {
  132. const ELF::Core::ProcessInfo* process_info_notes_entry = nullptr;
  133. NotesEntryIterator it(bit_cast<const u8*>(m_coredump_image.program_header(m_notes_segment_index).raw_data()));
  134. for (; !it.at_end(); it.next()) {
  135. if (it.type() != ELF::Core::NotesEntryHeader::Type::ProcessInfo)
  136. continue;
  137. process_info_notes_entry = bit_cast<const ELF::Core::ProcessInfo*>(it.current());
  138. break;
  139. }
  140. if (!process_info_notes_entry)
  141. return {};
  142. auto process_info_json_value = JsonValue::from_string(process_info_notes_entry->json_data);
  143. if (process_info_json_value.is_error())
  144. return {};
  145. if (!process_info_json_value.value().is_object())
  146. return {};
  147. return process_info_json_value.value().as_object();
  148. // FIXME: Maybe just cache this on the Reader instance after first access.
  149. }
  150. Optional<MemoryRegionInfo> Reader::first_region_for_object(StringView object_name) const
  151. {
  152. Optional<MemoryRegionInfo> ret;
  153. for_each_memory_region_info([&ret, &object_name](auto& region_info) {
  154. if (region_info.object_name() == object_name) {
  155. ret = region_info;
  156. return IterationDecision::Break;
  157. }
  158. return IterationDecision::Continue;
  159. });
  160. return ret;
  161. }
  162. Optional<MemoryRegionInfo> Reader::region_containing(FlatPtr address) const
  163. {
  164. Optional<MemoryRegionInfo> ret;
  165. for_each_memory_region_info([&ret, address](const auto& region_info) {
  166. if (region_info.region_start <= address && region_info.region_end >= address) {
  167. ret = region_info;
  168. return IterationDecision::Break;
  169. }
  170. return IterationDecision::Continue;
  171. });
  172. return ret;
  173. }
  174. int Reader::process_pid() const
  175. {
  176. auto process_info = this->process_info();
  177. auto pid = process_info.get("pid");
  178. return pid.to_number<int>();
  179. }
  180. u8 Reader::process_termination_signal() const
  181. {
  182. auto process_info = this->process_info();
  183. auto termination_signal = process_info.get("termination_signal");
  184. auto signal_number = termination_signal.to_number<u8>();
  185. if (signal_number <= SIGINVAL || signal_number >= NSIG)
  186. return SIGINVAL;
  187. return signal_number;
  188. }
  189. String Reader::process_executable_path() const
  190. {
  191. auto process_info = this->process_info();
  192. auto executable_path = process_info.get("executable_path");
  193. return executable_path.as_string_or({});
  194. }
  195. Vector<String> Reader::process_arguments() const
  196. {
  197. auto process_info = this->process_info();
  198. auto arguments = process_info.get("arguments");
  199. if (!arguments.is_array())
  200. return {};
  201. Vector<String> vector;
  202. arguments.as_array().for_each([&](auto& value) {
  203. if (value.is_string())
  204. vector.append(value.as_string());
  205. });
  206. return vector;
  207. }
  208. Vector<String> Reader::process_environment() const
  209. {
  210. auto process_info = this->process_info();
  211. auto environment = process_info.get("environment");
  212. if (!environment.is_array())
  213. return {};
  214. Vector<String> vector;
  215. environment.as_array().for_each([&](auto& value) {
  216. if (value.is_string())
  217. vector.append(value.as_string());
  218. });
  219. return vector;
  220. }
  221. HashMap<String, String> Reader::metadata() const
  222. {
  223. const ELF::Core::Metadata* metadata_notes_entry = nullptr;
  224. NotesEntryIterator it(bit_cast<const u8*>(m_coredump_image.program_header(m_notes_segment_index).raw_data()));
  225. for (; !it.at_end(); it.next()) {
  226. if (it.type() != ELF::Core::NotesEntryHeader::Type::Metadata)
  227. continue;
  228. metadata_notes_entry = bit_cast<const ELF::Core::Metadata*>(it.current());
  229. break;
  230. }
  231. if (!metadata_notes_entry)
  232. return {};
  233. auto metadata_json_value = JsonValue::from_string(metadata_notes_entry->json_data);
  234. if (metadata_json_value.is_error())
  235. return {};
  236. if (!metadata_json_value.value().is_object())
  237. return {};
  238. HashMap<String, String> metadata;
  239. metadata_json_value.value().as_object().for_each_member([&](auto& key, auto& value) {
  240. metadata.set(key, value.as_string_or({}));
  241. });
  242. return metadata;
  243. }
  244. const Reader::LibraryData* Reader::library_containing(FlatPtr address) const
  245. {
  246. static HashMap<String, OwnPtr<LibraryData>> cached_libs;
  247. auto region = region_containing(address);
  248. if (!region.has_value())
  249. return {};
  250. auto name = region->object_name();
  251. String path = resolve_object_path(name);
  252. if (!cached_libs.contains(path)) {
  253. auto file_or_error = Core::MappedFile::map(path);
  254. if (file_or_error.is_error())
  255. return {};
  256. auto image = ELF::Image(file_or_error.value()->bytes());
  257. cached_libs.set(path, make<LibraryData>(name, static_cast<FlatPtr>(region->region_start), file_or_error.release_value(), move(image)));
  258. }
  259. auto lib_data = cached_libs.get(path).value();
  260. return lib_data;
  261. }
  262. String Reader::resolve_object_path(StringView name) const
  263. {
  264. // TODO: There are other places where similar method is implemented or would be useful.
  265. // (e.g. UserspaceEmulator, LibSymbolication, Profiler, and DynamicLinker itself)
  266. // We should consider creating unified implementation in the future.
  267. if (name.starts_with('/') || !Core::File::looks_like_shared_library(name)) {
  268. return name;
  269. }
  270. Vector<String> library_search_directories;
  271. // If LD_LIBRARY_PATH is present, check its folders first
  272. for (auto& environment_variable : process_environment()) {
  273. auto prefix = "LD_LIBRARY_PATH="sv;
  274. if (environment_variable.starts_with(prefix)) {
  275. auto ld_library_path = environment_variable.substring_view(prefix.length());
  276. // FIXME: This code won't handle folders with ":" in the name correctly.
  277. for (auto directory : ld_library_path.split_view(':')) {
  278. library_search_directories.append(directory);
  279. }
  280. }
  281. }
  282. // Add default paths that DynamicLinker uses
  283. library_search_directories.append("/usr/lib/"sv);
  284. library_search_directories.append("/usr/local/lib/"sv);
  285. // Search for the first readable library file
  286. for (auto& directory : library_search_directories) {
  287. auto full_path = LexicalPath::join(directory, name).string();
  288. if (access(full_path.characters(), R_OK) != 0)
  289. continue;
  290. return full_path;
  291. }
  292. return name;
  293. }
  294. void Reader::for_each_library(Function<void(LibraryInfo)> func) const
  295. {
  296. HashTable<String> libraries;
  297. for_each_memory_region_info([&](auto const& region) {
  298. auto name = region.object_name();
  299. if (name.is_null() || libraries.contains(name))
  300. return IterationDecision::Continue;
  301. libraries.set(name);
  302. String path = resolve_object_path(name);
  303. func(LibraryInfo { name, path, static_cast<FlatPtr>(region.region_start) });
  304. return IterationDecision::Continue;
  305. });
  306. }
  307. }