Profile.cpp 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629
  1. /*
  2. * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include "Profile.h"
  7. #include "DisassemblyModel.h"
  8. #include "ProfileModel.h"
  9. #include "SamplesModel.h"
  10. #include "SourceModel.h"
  11. #include <AK/HashTable.h>
  12. #include <AK/LexicalPath.h>
  13. #include <AK/NonnullOwnPtrVector.h>
  14. #include <AK/QuickSort.h>
  15. #include <AK/RefPtr.h>
  16. #include <AK/Try.h>
  17. #include <LibCore/MappedFile.h>
  18. #include <LibELF/Image.h>
  19. #include <LibSymbolication/Symbolication.h>
  20. #include <sys/stat.h>
  21. namespace Profiler {
  22. static void sort_profile_nodes(Vector<NonnullRefPtr<ProfileNode>>& nodes)
  23. {
  24. quick_sort(nodes.begin(), nodes.end(), [](auto& a, auto& b) {
  25. return a->event_count() >= b->event_count();
  26. });
  27. for (auto& child : nodes)
  28. child->sort_children();
  29. }
  30. Profile::Profile(Vector<Process> processes, Vector<Event> events)
  31. : m_processes(move(processes))
  32. , m_events(move(events))
  33. , m_file_event_nodes(FileEventNode::create(""))
  34. {
  35. for (size_t i = 0; i < m_events.size(); ++i) {
  36. if (m_events[i].data.has<Event::SignpostData>())
  37. m_signpost_indices.append(i);
  38. }
  39. m_first_timestamp = m_events.first().timestamp;
  40. m_last_timestamp = m_events.last().timestamp;
  41. m_model = ProfileModel::create(*this);
  42. m_samples_model = SamplesModel::create(*this);
  43. m_signposts_model = SignpostsModel::create(*this);
  44. m_file_event_model = FileEventModel::create(*this);
  45. rebuild_tree();
  46. }
  47. GUI::Model& Profile::model()
  48. {
  49. return *m_model;
  50. }
  51. GUI::Model& Profile::samples_model()
  52. {
  53. return *m_samples_model;
  54. }
  55. GUI::Model& Profile::signposts_model()
  56. {
  57. return *m_signposts_model;
  58. }
  59. void Profile::rebuild_tree()
  60. {
  61. Vector<NonnullRefPtr<ProfileNode>> roots;
  62. auto find_or_create_process_node = [this, &roots](pid_t pid, EventSerialNumber serial) -> ProfileNode& {
  63. auto const* process = find_process(pid, serial);
  64. if (!process) {
  65. dbgln("Profile contains event for unknown process with pid={}, serial={}", pid, serial.to_number());
  66. VERIFY_NOT_REACHED();
  67. }
  68. for (auto root : roots) {
  69. if (&root->process() == process)
  70. return root;
  71. }
  72. auto new_root = ProfileNode::create_process_node(*process);
  73. roots.append(new_root);
  74. return new_root;
  75. };
  76. HashTable<FlatPtr> live_allocations;
  77. for_each_event_in_filter_range([&](Event const& event) {
  78. event.data.visit(
  79. [&](Event::MallocData const& data) {
  80. live_allocations.set(data.ptr);
  81. },
  82. [&](Event::FreeData const& data) {
  83. live_allocations.remove(data.ptr);
  84. },
  85. [&](auto&) {});
  86. });
  87. m_filtered_event_indices.clear();
  88. m_filtered_signpost_indices.clear();
  89. m_file_event_nodes->children().clear();
  90. for (size_t event_index = 0; event_index < m_events.size(); ++event_index) {
  91. auto& event = m_events.at(event_index);
  92. if (has_timestamp_filter_range()) {
  93. auto timestamp = event.timestamp;
  94. if (timestamp < m_timestamp_filter_range_start || timestamp > m_timestamp_filter_range_end)
  95. continue;
  96. }
  97. if (!process_filter_contains(event.pid, event.serial))
  98. continue;
  99. if (event.data.has<Event::SignpostData>()) {
  100. m_filtered_signpost_indices.append(event_index);
  101. continue;
  102. }
  103. m_filtered_event_indices.append(event_index);
  104. if (auto* malloc_data = event.data.get_pointer<Event::MallocData>(); malloc_data && !live_allocations.contains(malloc_data->ptr))
  105. continue;
  106. if (event.data.has<Event::FreeData>())
  107. continue;
  108. auto for_each_frame = [&]<typename Callback>(Callback callback) {
  109. if (!m_inverted) {
  110. for (size_t i = 0; i < event.frames.size(); ++i) {
  111. if (callback(event.frames.at(i), i == event.frames.size() - 1) == IterationDecision::Break)
  112. break;
  113. }
  114. } else {
  115. for (ssize_t i = event.frames.size() - 1; i >= 0; --i) {
  116. if (callback(event.frames.at(i), static_cast<size_t>(i) == event.frames.size() - 1) == IterationDecision::Break)
  117. break;
  118. }
  119. }
  120. };
  121. if (!m_show_top_functions) {
  122. ProfileNode* node = nullptr;
  123. auto& process_node = find_or_create_process_node(event.pid, event.serial);
  124. process_node.increment_event_count();
  125. for_each_frame([&](Frame const& frame, bool is_innermost_frame) {
  126. auto const& object_name = frame.object_name;
  127. auto const& symbol = frame.symbol;
  128. auto const& address = frame.address;
  129. auto const& offset = frame.offset;
  130. if (symbol.is_empty())
  131. return IterationDecision::Break;
  132. // FIXME: More cheating with intentional mixing of TID/PID here:
  133. if (!node)
  134. node = &process_node;
  135. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  136. node->increment_event_count();
  137. if (is_innermost_frame) {
  138. node->add_event_address(address);
  139. node->increment_self_count();
  140. }
  141. return IterationDecision::Continue;
  142. });
  143. } else {
  144. auto& process_node = find_or_create_process_node(event.pid, event.serial);
  145. process_node.increment_event_count();
  146. for (size_t i = 0; i < event.frames.size(); ++i) {
  147. ProfileNode* node = nullptr;
  148. ProfileNode* root = nullptr;
  149. for (size_t j = i; j < event.frames.size(); ++j) {
  150. auto& frame = event.frames.at(j);
  151. auto& object_name = frame.object_name;
  152. auto& symbol = frame.symbol;
  153. auto& address = frame.address;
  154. auto& offset = frame.offset;
  155. if (symbol.is_empty())
  156. break;
  157. // FIXME: More PID/TID mixing cheats here:
  158. if (!node) {
  159. node = &find_or_create_process_node(event.pid, event.serial);
  160. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  161. root = node;
  162. root->will_track_seen_events(m_events.size());
  163. } else {
  164. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  165. }
  166. if (!root->has_seen_event(event_index)) {
  167. root->did_see_event(event_index);
  168. root->increment_event_count();
  169. } else if (node != root) {
  170. node->increment_event_count();
  171. }
  172. if (j == event.frames.size() - 1) {
  173. node->add_event_address(address);
  174. node->increment_self_count();
  175. }
  176. }
  177. }
  178. }
  179. if (event.data.has<Event::ReadData>()) {
  180. auto const& read_event = event.data.get<Event::ReadData>();
  181. auto& event_node = m_file_event_nodes->find_or_create_node(read_event.path);
  182. event_node.for_each_parent_node([&](FileEventNode& node) {
  183. node.increment_count();
  184. // Fixme: Currently events record 'timestamp' and 'start_timestamp' in ms resolution,
  185. // which results in most durations equal to zero. Increasing the resolution should
  186. // make the information more accurate.
  187. auto const duration = event.timestamp - read_event.start_timestamp;
  188. node.add_to_duration(duration);
  189. });
  190. }
  191. }
  192. sort_profile_nodes(roots);
  193. m_roots = move(roots);
  194. m_model->invalidate();
  195. }
  196. Optional<MappedObject> g_kernel_debuginfo_object;
  197. OwnPtr<Debug::DebugInfo> g_kernel_debug_info;
  198. ErrorOr<NonnullOwnPtr<Profile>> Profile::load_from_perfcore_file(StringView path)
  199. {
  200. auto file = TRY(Core::File::open(path, Core::File::OpenMode::Read));
  201. auto json = JsonValue::from_string(TRY(file->read_until_eof()));
  202. if (json.is_error() || !json.value().is_object())
  203. return Error::from_string_literal("Invalid perfcore format (not a JSON object)");
  204. auto const& object = json.value().as_object();
  205. if (!g_kernel_debuginfo_object.has_value()) {
  206. auto debuginfo_file_or_error = Core::MappedFile::map("/boot/Kernel.debug"sv);
  207. if (!debuginfo_file_or_error.is_error()) {
  208. auto debuginfo_file = debuginfo_file_or_error.release_value();
  209. auto debuginfo_image = ELF::Image(debuginfo_file->bytes());
  210. g_kernel_debuginfo_object = { { debuginfo_file, move(debuginfo_image) } };
  211. }
  212. }
  213. auto strings_value = object.get_array("strings"sv);
  214. if (!strings_value.has_value())
  215. return Error::from_string_literal("Malformed profile (strings is not an array)");
  216. auto const& strings = strings_value.value();
  217. HashMap<FlatPtr, DeprecatedString> profile_strings;
  218. for (FlatPtr string_id = 0; string_id < strings.size(); ++string_id) {
  219. auto const& value = strings.at(string_id);
  220. profile_strings.set(string_id, value.to_deprecated_string());
  221. }
  222. auto events_value = object.get_array("events"sv);
  223. if (!events_value.has_value())
  224. return Error::from_string_literal("Malformed profile (events is not an array)");
  225. auto const& perf_events = events_value.value();
  226. Vector<NonnullOwnPtr<Process>> all_processes;
  227. HashMap<pid_t, Process*> current_processes;
  228. Vector<Event> events;
  229. EventSerialNumber next_serial;
  230. for (auto const& perf_event_value : perf_events.values()) {
  231. auto const& perf_event = perf_event_value.as_object();
  232. Event event;
  233. event.serial = next_serial;
  234. next_serial.increment();
  235. event.timestamp = perf_event.get_u64("timestamp"sv).value_or(0);
  236. event.lost_samples = perf_event.get_u32("lost_samples"sv).value_or(0);
  237. event.pid = perf_event.get_i32("pid"sv).value_or(0);
  238. event.tid = perf_event.get_i32("tid"sv).value_or(0);
  239. auto type_string = perf_event.get_deprecated_string("type"sv).value_or({});
  240. if (type_string == "sample"sv) {
  241. event.data = Event::SampleData {};
  242. } else if (type_string == "malloc"sv) {
  243. event.data = Event::MallocData {
  244. .ptr = perf_event.get_addr("ptr"sv).value_or(0),
  245. .size = perf_event.get_integer<size_t>("size"sv).value_or(0),
  246. };
  247. } else if (type_string == "free"sv) {
  248. event.data = Event::FreeData {
  249. .ptr = perf_event.get_addr("ptr"sv).value_or(0),
  250. };
  251. } else if (type_string == "signpost"sv) {
  252. auto string_id = perf_event.get_addr("arg1"sv).value_or(0);
  253. event.data = Event::SignpostData {
  254. .string = profile_strings.get(string_id).value_or(DeprecatedString::formatted("Signpost #{}", string_id)),
  255. .arg = perf_event.get_addr("arg2"sv).value_or(0),
  256. };
  257. } else if (type_string == "mmap"sv) {
  258. auto ptr = perf_event.get_addr("ptr"sv).value_or(0);
  259. auto size = perf_event.get_integer<size_t>("size"sv).value_or(0);
  260. auto name = perf_event.get_deprecated_string("name"sv).value_or({});
  261. event.data = Event::MmapData {
  262. .ptr = ptr,
  263. .size = size,
  264. .name = name,
  265. };
  266. auto it = current_processes.find(event.pid);
  267. if (it != current_processes.end())
  268. it->value->library_metadata.handle_mmap(ptr, size, name);
  269. continue;
  270. } else if (type_string == "munmap"sv) {
  271. event.data = Event::MunmapData {
  272. .ptr = perf_event.get_addr("ptr"sv).value_or(0),
  273. .size = perf_event.get_integer<size_t>("size"sv).value_or(0),
  274. };
  275. continue;
  276. } else if (type_string == "process_create"sv) {
  277. auto parent_pid = perf_event.get_integer<pid_t>("parent_pid"sv).value_or(0);
  278. auto executable = perf_event.get_deprecated_string("executable"sv).value_or({});
  279. event.data = Event::ProcessCreateData {
  280. .parent_pid = parent_pid,
  281. .executable = executable,
  282. };
  283. auto sampled_process = TRY(adopt_nonnull_own_or_enomem(new (nothrow) Process {
  284. .pid = event.pid,
  285. .executable = executable,
  286. .basename = LexicalPath::basename(executable),
  287. .start_valid = event.serial,
  288. .end_valid = {},
  289. }));
  290. current_processes.set(sampled_process->pid, sampled_process);
  291. all_processes.append(move(sampled_process));
  292. continue;
  293. } else if (type_string == "process_exec"sv) {
  294. auto executable = perf_event.get_deprecated_string("executable"sv).value_or({});
  295. event.data = Event::ProcessExecData {
  296. .executable = executable,
  297. };
  298. auto* old_process = current_processes.get(event.pid).value();
  299. old_process->end_valid = event.serial;
  300. current_processes.remove(event.pid);
  301. auto sampled_process = TRY(adopt_nonnull_own_or_enomem(new (nothrow) Process {
  302. .pid = event.pid,
  303. .executable = executable,
  304. .basename = LexicalPath::basename(executable),
  305. .start_valid = event.serial,
  306. .end_valid = {},
  307. }));
  308. current_processes.set(sampled_process->pid, sampled_process);
  309. all_processes.append(move(sampled_process));
  310. continue;
  311. } else if (type_string == "process_exit"sv) {
  312. auto* old_process = current_processes.get(event.pid).value();
  313. old_process->end_valid = event.serial;
  314. current_processes.remove(event.pid);
  315. continue;
  316. } else if (type_string == "thread_create"sv) {
  317. auto parent_tid = perf_event.get_integer<pid_t>("parent_tid"sv).value_or(0);
  318. event.data = Event::ThreadCreateData {
  319. .parent_tid = parent_tid,
  320. };
  321. auto it = current_processes.find(event.pid);
  322. if (it != current_processes.end())
  323. it->value->handle_thread_create(event.tid, event.serial);
  324. continue;
  325. } else if (type_string == "thread_exit"sv) {
  326. auto it = current_processes.find(event.pid);
  327. if (it != current_processes.end())
  328. it->value->handle_thread_exit(event.tid, event.serial);
  329. continue;
  330. } else if (type_string == "read"sv) {
  331. auto const string_index = perf_event.get_addr("filename_index"sv).value_or(0);
  332. event.data = Event::ReadData {
  333. .fd = perf_event.get_integer<int>("fd"sv).value_or(0),
  334. .size = perf_event.get_integer<size_t>("size"sv).value_or(0),
  335. .path = profile_strings.get(string_index).value(),
  336. .start_timestamp = perf_event.get_integer<size_t>("start_timestamp"sv).value_or(0),
  337. .success = perf_event.get_bool("success"sv).value_or(false)
  338. };
  339. } else {
  340. dbgln("Unknown event type '{}'", type_string);
  341. VERIFY_NOT_REACHED();
  342. }
  343. auto maybe_kernel_base = Symbolication::kernel_base();
  344. auto stack = perf_event.get_array("stack"sv);
  345. VERIFY(stack.has_value());
  346. auto const& stack_array = stack.value();
  347. for (ssize_t i = stack_array.values().size() - 1; i >= 0; --i) {
  348. auto const& frame = stack_array.at(i);
  349. auto ptr = frame.to_number<u64>();
  350. u32 offset = 0;
  351. DeprecatedFlyString object_name;
  352. DeprecatedString symbol;
  353. if (maybe_kernel_base.has_value() && ptr >= maybe_kernel_base.value()) {
  354. if (g_kernel_debuginfo_object.has_value()) {
  355. symbol = g_kernel_debuginfo_object->elf.symbolicate(ptr - maybe_kernel_base.value(), &offset);
  356. } else {
  357. symbol = DeprecatedString::formatted("?? <{:p}>", ptr);
  358. }
  359. } else {
  360. auto it = current_processes.find(event.pid);
  361. // FIXME: This logic is kinda gnarly, find a way to clean it up.
  362. LibraryMetadata* library_metadata {};
  363. if (it != current_processes.end())
  364. library_metadata = &it->value->library_metadata;
  365. if (auto const* library = library_metadata ? library_metadata->library_containing(ptr) : nullptr) {
  366. object_name = library->name;
  367. symbol = library->symbolicate(ptr, &offset);
  368. } else {
  369. symbol = DeprecatedString::formatted("?? <{:p}>", ptr);
  370. }
  371. }
  372. event.frames.append({ object_name, symbol, (FlatPtr)ptr, offset });
  373. }
  374. if (event.frames.size() < 2)
  375. continue;
  376. FlatPtr innermost_frame_address = event.frames.at(1).address;
  377. event.in_kernel = maybe_kernel_base.has_value() && innermost_frame_address >= maybe_kernel_base.value();
  378. events.append(move(event));
  379. }
  380. if (events.is_empty())
  381. return Error::from_string_literal("No events captured (targeted process was never on CPU)");
  382. quick_sort(all_processes, [](auto& a, auto& b) {
  383. if (a->pid == b->pid)
  384. return a->start_valid < b->start_valid;
  385. return a->pid < b->pid;
  386. });
  387. Vector<Process> processes;
  388. for (auto& it : all_processes)
  389. processes.append(move(*it));
  390. return adopt_nonnull_own_or_enomem(new (nothrow) Profile(move(processes), move(events)));
  391. }
  392. void ProfileNode::sort_children()
  393. {
  394. sort_profile_nodes(m_children);
  395. }
  396. void Profile::set_timestamp_filter_range(u64 start, u64 end)
  397. {
  398. if (m_has_timestamp_filter_range && m_timestamp_filter_range_start == start && m_timestamp_filter_range_end == end)
  399. return;
  400. m_has_timestamp_filter_range = true;
  401. m_timestamp_filter_range_start = min(start, end);
  402. m_timestamp_filter_range_end = max(start, end);
  403. rebuild_tree();
  404. m_samples_model->invalidate();
  405. m_signposts_model->invalidate();
  406. }
  407. void Profile::clear_timestamp_filter_range()
  408. {
  409. if (!m_has_timestamp_filter_range)
  410. return;
  411. m_has_timestamp_filter_range = false;
  412. rebuild_tree();
  413. m_samples_model->invalidate();
  414. m_signposts_model->invalidate();
  415. }
  416. void Profile::add_process_filter(pid_t pid, EventSerialNumber start_valid, EventSerialNumber end_valid)
  417. {
  418. auto filter = ProcessFilter { pid, start_valid, end_valid };
  419. if (m_process_filters.contains_slow(filter))
  420. return;
  421. m_process_filters.append(move(filter));
  422. rebuild_tree();
  423. if (m_disassembly_model)
  424. m_disassembly_model->invalidate();
  425. m_samples_model->invalidate();
  426. m_signposts_model->invalidate();
  427. }
  428. void Profile::remove_process_filter(pid_t pid, EventSerialNumber start_valid, EventSerialNumber end_valid)
  429. {
  430. auto filter = ProcessFilter { pid, start_valid, end_valid };
  431. if (!m_process_filters.contains_slow(filter))
  432. return;
  433. m_process_filters.remove_first_matching([&filter](ProcessFilter const& other_filter) {
  434. return other_filter == filter;
  435. });
  436. rebuild_tree();
  437. if (m_disassembly_model)
  438. m_disassembly_model->invalidate();
  439. m_samples_model->invalidate();
  440. m_signposts_model->invalidate();
  441. }
  442. void Profile::clear_process_filter()
  443. {
  444. if (m_process_filters.is_empty())
  445. return;
  446. m_process_filters.clear();
  447. rebuild_tree();
  448. if (m_disassembly_model)
  449. m_disassembly_model->invalidate();
  450. m_samples_model->invalidate();
  451. m_signposts_model->invalidate();
  452. }
  453. bool Profile::process_filter_contains(pid_t pid, EventSerialNumber serial)
  454. {
  455. if (!has_process_filter())
  456. return true;
  457. return AK::any_of(m_process_filters,
  458. [&](auto const& process_filter) { return pid == process_filter.pid && serial >= process_filter.start_valid && serial <= process_filter.end_valid; });
  459. }
  460. void Profile::set_inverted(bool inverted)
  461. {
  462. if (m_inverted == inverted)
  463. return;
  464. m_inverted = inverted;
  465. rebuild_tree();
  466. }
  467. void Profile::set_show_top_functions(bool show)
  468. {
  469. if (m_show_top_functions == show)
  470. return;
  471. m_show_top_functions = show;
  472. rebuild_tree();
  473. }
  474. void Profile::set_show_percentages(bool show_percentages)
  475. {
  476. if (m_show_percentages == show_percentages)
  477. return;
  478. m_show_percentages = show_percentages;
  479. }
  480. void Profile::set_disassembly_index(GUI::ModelIndex const& index)
  481. {
  482. if (m_disassembly_index == index)
  483. return;
  484. m_disassembly_index = index;
  485. auto* node = static_cast<ProfileNode*>(index.internal_data());
  486. if (!node)
  487. m_disassembly_model = nullptr;
  488. else
  489. m_disassembly_model = DisassemblyModel::create(*this, *node);
  490. }
  491. GUI::Model* Profile::disassembly_model()
  492. {
  493. return m_disassembly_model;
  494. }
  495. void Profile::set_source_index(GUI::ModelIndex const& index)
  496. {
  497. if (m_source_index == index)
  498. return;
  499. m_source_index = index;
  500. auto* node = static_cast<ProfileNode*>(index.internal_data());
  501. if (!node)
  502. m_source_model = nullptr;
  503. else
  504. m_source_model = SourceModel::create(*this, *node);
  505. }
  506. GUI::Model* Profile::source_model()
  507. {
  508. return m_source_model;
  509. }
  510. GUI::Model* Profile::file_event_model()
  511. {
  512. return m_file_event_model;
  513. }
  514. ProfileNode::ProfileNode(Process const& process)
  515. : m_root(true)
  516. , m_process(process)
  517. {
  518. }
  519. ProfileNode::ProfileNode(Process const& process, DeprecatedFlyString const& object_name, DeprecatedString symbol, FlatPtr address, u32 offset, u64 timestamp, pid_t pid)
  520. : m_process(process)
  521. , m_symbol(move(symbol))
  522. , m_pid(pid)
  523. , m_address(address)
  524. , m_offset(offset)
  525. , m_timestamp(timestamp)
  526. {
  527. DeprecatedString object;
  528. if (object_name.ends_with(": .text"sv)) {
  529. object = object_name.view().substring_view(0, object_name.length() - 7);
  530. } else {
  531. object = object_name;
  532. }
  533. m_object_name = LexicalPath::basename(object);
  534. }
  535. }