Profile.cpp 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507
  1. /*
  2. * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include "Profile.h"
  7. #include "DisassemblyModel.h"
  8. #include "ProfileModel.h"
  9. #include "SamplesModel.h"
  10. #include <AK/HashTable.h>
  11. #include <AK/LexicalPath.h>
  12. #include <AK/MappedFile.h>
  13. #include <AK/NonnullOwnPtrVector.h>
  14. #include <AK/QuickSort.h>
  15. #include <AK/RefPtr.h>
  16. #include <LibCore/File.h>
  17. #include <LibELF/Image.h>
  18. #include <LibSymbolication/Symbolication.h>
  19. #include <sys/stat.h>
  20. namespace Profiler {
  21. static void sort_profile_nodes(Vector<NonnullRefPtr<ProfileNode>>& nodes)
  22. {
  23. quick_sort(nodes.begin(), nodes.end(), [](auto& a, auto& b) {
  24. return a->event_count() >= b->event_count();
  25. });
  26. for (auto& child : nodes)
  27. child->sort_children();
  28. }
  29. Profile::Profile(Vector<Process> processes, Vector<Event> events)
  30. : m_processes(move(processes))
  31. , m_events(move(events))
  32. {
  33. m_first_timestamp = m_events.first().timestamp;
  34. m_last_timestamp = m_events.last().timestamp;
  35. m_model = ProfileModel::create(*this);
  36. m_samples_model = SamplesModel::create(*this);
  37. rebuild_tree();
  38. }
  39. GUI::Model& Profile::model()
  40. {
  41. return *m_model;
  42. }
  43. GUI::Model& Profile::samples_model()
  44. {
  45. return *m_samples_model;
  46. }
  47. void Profile::rebuild_tree()
  48. {
  49. Vector<NonnullRefPtr<ProfileNode>> roots;
  50. auto find_or_create_process_node = [this, &roots](pid_t pid, EventSerialNumber serial) -> ProfileNode& {
  51. auto* process = find_process(pid, serial);
  52. if (!process) {
  53. dbgln("Profile contains event for unknown process with pid={}, serial={}", pid, serial.to_number());
  54. VERIFY_NOT_REACHED();
  55. }
  56. for (auto root : roots) {
  57. if (&root->process() == process)
  58. return root;
  59. }
  60. auto new_root = ProfileNode::create_process_node(*process);
  61. roots.append(new_root);
  62. return new_root;
  63. };
  64. HashTable<FlatPtr> live_allocations;
  65. for_each_event_in_filter_range([&](auto& event) {
  66. if (event.type == "malloc"sv)
  67. live_allocations.set(event.ptr);
  68. else if (event.type == "free"sv)
  69. live_allocations.remove(event.ptr);
  70. });
  71. m_filtered_event_indices.clear();
  72. for (size_t event_index = 0; event_index < m_events.size(); ++event_index) {
  73. auto& event = m_events.at(event_index);
  74. if (has_timestamp_filter_range()) {
  75. auto timestamp = event.timestamp;
  76. if (timestamp < m_timestamp_filter_range_start || timestamp > m_timestamp_filter_range_end)
  77. continue;
  78. }
  79. if (!process_filter_contains(event.pid, event.serial))
  80. continue;
  81. m_filtered_event_indices.append(event_index);
  82. if (event.type == "malloc"sv && !live_allocations.contains(event.ptr))
  83. continue;
  84. if (event.type == "free"sv)
  85. continue;
  86. auto for_each_frame = [&]<typename Callback>(Callback callback) {
  87. if (!m_inverted) {
  88. for (size_t i = 0; i < event.frames.size(); ++i) {
  89. if (callback(event.frames.at(i), i == event.frames.size() - 1) == IterationDecision::Break)
  90. break;
  91. }
  92. } else {
  93. for (ssize_t i = event.frames.size() - 1; i >= 0; --i) {
  94. if (callback(event.frames.at(i), static_cast<size_t>(i) == event.frames.size() - 1) == IterationDecision::Break)
  95. break;
  96. }
  97. }
  98. };
  99. if (!m_show_top_functions) {
  100. ProfileNode* node = nullptr;
  101. auto& process_node = find_or_create_process_node(event.pid, event.serial);
  102. process_node.increment_event_count();
  103. for_each_frame([&](const Frame& frame, bool is_innermost_frame) {
  104. auto& object_name = frame.object_name;
  105. auto& symbol = frame.symbol;
  106. auto& address = frame.address;
  107. auto& offset = frame.offset;
  108. if (symbol.is_empty())
  109. return IterationDecision::Break;
  110. // FIXME: More cheating with intentional mixing of TID/PID here:
  111. if (!node)
  112. node = &process_node;
  113. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  114. node->increment_event_count();
  115. if (is_innermost_frame) {
  116. node->add_event_address(address);
  117. node->increment_self_count();
  118. }
  119. return IterationDecision::Continue;
  120. });
  121. } else {
  122. auto& process_node = find_or_create_process_node(event.pid, event.serial);
  123. process_node.increment_event_count();
  124. for (size_t i = 0; i < event.frames.size(); ++i) {
  125. ProfileNode* node = nullptr;
  126. ProfileNode* root = nullptr;
  127. for (size_t j = i; j < event.frames.size(); ++j) {
  128. auto& frame = event.frames.at(j);
  129. auto& object_name = frame.object_name;
  130. auto& symbol = frame.symbol;
  131. auto& address = frame.address;
  132. auto& offset = frame.offset;
  133. if (symbol.is_empty())
  134. break;
  135. // FIXME: More PID/TID mixing cheats here:
  136. if (!node) {
  137. node = &find_or_create_process_node(event.pid, event.serial);
  138. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  139. root = node;
  140. root->will_track_seen_events(m_events.size());
  141. } else {
  142. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  143. }
  144. if (!root->has_seen_event(event_index)) {
  145. root->did_see_event(event_index);
  146. root->increment_event_count();
  147. } else if (node != root) {
  148. node->increment_event_count();
  149. }
  150. if (j == event.frames.size() - 1) {
  151. node->add_event_address(address);
  152. node->increment_self_count();
  153. }
  154. }
  155. }
  156. }
  157. }
  158. sort_profile_nodes(roots);
  159. m_roots = move(roots);
  160. m_model->invalidate();
  161. }
  162. Result<NonnullOwnPtr<Profile>, String> Profile::load_from_perfcore_file(const StringView& path)
  163. {
  164. auto file = Core::File::construct(path);
  165. if (!file->open(Core::OpenMode::ReadOnly))
  166. return String::formatted("Unable to open {}, error: {}", path, file->error_string());
  167. auto json = JsonValue::from_string(file->read_all());
  168. if (!json.has_value() || !json.value().is_object())
  169. return String { "Invalid perfcore format (not a JSON object)" };
  170. auto& object = json.value().as_object();
  171. auto file_or_error = MappedFile::map("/boot/Kernel.debug");
  172. OwnPtr<ELF::Image> kernel_elf;
  173. if (!file_or_error.is_error())
  174. kernel_elf = make<ELF::Image>(file_or_error.value()->bytes());
  175. auto events_value = object.get_ptr("events");
  176. if (!events_value || !events_value->is_array())
  177. return String { "Malformed profile (events is not an array)" };
  178. auto& perf_events = events_value->as_array();
  179. NonnullOwnPtrVector<Process> all_processes;
  180. HashMap<pid_t, Process*> current_processes;
  181. Vector<Event> events;
  182. EventSerialNumber next_serial;
  183. for (auto& perf_event_value : perf_events.values()) {
  184. auto& perf_event = perf_event_value.as_object();
  185. Event event;
  186. event.serial = next_serial;
  187. next_serial.increment();
  188. event.timestamp = perf_event.get("timestamp").to_number<u64>();
  189. event.lost_samples = perf_event.get("lost_samples").to_number<u32>();
  190. event.type = perf_event.get("type").to_string();
  191. event.pid = perf_event.get("pid").to_i32();
  192. event.tid = perf_event.get("tid").to_i32();
  193. if (event.type == "malloc"sv) {
  194. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  195. event.size = perf_event.get("size").to_number<size_t>();
  196. } else if (event.type == "free"sv) {
  197. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  198. } else if (event.type == "mmap"sv) {
  199. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  200. event.size = perf_event.get("size").to_number<size_t>();
  201. event.name = perf_event.get("name").to_string();
  202. auto it = current_processes.find(event.pid);
  203. if (it != current_processes.end())
  204. it->value->library_metadata.handle_mmap(event.ptr, event.size, event.name);
  205. continue;
  206. } else if (event.type == "munmap"sv) {
  207. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  208. event.size = perf_event.get("size").to_number<size_t>();
  209. continue;
  210. } else if (event.type == "process_create"sv) {
  211. event.parent_pid = perf_event.get("parent_pid").to_number<FlatPtr>();
  212. event.executable = perf_event.get("executable").to_string();
  213. auto sampled_process = adopt_own(*new Process {
  214. .pid = event.pid,
  215. .executable = event.executable,
  216. .basename = LexicalPath::basename(event.executable),
  217. .start_valid = event.serial,
  218. .end_valid = {},
  219. });
  220. current_processes.set(sampled_process->pid, sampled_process);
  221. all_processes.append(move(sampled_process));
  222. continue;
  223. } else if (event.type == "process_exec"sv) {
  224. event.executable = perf_event.get("executable").to_string();
  225. auto old_process = current_processes.get(event.pid).value();
  226. old_process->end_valid = event.serial;
  227. current_processes.remove(event.pid);
  228. auto sampled_process = adopt_own(*new Process {
  229. .pid = event.pid,
  230. .executable = event.executable,
  231. .basename = LexicalPath::basename(event.executable),
  232. .start_valid = event.serial,
  233. .end_valid = {},
  234. });
  235. current_processes.set(sampled_process->pid, sampled_process);
  236. all_processes.append(move(sampled_process));
  237. continue;
  238. } else if (event.type == "process_exit"sv) {
  239. auto old_process = current_processes.get(event.pid).value();
  240. old_process->end_valid = event.serial;
  241. current_processes.remove(event.pid);
  242. continue;
  243. } else if (event.type == "thread_create"sv) {
  244. event.parent_tid = perf_event.get("parent_tid").to_i32();
  245. auto it = current_processes.find(event.pid);
  246. if (it != current_processes.end())
  247. it->value->handle_thread_create(event.tid, event.serial);
  248. continue;
  249. } else if (event.type == "thread_exit"sv) {
  250. auto it = current_processes.find(event.pid);
  251. if (it != current_processes.end())
  252. it->value->handle_thread_exit(event.tid, event.serial);
  253. continue;
  254. }
  255. auto maybe_kernel_base = Symbolication::kernel_base();
  256. auto* stack = perf_event.get_ptr("stack");
  257. VERIFY(stack);
  258. auto& stack_array = stack->as_array();
  259. for (ssize_t i = stack_array.values().size() - 1; i >= 0; --i) {
  260. auto& frame = stack_array.at(i);
  261. auto ptr = frame.to_number<u64>();
  262. u32 offset = 0;
  263. FlyString object_name;
  264. String symbol;
  265. if (maybe_kernel_base.has_value() && ptr >= maybe_kernel_base.value()) {
  266. if (kernel_elf) {
  267. symbol = kernel_elf->symbolicate(ptr - maybe_kernel_base.value(), &offset);
  268. } else {
  269. symbol = String::formatted("?? <{:p}>", ptr);
  270. }
  271. } else {
  272. auto it = current_processes.find(event.pid);
  273. // FIXME: This logic is kinda gnarly, find a way to clean it up.
  274. LibraryMetadata* library_metadata {};
  275. if (it != current_processes.end())
  276. library_metadata = &it->value->library_metadata;
  277. if (auto* library = library_metadata ? library_metadata->library_containing(ptr) : nullptr) {
  278. object_name = library->name;
  279. symbol = library->symbolicate(ptr, &offset);
  280. } else {
  281. symbol = String::formatted("?? <{:p}>", ptr);
  282. }
  283. }
  284. event.frames.append({ object_name, symbol, (FlatPtr)ptr, offset });
  285. }
  286. if (event.frames.size() < 2)
  287. continue;
  288. FlatPtr innermost_frame_address = event.frames.at(1).address;
  289. event.in_kernel = maybe_kernel_base.has_value() && innermost_frame_address >= maybe_kernel_base.value();
  290. events.append(move(event));
  291. }
  292. if (events.is_empty())
  293. return String { "No events captured (targeted process was never on CPU)" };
  294. quick_sort(all_processes, [](auto& a, auto& b) {
  295. if (a.pid == b.pid)
  296. return a.start_valid < b.start_valid;
  297. else
  298. return a.pid < b.pid;
  299. });
  300. Vector<Process> processes;
  301. for (auto& it : all_processes)
  302. processes.append(move(it));
  303. return adopt_own(*new Profile(move(processes), move(events)));
  304. }
  305. void ProfileNode::sort_children()
  306. {
  307. sort_profile_nodes(m_children);
  308. }
  309. void Profile::set_timestamp_filter_range(u64 start, u64 end)
  310. {
  311. if (m_has_timestamp_filter_range && m_timestamp_filter_range_start == start && m_timestamp_filter_range_end == end)
  312. return;
  313. m_has_timestamp_filter_range = true;
  314. m_timestamp_filter_range_start = min(start, end);
  315. m_timestamp_filter_range_end = max(start, end);
  316. rebuild_tree();
  317. m_samples_model->invalidate();
  318. }
  319. void Profile::clear_timestamp_filter_range()
  320. {
  321. if (!m_has_timestamp_filter_range)
  322. return;
  323. m_has_timestamp_filter_range = false;
  324. rebuild_tree();
  325. m_samples_model->invalidate();
  326. }
  327. void Profile::add_process_filter(pid_t pid, EventSerialNumber start_valid, EventSerialNumber end_valid)
  328. {
  329. auto filter = ProcessFilter { pid, start_valid, end_valid };
  330. if (m_process_filters.contains_slow(filter))
  331. return;
  332. m_process_filters.append(move(filter));
  333. rebuild_tree();
  334. if (m_disassembly_model)
  335. m_disassembly_model->invalidate();
  336. m_samples_model->invalidate();
  337. }
  338. void Profile::remove_process_filter(pid_t pid, EventSerialNumber start_valid, EventSerialNumber end_valid)
  339. {
  340. auto filter = ProcessFilter { pid, start_valid, end_valid };
  341. if (!m_process_filters.contains_slow(filter))
  342. return;
  343. m_process_filters.remove_first_matching([&filter](ProcessFilter const& other_filter) {
  344. return other_filter == filter;
  345. });
  346. rebuild_tree();
  347. if (m_disassembly_model)
  348. m_disassembly_model->invalidate();
  349. m_samples_model->invalidate();
  350. }
  351. void Profile::clear_process_filter()
  352. {
  353. if (m_process_filters.is_empty())
  354. return;
  355. m_process_filters.clear();
  356. rebuild_tree();
  357. if (m_disassembly_model)
  358. m_disassembly_model->invalidate();
  359. m_samples_model->invalidate();
  360. }
  361. bool Profile::process_filter_contains(pid_t pid, EventSerialNumber serial)
  362. {
  363. if (!has_process_filter())
  364. return true;
  365. for (auto const& process_filter : m_process_filters)
  366. if (pid == process_filter.pid && serial >= process_filter.start_valid && serial <= process_filter.end_valid)
  367. return true;
  368. return false;
  369. }
  370. void Profile::set_inverted(bool inverted)
  371. {
  372. if (m_inverted == inverted)
  373. return;
  374. m_inverted = inverted;
  375. rebuild_tree();
  376. }
  377. void Profile::set_show_top_functions(bool show)
  378. {
  379. if (m_show_top_functions == show)
  380. return;
  381. m_show_top_functions = show;
  382. rebuild_tree();
  383. }
  384. void Profile::set_show_percentages(bool show_percentages)
  385. {
  386. if (m_show_percentages == show_percentages)
  387. return;
  388. m_show_percentages = show_percentages;
  389. }
  390. void Profile::set_disassembly_index(const GUI::ModelIndex& index)
  391. {
  392. if (m_disassembly_index == index)
  393. return;
  394. m_disassembly_index = index;
  395. auto* node = static_cast<ProfileNode*>(index.internal_data());
  396. if (!node)
  397. m_disassembly_model = nullptr;
  398. else
  399. m_disassembly_model = DisassemblyModel::create(*this, *node);
  400. }
  401. GUI::Model* Profile::disassembly_model()
  402. {
  403. return m_disassembly_model;
  404. }
  405. ProfileNode::ProfileNode(Process const& process)
  406. : m_root(true)
  407. , m_process(process)
  408. {
  409. }
  410. ProfileNode::ProfileNode(Process const& process, const String& object_name, String symbol, FlatPtr address, u32 offset, u64 timestamp, pid_t pid)
  411. : m_process(process)
  412. , m_symbol(move(symbol))
  413. , m_pid(pid)
  414. , m_address(address)
  415. , m_offset(offset)
  416. , m_timestamp(timestamp)
  417. {
  418. String object;
  419. if (object_name.ends_with(": .text"sv)) {
  420. object = object_name.view().substring_view(0, object_name.length() - 7);
  421. } else {
  422. object = object_name;
  423. }
  424. m_object_name = LexicalPath::basename(object);
  425. }
  426. }