Profile.cpp 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504
  1. /*
  2. * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include "Profile.h"
  7. #include "DisassemblyModel.h"
  8. #include "ProfileModel.h"
  9. #include "SamplesModel.h"
  10. #include <AK/HashTable.h>
  11. #include <AK/LexicalPath.h>
  12. #include <AK/MappedFile.h>
  13. #include <AK/NonnullOwnPtrVector.h>
  14. #include <AK/QuickSort.h>
  15. #include <AK/RefPtr.h>
  16. #include <LibCore/File.h>
  17. #include <LibELF/Image.h>
  18. #include <sys/stat.h>
  19. namespace Profiler {
  20. static void sort_profile_nodes(Vector<NonnullRefPtr<ProfileNode>>& nodes)
  21. {
  22. quick_sort(nodes.begin(), nodes.end(), [](auto& a, auto& b) {
  23. return a->event_count() >= b->event_count();
  24. });
  25. for (auto& child : nodes)
  26. child->sort_children();
  27. }
  28. Profile::Profile(Vector<Process> processes, Vector<Event> events)
  29. : m_processes(move(processes))
  30. , m_events(move(events))
  31. {
  32. m_first_timestamp = m_events.first().timestamp;
  33. m_last_timestamp = m_events.last().timestamp;
  34. m_model = ProfileModel::create(*this);
  35. m_samples_model = SamplesModel::create(*this);
  36. rebuild_tree();
  37. }
  38. GUI::Model& Profile::model()
  39. {
  40. return *m_model;
  41. }
  42. GUI::Model& Profile::samples_model()
  43. {
  44. return *m_samples_model;
  45. }
  46. void Profile::rebuild_tree()
  47. {
  48. Vector<NonnullRefPtr<ProfileNode>> roots;
  49. auto find_or_create_process_node = [this, &roots](pid_t pid, EventSerialNumber serial) -> ProfileNode& {
  50. auto* process = find_process(pid, serial);
  51. if (!process) {
  52. dbgln("Profile contains event for unknown process with pid={}, serial={}", pid, serial.to_number());
  53. VERIFY_NOT_REACHED();
  54. }
  55. for (auto root : roots) {
  56. if (&root->process() == process)
  57. return root;
  58. }
  59. auto new_root = ProfileNode::create_process_node(*process);
  60. roots.append(new_root);
  61. return new_root;
  62. };
  63. HashTable<FlatPtr> live_allocations;
  64. for_each_event_in_filter_range([&](auto& event) {
  65. if (event.type == "malloc"sv)
  66. live_allocations.set(event.ptr);
  67. else if (event.type == "free"sv)
  68. live_allocations.remove(event.ptr);
  69. });
  70. m_filtered_event_indices.clear();
  71. for (size_t event_index = 0; event_index < m_events.size(); ++event_index) {
  72. auto& event = m_events.at(event_index);
  73. if (has_timestamp_filter_range()) {
  74. auto timestamp = event.timestamp;
  75. if (timestamp < m_timestamp_filter_range_start || timestamp > m_timestamp_filter_range_end)
  76. continue;
  77. }
  78. if (!process_filter_contains(event.pid, event.serial))
  79. continue;
  80. m_filtered_event_indices.append(event_index);
  81. if (event.type == "malloc"sv && !live_allocations.contains(event.ptr))
  82. continue;
  83. if (event.type == "free"sv)
  84. continue;
  85. auto for_each_frame = [&]<typename Callback>(Callback callback) {
  86. if (!m_inverted) {
  87. for (size_t i = 0; i < event.frames.size(); ++i) {
  88. if (callback(event.frames.at(i), i == event.frames.size() - 1) == IterationDecision::Break)
  89. break;
  90. }
  91. } else {
  92. for (ssize_t i = event.frames.size() - 1; i >= 0; --i) {
  93. if (callback(event.frames.at(i), static_cast<size_t>(i) == event.frames.size() - 1) == IterationDecision::Break)
  94. break;
  95. }
  96. }
  97. };
  98. if (!m_show_top_functions) {
  99. ProfileNode* node = nullptr;
  100. auto& process_node = find_or_create_process_node(event.pid, event.serial);
  101. process_node.increment_event_count();
  102. for_each_frame([&](const Frame& frame, bool is_innermost_frame) {
  103. auto& object_name = frame.object_name;
  104. auto& symbol = frame.symbol;
  105. auto& address = frame.address;
  106. auto& offset = frame.offset;
  107. if (symbol.is_empty())
  108. return IterationDecision::Break;
  109. // FIXME: More cheating with intentional mixing of TID/PID here:
  110. if (!node)
  111. node = &process_node;
  112. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  113. node->increment_event_count();
  114. if (is_innermost_frame) {
  115. node->add_event_address(address);
  116. node->increment_self_count();
  117. }
  118. return IterationDecision::Continue;
  119. });
  120. } else {
  121. auto& process_node = find_or_create_process_node(event.pid, event.serial);
  122. process_node.increment_event_count();
  123. for (size_t i = 0; i < event.frames.size(); ++i) {
  124. ProfileNode* node = nullptr;
  125. ProfileNode* root = nullptr;
  126. for (size_t j = i; j < event.frames.size(); ++j) {
  127. auto& frame = event.frames.at(j);
  128. auto& object_name = frame.object_name;
  129. auto& symbol = frame.symbol;
  130. auto& address = frame.address;
  131. auto& offset = frame.offset;
  132. if (symbol.is_empty())
  133. break;
  134. // FIXME: More PID/TID mixing cheats here:
  135. if (!node) {
  136. node = &find_or_create_process_node(event.pid, event.serial);
  137. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  138. root = node;
  139. root->will_track_seen_events(m_events.size());
  140. } else {
  141. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  142. }
  143. if (!root->has_seen_event(event_index)) {
  144. root->did_see_event(event_index);
  145. root->increment_event_count();
  146. } else if (node != root) {
  147. node->increment_event_count();
  148. }
  149. if (j == event.frames.size() - 1) {
  150. node->add_event_address(address);
  151. node->increment_self_count();
  152. }
  153. }
  154. }
  155. }
  156. }
  157. sort_profile_nodes(roots);
  158. m_roots = move(roots);
  159. m_model->update();
  160. }
  161. Result<NonnullOwnPtr<Profile>, String> Profile::load_from_perfcore_file(const StringView& path)
  162. {
  163. auto file = Core::File::construct(path);
  164. if (!file->open(Core::OpenMode::ReadOnly))
  165. return String::formatted("Unable to open {}, error: {}", path, file->error_string());
  166. auto json = JsonValue::from_string(file->read_all());
  167. if (!json.has_value() || !json.value().is_object())
  168. return String { "Invalid perfcore format (not a JSON object)" };
  169. auto& object = json.value().as_object();
  170. auto file_or_error = MappedFile::map("/boot/Kernel.debug");
  171. OwnPtr<ELF::Image> kernel_elf;
  172. if (!file_or_error.is_error())
  173. kernel_elf = make<ELF::Image>(file_or_error.value()->bytes());
  174. auto events_value = object.get_ptr("events");
  175. if (!events_value || !events_value->is_array())
  176. return String { "Malformed profile (events is not an array)" };
  177. auto& perf_events = events_value->as_array();
  178. NonnullOwnPtrVector<Process> all_processes;
  179. HashMap<pid_t, Process*> current_processes;
  180. Vector<Event> events;
  181. EventSerialNumber next_serial;
  182. for (auto& perf_event_value : perf_events.values()) {
  183. auto& perf_event = perf_event_value.as_object();
  184. Event event;
  185. event.serial = next_serial;
  186. next_serial.increment();
  187. event.timestamp = perf_event.get("timestamp").to_number<u64>();
  188. event.lost_samples = perf_event.get("lost_samples").to_number<u32>();
  189. event.type = perf_event.get("type").to_string();
  190. event.pid = perf_event.get("pid").to_i32();
  191. event.tid = perf_event.get("tid").to_i32();
  192. if (event.type == "malloc"sv) {
  193. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  194. event.size = perf_event.get("size").to_number<size_t>();
  195. } else if (event.type == "free"sv) {
  196. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  197. } else if (event.type == "mmap"sv) {
  198. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  199. event.size = perf_event.get("size").to_number<size_t>();
  200. event.name = perf_event.get("name").to_string();
  201. auto it = current_processes.find(event.pid);
  202. if (it != current_processes.end())
  203. it->value->library_metadata.handle_mmap(event.ptr, event.size, event.name);
  204. continue;
  205. } else if (event.type == "munmap"sv) {
  206. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  207. event.size = perf_event.get("size").to_number<size_t>();
  208. continue;
  209. } else if (event.type == "process_create"sv) {
  210. event.parent_pid = perf_event.get("parent_pid").to_number<FlatPtr>();
  211. event.executable = perf_event.get("executable").to_string();
  212. auto sampled_process = adopt_own(*new Process {
  213. .pid = event.pid,
  214. .executable = event.executable,
  215. .basename = LexicalPath::basename(event.executable),
  216. .start_valid = event.serial,
  217. .end_valid = {},
  218. });
  219. current_processes.set(sampled_process->pid, sampled_process);
  220. all_processes.append(move(sampled_process));
  221. continue;
  222. } else if (event.type == "process_exec"sv) {
  223. event.executable = perf_event.get("executable").to_string();
  224. auto old_process = current_processes.get(event.pid).value();
  225. old_process->end_valid = event.serial;
  226. current_processes.remove(event.pid);
  227. auto sampled_process = adopt_own(*new Process {
  228. .pid = event.pid,
  229. .executable = event.executable,
  230. .basename = LexicalPath::basename(event.executable),
  231. .start_valid = event.serial,
  232. .end_valid = {},
  233. });
  234. current_processes.set(sampled_process->pid, sampled_process);
  235. all_processes.append(move(sampled_process));
  236. continue;
  237. } else if (event.type == "process_exit"sv) {
  238. auto old_process = current_processes.get(event.pid).value();
  239. old_process->end_valid = event.serial;
  240. current_processes.remove(event.pid);
  241. continue;
  242. } else if (event.type == "thread_create"sv) {
  243. event.parent_tid = perf_event.get("parent_tid").to_i32();
  244. auto it = current_processes.find(event.pid);
  245. if (it != current_processes.end())
  246. it->value->handle_thread_create(event.tid, event.serial);
  247. continue;
  248. } else if (event.type == "thread_exit"sv) {
  249. auto it = current_processes.find(event.pid);
  250. if (it != current_processes.end())
  251. it->value->handle_thread_exit(event.tid, event.serial);
  252. continue;
  253. }
  254. auto* stack = perf_event.get_ptr("stack");
  255. VERIFY(stack);
  256. auto& stack_array = stack->as_array();
  257. for (ssize_t i = stack_array.values().size() - 1; i >= 0; --i) {
  258. auto& frame = stack_array.at(i);
  259. auto ptr = frame.to_number<u32>();
  260. u32 offset = 0;
  261. FlyString object_name;
  262. String symbol;
  263. if (ptr >= 0xc0000000) {
  264. if (kernel_elf) {
  265. symbol = kernel_elf->symbolicate(ptr, &offset);
  266. } else {
  267. symbol = String::formatted("?? <{:p}>", ptr);
  268. }
  269. } else {
  270. auto it = current_processes.find(event.pid);
  271. // FIXME: This logic is kinda gnarly, find a way to clean it up.
  272. LibraryMetadata* library_metadata {};
  273. if (it != current_processes.end())
  274. library_metadata = &it->value->library_metadata;
  275. if (auto* library = library_metadata ? library_metadata->library_containing(ptr) : nullptr) {
  276. object_name = library->name;
  277. symbol = library->symbolicate(ptr, &offset);
  278. } else {
  279. symbol = String::formatted("?? <{:p}>", ptr);
  280. }
  281. }
  282. event.frames.append({ object_name, symbol, ptr, offset });
  283. }
  284. if (event.frames.size() < 2)
  285. continue;
  286. FlatPtr innermost_frame_address = event.frames.at(1).address;
  287. event.in_kernel = innermost_frame_address >= 0xc0000000;
  288. events.append(move(event));
  289. }
  290. if (events.is_empty())
  291. return String { "No events captured (targeted process was never on CPU)" };
  292. quick_sort(all_processes, [](auto& a, auto& b) {
  293. if (a.pid == b.pid)
  294. return a.start_valid < b.start_valid;
  295. else
  296. return a.pid < b.pid;
  297. });
  298. Vector<Process> processes;
  299. for (auto& it : all_processes)
  300. processes.append(move(it));
  301. return adopt_own(*new Profile(move(processes), move(events)));
  302. }
  303. void ProfileNode::sort_children()
  304. {
  305. sort_profile_nodes(m_children);
  306. }
  307. void Profile::set_timestamp_filter_range(u64 start, u64 end)
  308. {
  309. if (m_has_timestamp_filter_range && m_timestamp_filter_range_start == start && m_timestamp_filter_range_end == end)
  310. return;
  311. m_has_timestamp_filter_range = true;
  312. m_timestamp_filter_range_start = min(start, end);
  313. m_timestamp_filter_range_end = max(start, end);
  314. rebuild_tree();
  315. m_samples_model->update();
  316. }
  317. void Profile::clear_timestamp_filter_range()
  318. {
  319. if (!m_has_timestamp_filter_range)
  320. return;
  321. m_has_timestamp_filter_range = false;
  322. rebuild_tree();
  323. m_samples_model->update();
  324. }
  325. void Profile::add_process_filter(pid_t pid, EventSerialNumber start_valid, EventSerialNumber end_valid)
  326. {
  327. auto filter = ProcessFilter { pid, start_valid, end_valid };
  328. if (m_process_filters.contains_slow(filter))
  329. return;
  330. m_process_filters.append(move(filter));
  331. rebuild_tree();
  332. if (m_disassembly_model)
  333. m_disassembly_model->update();
  334. m_samples_model->update();
  335. }
  336. void Profile::remove_process_filter(pid_t pid, EventSerialNumber start_valid, EventSerialNumber end_valid)
  337. {
  338. auto filter = ProcessFilter { pid, start_valid, end_valid };
  339. if (!m_process_filters.contains_slow(filter))
  340. return;
  341. m_process_filters.remove_first_matching([&filter](ProcessFilter const& other_filter) {
  342. return other_filter == filter;
  343. });
  344. rebuild_tree();
  345. if (m_disassembly_model)
  346. m_disassembly_model->update();
  347. m_samples_model->update();
  348. }
  349. void Profile::clear_process_filter()
  350. {
  351. if (m_process_filters.is_empty())
  352. return;
  353. m_process_filters.clear();
  354. rebuild_tree();
  355. if (m_disassembly_model)
  356. m_disassembly_model->update();
  357. m_samples_model->update();
  358. }
  359. bool Profile::process_filter_contains(pid_t pid, EventSerialNumber serial)
  360. {
  361. if (!has_process_filter())
  362. return true;
  363. for (auto const& process_filter : m_process_filters)
  364. if (pid == process_filter.pid && serial >= process_filter.start_valid && serial <= process_filter.end_valid)
  365. return true;
  366. return false;
  367. }
  368. void Profile::set_inverted(bool inverted)
  369. {
  370. if (m_inverted == inverted)
  371. return;
  372. m_inverted = inverted;
  373. rebuild_tree();
  374. }
  375. void Profile::set_show_top_functions(bool show)
  376. {
  377. if (m_show_top_functions == show)
  378. return;
  379. m_show_top_functions = show;
  380. rebuild_tree();
  381. }
  382. void Profile::set_show_percentages(bool show_percentages)
  383. {
  384. if (m_show_percentages == show_percentages)
  385. return;
  386. m_show_percentages = show_percentages;
  387. }
  388. void Profile::set_disassembly_index(const GUI::ModelIndex& index)
  389. {
  390. if (m_disassembly_index == index)
  391. return;
  392. m_disassembly_index = index;
  393. auto* node = static_cast<ProfileNode*>(index.internal_data());
  394. if (!node)
  395. m_disassembly_model = nullptr;
  396. else
  397. m_disassembly_model = DisassemblyModel::create(*this, *node);
  398. }
  399. GUI::Model* Profile::disassembly_model()
  400. {
  401. return m_disassembly_model;
  402. }
  403. ProfileNode::ProfileNode(Process const& process)
  404. : m_root(true)
  405. , m_process(process)
  406. {
  407. }
  408. ProfileNode::ProfileNode(Process const& process, const String& object_name, String symbol, u32 address, u32 offset, u64 timestamp, pid_t pid)
  409. : m_process(process)
  410. , m_symbol(move(symbol))
  411. , m_pid(pid)
  412. , m_address(address)
  413. , m_offset(offset)
  414. , m_timestamp(timestamp)
  415. {
  416. String object;
  417. if (object_name.ends_with(": .text"sv)) {
  418. object = object_name.view().substring_view(0, object_name.length() - 7);
  419. } else {
  420. object = object_name;
  421. }
  422. m_object_name = LexicalPath::basename(object);
  423. }
  424. }