Profile.cpp 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461
  1. /*
  2. * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include "Profile.h"
  7. #include "DisassemblyModel.h"
  8. #include "ProfileModel.h"
  9. #include "SamplesModel.h"
  10. #include <AK/HashTable.h>
  11. #include <AK/LexicalPath.h>
  12. #include <AK/MappedFile.h>
  13. #include <AK/NonnullOwnPtrVector.h>
  14. #include <AK/QuickSort.h>
  15. #include <AK/RefPtr.h>
  16. #include <LibCore/File.h>
  17. #include <LibELF/Image.h>
  18. #include <sys/stat.h>
  19. static void sort_profile_nodes(Vector<NonnullRefPtr<ProfileNode>>& nodes)
  20. {
  21. quick_sort(nodes.begin(), nodes.end(), [](auto& a, auto& b) {
  22. return a->event_count() >= b->event_count();
  23. });
  24. for (auto& child : nodes)
  25. child->sort_children();
  26. }
  27. Profile::Profile(Vector<Process> processes, Vector<Event> events)
  28. : m_processes(move(processes))
  29. , m_events(move(events))
  30. {
  31. m_first_timestamp = m_events.first().timestamp;
  32. m_last_timestamp = m_events.last().timestamp;
  33. m_model = ProfileModel::create(*this);
  34. m_samples_model = SamplesModel::create(*this);
  35. for (auto& event : m_events) {
  36. m_deepest_stack_depth = max((u32)event.frames.size(), m_deepest_stack_depth);
  37. }
  38. rebuild_tree();
  39. }
  40. Profile::~Profile()
  41. {
  42. }
  43. GUI::Model& Profile::model()
  44. {
  45. return *m_model;
  46. }
  47. GUI::Model& Profile::samples_model()
  48. {
  49. return *m_samples_model;
  50. }
  51. void Profile::rebuild_tree()
  52. {
  53. Vector<NonnullRefPtr<ProfileNode>> roots;
  54. auto find_or_create_root = [&roots](FlyString object_name, String symbol, u32 address, u32 offset, u64 timestamp, pid_t pid) -> ProfileNode& {
  55. for (auto root : roots) {
  56. if (root->symbol() == symbol) {
  57. return root;
  58. }
  59. }
  60. auto new_root = ProfileNode::create(move(object_name), move(symbol), address, offset, timestamp, pid);
  61. roots.append(new_root);
  62. return new_root;
  63. };
  64. HashTable<FlatPtr> live_allocations;
  65. for_each_event_in_filter_range([&](auto& event) {
  66. if (event.type == "malloc")
  67. live_allocations.set(event.ptr);
  68. else if (event.type == "free")
  69. live_allocations.remove(event.ptr);
  70. });
  71. m_filtered_event_indices.clear();
  72. for (size_t event_index = 0; event_index < m_events.size(); ++event_index) {
  73. auto& event = m_events.at(event_index);
  74. if (has_timestamp_filter_range()) {
  75. auto timestamp = event.timestamp;
  76. if (timestamp < m_timestamp_filter_range_start || timestamp > m_timestamp_filter_range_end)
  77. continue;
  78. }
  79. if (has_process_filter()) {
  80. if (event.pid != m_process_filter_pid || event.timestamp < m_process_filter_start_valid || event.timestamp > m_process_filter_end_valid)
  81. continue;
  82. }
  83. m_filtered_event_indices.append(event_index);
  84. if (event.type == "malloc" && !live_allocations.contains(event.ptr))
  85. continue;
  86. if (event.type == "free")
  87. continue;
  88. auto for_each_frame = [&]<typename Callback>(Callback callback) {
  89. if (!m_inverted) {
  90. for (size_t i = 0; i < event.frames.size(); ++i) {
  91. if (callback(event.frames.at(i), i == event.frames.size() - 1) == IterationDecision::Break)
  92. break;
  93. }
  94. } else {
  95. for (ssize_t i = event.frames.size() - 1; i >= 0; --i) {
  96. if (callback(event.frames.at(i), static_cast<size_t>(i) == event.frames.size() - 1) == IterationDecision::Break)
  97. break;
  98. }
  99. }
  100. };
  101. if (!m_show_top_functions) {
  102. ProfileNode* node = nullptr;
  103. for_each_frame([&](const Frame& frame, bool is_innermost_frame) {
  104. auto& object_name = frame.object_name;
  105. auto& symbol = frame.symbol;
  106. auto& address = frame.address;
  107. auto& offset = frame.offset;
  108. if (symbol.is_empty())
  109. return IterationDecision::Break;
  110. // FIXME: More cheating with intentional mixing of TID/PID here:
  111. if (!node)
  112. node = &find_or_create_root(object_name, symbol, address, offset, event.timestamp, event.pid);
  113. else
  114. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  115. node->increment_event_count();
  116. if (is_innermost_frame) {
  117. node->add_event_address(address);
  118. node->increment_self_count();
  119. }
  120. return IterationDecision::Continue;
  121. });
  122. } else {
  123. for (size_t i = 0; i < event.frames.size(); ++i) {
  124. ProfileNode* node = nullptr;
  125. ProfileNode* root = nullptr;
  126. for (size_t j = i; j < event.frames.size(); ++j) {
  127. auto& frame = event.frames.at(j);
  128. auto& object_name = frame.object_name;
  129. auto& symbol = frame.symbol;
  130. auto& address = frame.address;
  131. auto& offset = frame.offset;
  132. if (symbol.is_empty())
  133. break;
  134. // FIXME: More PID/TID mixing cheats here:
  135. if (!node) {
  136. node = &find_or_create_root(object_name, symbol, address, offset, event.timestamp, event.pid);
  137. root = node;
  138. root->will_track_seen_events(m_events.size());
  139. } else {
  140. node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
  141. }
  142. if (!root->has_seen_event(event_index)) {
  143. root->did_see_event(event_index);
  144. root->increment_event_count();
  145. } else if (node != root) {
  146. node->increment_event_count();
  147. }
  148. if (j == event.frames.size() - 1) {
  149. node->add_event_address(address);
  150. node->increment_self_count();
  151. }
  152. }
  153. }
  154. }
  155. }
  156. sort_profile_nodes(roots);
  157. m_roots = move(roots);
  158. m_model->update();
  159. }
  160. Result<NonnullOwnPtr<Profile>, String> Profile::load_from_perfcore_file(const StringView& path)
  161. {
  162. auto file = Core::File::construct(path);
  163. if (!file->open(Core::IODevice::ReadOnly))
  164. return String::formatted("Unable to open {}, error: {}", path, file->error_string());
  165. auto json = JsonValue::from_string(file->read_all());
  166. if (!json.has_value() || !json.value().is_object())
  167. return String { "Invalid perfcore format (not a JSON object)" };
  168. auto& object = json.value().as_object();
  169. auto file_or_error = MappedFile::map("/boot/Kernel");
  170. OwnPtr<ELF::Image> kernel_elf;
  171. if (!file_or_error.is_error())
  172. kernel_elf = make<ELF::Image>(file_or_error.value()->bytes());
  173. auto events_value = object.get("events");
  174. if (!events_value.is_array())
  175. return String { "Malformed profile (events is not an array)" };
  176. auto& perf_events = events_value.as_array();
  177. NonnullOwnPtrVector<Process> all_processes;
  178. HashMap<pid_t, Process*> current_processes;
  179. Vector<Event> events;
  180. for (auto& perf_event_value : perf_events.values()) {
  181. auto& perf_event = perf_event_value.as_object();
  182. Event event;
  183. event.timestamp = perf_event.get("timestamp").to_number<u64>();
  184. event.type = perf_event.get("type").to_string();
  185. event.pid = perf_event.get("pid").to_i32();
  186. event.tid = perf_event.get("tid").to_i32();
  187. if (event.type == "malloc") {
  188. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  189. event.size = perf_event.get("size").to_number<size_t>();
  190. } else if (event.type == "free") {
  191. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  192. } else if (event.type == "mmap") {
  193. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  194. event.size = perf_event.get("size").to_number<size_t>();
  195. event.name = perf_event.get("name").to_string();
  196. auto it = current_processes.find(event.pid);
  197. if (it != current_processes.end())
  198. it->value->library_metadata.handle_mmap(event.ptr, event.size, event.name);
  199. continue;
  200. } else if (event.type == "munmap") {
  201. event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
  202. event.size = perf_event.get("size").to_number<size_t>();
  203. continue;
  204. } else if (event.type == "process_create") {
  205. event.parent_pid = perf_event.get("parent_pid").to_number<FlatPtr>();
  206. event.executable = perf_event.get("executable").to_string();
  207. auto sampled_process = adopt_own(*new Process {
  208. .pid = event.pid,
  209. .executable = event.executable,
  210. .start_valid = event.timestamp,
  211. });
  212. current_processes.set(sampled_process->pid, sampled_process);
  213. all_processes.append(move(sampled_process));
  214. continue;
  215. } else if (event.type == "process_exec") {
  216. event.executable = perf_event.get("executable").to_string();
  217. auto old_process = current_processes.get(event.pid).value();
  218. old_process->end_valid = event.timestamp - 1;
  219. current_processes.remove(event.pid);
  220. auto sampled_process = adopt_own(*new Process {
  221. .pid = event.pid,
  222. .executable = event.executable,
  223. .start_valid = event.timestamp });
  224. current_processes.set(sampled_process->pid, sampled_process);
  225. all_processes.append(move(sampled_process));
  226. continue;
  227. } else if (event.type == "process_exit") {
  228. auto old_process = current_processes.get(event.pid).value();
  229. old_process->end_valid = event.timestamp - 1;
  230. current_processes.remove(event.pid);
  231. continue;
  232. } else if (event.type == "thread_create") {
  233. event.parent_tid = perf_event.get("parent_tid").to_i32();
  234. auto it = current_processes.find(event.pid);
  235. if (it != current_processes.end())
  236. it->value->handle_thread_create(event.tid, event.timestamp);
  237. continue;
  238. } else if (event.type == "thread_exit") {
  239. auto it = current_processes.find(event.pid);
  240. if (it != current_processes.end())
  241. it->value->handle_thread_exit(event.tid, event.timestamp);
  242. continue;
  243. }
  244. auto stack_array = perf_event.get("stack").as_array();
  245. for (ssize_t i = stack_array.values().size() - 1; i >= 0; --i) {
  246. auto& frame = stack_array.at(i);
  247. auto ptr = frame.to_number<u32>();
  248. u32 offset = 0;
  249. FlyString object_name;
  250. String symbol;
  251. if (ptr >= 0xc0000000) {
  252. if (kernel_elf) {
  253. symbol = kernel_elf->symbolicate(ptr, &offset);
  254. } else {
  255. symbol = String::formatted("?? <{:p}>", ptr);
  256. }
  257. } else {
  258. auto it = current_processes.find(event.pid);
  259. // FIXME: This logic is kinda gnarly, find a way to clean it up.
  260. LibraryMetadata* library_metadata {};
  261. if (it != current_processes.end())
  262. library_metadata = &it->value->library_metadata;
  263. if (auto* library = library_metadata ? library_metadata->library_containing(ptr) : nullptr) {
  264. object_name = library->name;
  265. symbol = library->symbolicate(ptr, &offset);
  266. } else {
  267. symbol = String::formatted("?? <{:p}>", ptr);
  268. }
  269. }
  270. event.frames.append({ object_name, symbol, ptr, offset });
  271. }
  272. if (event.frames.size() < 2)
  273. continue;
  274. FlatPtr innermost_frame_address = event.frames.at(1).address;
  275. event.in_kernel = innermost_frame_address >= 0xc0000000;
  276. events.append(move(event));
  277. }
  278. if (events.is_empty())
  279. return String { "No events captured (targeted process was never on CPU)" };
  280. quick_sort(all_processes, [](auto& a, auto& b) {
  281. if (a.pid == b.pid)
  282. return a.start_valid < b.start_valid;
  283. else
  284. return a.pid < b.pid;
  285. });
  286. Vector<Process> processes;
  287. for (auto& it : all_processes)
  288. processes.append(move(it));
  289. return adopt_own(*new Profile(move(processes), move(events)));
  290. }
  291. void ProfileNode::sort_children()
  292. {
  293. sort_profile_nodes(m_children);
  294. }
  295. void Profile::set_timestamp_filter_range(u64 start, u64 end)
  296. {
  297. if (m_has_timestamp_filter_range && m_timestamp_filter_range_start == start && m_timestamp_filter_range_end == end)
  298. return;
  299. m_has_timestamp_filter_range = true;
  300. m_timestamp_filter_range_start = min(start, end);
  301. m_timestamp_filter_range_end = max(start, end);
  302. rebuild_tree();
  303. m_samples_model->update();
  304. }
  305. void Profile::clear_timestamp_filter_range()
  306. {
  307. if (!m_has_timestamp_filter_range)
  308. return;
  309. m_has_timestamp_filter_range = false;
  310. rebuild_tree();
  311. m_samples_model->update();
  312. }
  313. void Profile::set_process_filter(pid_t pid, u64 start_valid, u64 end_valid)
  314. {
  315. if (m_has_process_filter && m_process_filter_pid == pid && m_process_filter_start_valid == start_valid && m_process_filter_end_valid == end_valid)
  316. return;
  317. m_has_process_filter = true;
  318. m_process_filter_pid = pid;
  319. m_process_filter_start_valid = start_valid;
  320. m_process_filter_end_valid = end_valid;
  321. rebuild_tree();
  322. if (m_disassembly_model)
  323. m_disassembly_model->update();
  324. m_samples_model->update();
  325. }
  326. void Profile::clear_process_filter()
  327. {
  328. if (!m_has_process_filter)
  329. return;
  330. m_has_process_filter = false;
  331. rebuild_tree();
  332. if (m_disassembly_model)
  333. m_disassembly_model->update();
  334. m_samples_model->update();
  335. }
  336. void Profile::set_inverted(bool inverted)
  337. {
  338. if (m_inverted == inverted)
  339. return;
  340. m_inverted = inverted;
  341. rebuild_tree();
  342. }
  343. void Profile::set_show_top_functions(bool show)
  344. {
  345. if (m_show_top_functions == show)
  346. return;
  347. m_show_top_functions = show;
  348. rebuild_tree();
  349. }
  350. void Profile::set_show_percentages(bool show_percentages)
  351. {
  352. if (m_show_percentages == show_percentages)
  353. return;
  354. m_show_percentages = show_percentages;
  355. }
  356. void Profile::set_disassembly_index(const GUI::ModelIndex& index)
  357. {
  358. if (m_disassembly_index == index)
  359. return;
  360. m_disassembly_index = index;
  361. auto* node = static_cast<ProfileNode*>(index.internal_data());
  362. m_disassembly_model = DisassemblyModel::create(*this, *node);
  363. }
  364. GUI::Model* Profile::disassembly_model()
  365. {
  366. return m_disassembly_model;
  367. }
  368. ProfileNode::ProfileNode(const String& object_name, String symbol, u32 address, u32 offset, u64 timestamp, pid_t pid)
  369. : m_symbol(move(symbol))
  370. , m_pid(pid)
  371. , m_address(address)
  372. , m_offset(offset)
  373. , m_timestamp(timestamp)
  374. {
  375. String object;
  376. if (object_name.ends_with(": .text")) {
  377. object = object_name.view().substring_view(0, object_name.length() - 7);
  378. } else {
  379. object = object_name;
  380. }
  381. m_object_name = LexicalPath(object).basename();
  382. }
  383. const Process* ProfileNode::process(Profile& profile, u64 timestamp) const
  384. {
  385. return profile.find_process(m_pid, timestamp);
  386. }