PerformanceEventBuffer.cpp

/*
 * Copyright (c) 2020-2021, Andreas Kling <kling@serenityos.org>
 *
 * SPDX-License-Identifier: BSD-2-Clause
 */

#include <AK/JsonArraySerializer.h>
#include <AK/JsonObjectSerializer.h>
#include <AK/ScopeGuard.h>
#include <Kernel/Arch/RegisterState.h>
#include <Kernel/Arch/SmapDisabler.h>
#include <Kernel/Arch/x86/SafeMem.h>
#include <Kernel/FileSystem/Custody.h>
#include <Kernel/KBufferBuilder.h>
#include <Kernel/PerformanceEventBuffer.h>
#include <Kernel/Process.h>

namespace Kernel {

PerformanceEventBuffer::PerformanceEventBuffer(NonnullOwnPtr<KBuffer> buffer)
    : m_buffer(move(buffer))
{
}
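
// Record an event on behalf of the current thread. We capture this function's
// own frame pointer so the backtrace starts at our caller; NEVER_INLINE keeps
// __builtin_frame_address(0) pointing at a real frame.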
NEVER_INLINE ErrorOr<void> PerformanceEventBuffer::append(int type, FlatPtr arg1, FlatPtr arg2, StringView arg3, Thread* current_thread, FlatPtr arg4, u64 arg5, ErrorOr<FlatPtr> arg6)
{
    FlatPtr base_pointer = (FlatPtr)__builtin_frame_address(0);
    return append_with_ip_and_bp(current_thread->pid(), current_thread->tid(), 0, base_pointer, type, 0, arg1, arg2, arg3, arg4, arg5, arg6);
}
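
// Walk the frame-pointer chain starting at `bp`, collecting saved return
// addresses into a fixed-capacity vector. safe_memcpy() lets a bogus frame
// pointer end the walk gracefully instead of faulting the kernel.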
static Vector<FlatPtr, PerformanceEvent::max_stack_frame_count> raw_backtrace(FlatPtr bp, FlatPtr ip)
{
    Vector<FlatPtr, PerformanceEvent::max_stack_frame_count> backtrace;
    if (ip != 0)
        backtrace.unchecked_append(ip);
    FlatPtr stack_ptr_copy;
    FlatPtr stack_ptr = bp;
    // FIXME: Figure out how to remove this SmapDisabler without breaking profile stacks.
    SmapDisabler disabler;
    // NOTE: The stack should always have kernel frames first, followed by userspace frames.
    //       If a userspace frame points back into kernel memory, something is afoot.
    bool is_walking_userspace_stack = false;
    while (stack_ptr) {
        void* fault_at;
        if (!safe_memcpy(&stack_ptr_copy, (void*)stack_ptr, sizeof(FlatPtr), fault_at))
            break;
        if (!Memory::is_user_address(VirtualAddress { stack_ptr })) {
            if (is_walking_userspace_stack) {
                dbgln("SHENANIGANS! Userspace stack points back into kernel memory");
                break;
            }
        } else {
            is_walking_userspace_stack = true;
        }
        FlatPtr retaddr;
        if (!safe_memcpy(&retaddr, (void*)(stack_ptr + sizeof(FlatPtr)), sizeof(FlatPtr), fault_at))
            break;
        if (retaddr == 0)
            break;
        backtrace.unchecked_append(retaddr);
        if (backtrace.size() == PerformanceEvent::max_stack_frame_count)
            break;
        stack_ptr = stack_ptr_copy;
    }
    return backtrace;
}
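
// Convenience overload: pull the instruction and base pointer out of a saved
// RegisterState (e.g. one captured by the sampling timer interrupt).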
ErrorOr<void> PerformanceEventBuffer::append_with_ip_and_bp(ProcessID pid, ThreadID tid, RegisterState const& regs,
    int type, u32 lost_samples, FlatPtr arg1, FlatPtr arg2, StringView arg3, FlatPtr arg4, u64 arg5, ErrorOr<FlatPtr> arg6)
{
    return append_with_ip_and_bp(pid, tid, regs.ip(), regs.bp(), type, lost_samples, arg1, arg2, arg3, arg4, arg5, arg6);
}
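
// Core event writer: checks for buffer space and that this event type is
// enabled in g_profiling_event_mask, rejects reentrant calls via the
// per-thread profiler enter count, then fills in the type-specific payload
// and captures a backtrace.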
ErrorOr<void> PerformanceEventBuffer::append_with_ip_and_bp(ProcessID pid, ThreadID tid,
    FlatPtr ip, FlatPtr bp, int type, u32 lost_samples, FlatPtr arg1, FlatPtr arg2, StringView arg3, FlatPtr arg4, u64 arg5, ErrorOr<FlatPtr> arg6)
{
    if (count() >= capacity())
        return ENOBUFS;

    if ((g_profiling_event_mask & type) == 0)
        return EINVAL;

    auto* current_thread = Thread::current();
    u32 enter_count = 0;
    if (current_thread)
        enter_count = current_thread->enter_profiler();
    ScopeGuard leave_profiler([&] {
        if (current_thread)
            current_thread->leave_profiler();
    });
    if (enter_count > 0)
        return EINVAL;

    PerformanceEvent event;
    event.type = type;
    event.lost_samples = lost_samples;

    switch (type) {
    case PERF_EVENT_SAMPLE:
        break;
    case PERF_EVENT_MALLOC:
        event.data.malloc.size = arg1;
        event.data.malloc.ptr = arg2;
        break;
    case PERF_EVENT_FREE:
        event.data.free.ptr = arg1;
        break;
    case PERF_EVENT_MMAP:
        event.data.mmap.ptr = arg1;
        event.data.mmap.size = arg2;
        memset(event.data.mmap.name, 0, sizeof(event.data.mmap.name));
        if (!arg3.is_empty())
            memcpy(event.data.mmap.name, arg3.characters_without_null_termination(), min(arg3.length(), sizeof(event.data.mmap.name) - 1));
        break;
    case PERF_EVENT_MUNMAP:
        event.data.munmap.ptr = arg1;
        event.data.munmap.size = arg2;
        break;
    case PERF_EVENT_PROCESS_CREATE:
        event.data.process_create.parent_pid = arg1;
        memset(event.data.process_create.executable, 0, sizeof(event.data.process_create.executable));
        if (!arg3.is_empty()) {
            memcpy(event.data.process_create.executable, arg3.characters_without_null_termination(),
                min(arg3.length(), sizeof(event.data.process_create.executable) - 1));
        }
        break;
    case PERF_EVENT_PROCESS_EXEC:
        memset(event.data.process_exec.executable, 0, sizeof(event.data.process_exec.executable));
        if (!arg3.is_empty()) {
            memcpy(event.data.process_exec.executable, arg3.characters_without_null_termination(),
                min(arg3.length(), sizeof(event.data.process_exec.executable) - 1));
        }
        break;
    case PERF_EVENT_PROCESS_EXIT:
        break;
    case PERF_EVENT_THREAD_CREATE:
        event.data.thread_create.parent_tid = arg1;
        break;
    case PERF_EVENT_THREAD_EXIT:
        break;
    case PERF_EVENT_CONTEXT_SWITCH:
        event.data.context_switch.next_pid = arg1;
        event.data.context_switch.next_tid = arg2;
        break;
    case PERF_EVENT_KMALLOC:
        event.data.kmalloc.size = arg1;
        event.data.kmalloc.ptr = arg2;
        break;
    case PERF_EVENT_KFREE:
        event.data.kfree.size = arg1;
        event.data.kfree.ptr = arg2;
        break;
    case PERF_EVENT_PAGE_FAULT:
        break;
    case PERF_EVENT_SYSCALL:
        break;
    case PERF_EVENT_SIGNPOST:
        event.data.signpost.arg1 = arg1;
        event.data.signpost.arg2 = arg2;
        break;
    case PERF_EVENT_READ:
        event.data.read.fd = arg1;
        event.data.read.size = arg2;
        event.data.read.filename_index = arg4;
        event.data.read.start_timestamp = arg5;
        event.data.read.success = !arg6.is_error();
        break;
    default:
        return EINVAL;
    }

    auto backtrace = raw_backtrace(bp, ip);
    event.stack_size = min(sizeof(event.stack) / sizeof(FlatPtr), static_cast<size_t>(backtrace.size()));
    memcpy(event.stack, backtrace.data(), event.stack_size * sizeof(FlatPtr));

    event.pid = pid.value();
    event.tid = tid.value();
    event.timestamp = TimeManagement::the().uptime_ms();
    at(m_count++) = event;
    return {};
}
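
// The backing KBuffer is treated as a flat array of PerformanceEvent records.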
PerformanceEvent& PerformanceEventBuffer::at(size_t index)
{
    VERIFY(index < capacity());
    auto* events = reinterpret_cast<PerformanceEvent*>(m_buffer->data());
    return events[index];
}
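
// Serialize the interned string table followed by every recorded event.
// For non-superusers, kernel-only events (kmalloc/kfree) are skipped and
// kernel addresses in stack traces are masked below.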
template<typename Serializer>
ErrorOr<void> PerformanceEventBuffer::to_json_impl(Serializer& object) const
{
    {
        auto strings = TRY(object.add_array("strings"));
        Vector<KString*> strings_sorted_by_index;
        TRY(strings_sorted_by_index.try_resize(m_strings.size()));

        for (auto& entry : m_strings) {
            strings_sorted_by_index[entry.value] = const_cast<Kernel::KString*>(entry.key.ptr());
        }

        for (size_t i = 0; i < m_strings.size(); i++) {
            TRY(strings.add(strings_sorted_by_index[i]->view()));
        }
        TRY(strings.finish());
    }

    bool show_kernel_addresses = Process::current().is_superuser();
    auto array = TRY(object.add_array("events"));
    bool seen_first_sample = false;
    for (size_t i = 0; i < m_count; ++i) {
        auto const& event = at(i);

        if (!show_kernel_addresses) {
            if (event.type == PERF_EVENT_KMALLOC || event.type == PERF_EVENT_KFREE)
                continue;
        }

        auto event_object = TRY(array.add_object());
        switch (event.type) {
        case PERF_EVENT_SAMPLE:
            TRY(event_object.add("type", "sample"));
            break;
        case PERF_EVENT_MALLOC:
            TRY(event_object.add("type", "malloc"));
            TRY(event_object.add("ptr", static_cast<u64>(event.data.malloc.ptr)));
            TRY(event_object.add("size", static_cast<u64>(event.data.malloc.size)));
            break;
        case PERF_EVENT_FREE:
            TRY(event_object.add("type", "free"));
            TRY(event_object.add("ptr", static_cast<u64>(event.data.free.ptr)));
            break;
        case PERF_EVENT_MMAP:
            TRY(event_object.add("type", "mmap"));
            TRY(event_object.add("ptr", static_cast<u64>(event.data.mmap.ptr)));
            TRY(event_object.add("size", static_cast<u64>(event.data.mmap.size)));
            TRY(event_object.add("name", event.data.mmap.name));
            break;
        case PERF_EVENT_MUNMAP:
            TRY(event_object.add("type", "munmap"));
            TRY(event_object.add("ptr", static_cast<u64>(event.data.munmap.ptr)));
            TRY(event_object.add("size", static_cast<u64>(event.data.munmap.size)));
            break;
        case PERF_EVENT_PROCESS_CREATE:
            TRY(event_object.add("type", "process_create"));
            TRY(event_object.add("parent_pid", static_cast<u64>(event.data.process_create.parent_pid)));
            TRY(event_object.add("executable", event.data.process_create.executable));
            break;
        case PERF_EVENT_PROCESS_EXEC:
            TRY(event_object.add("type", "process_exec"));
            TRY(event_object.add("executable", event.data.process_exec.executable));
            break;
        case PERF_EVENT_PROCESS_EXIT:
            TRY(event_object.add("type", "process_exit"));
            break;
        case PERF_EVENT_THREAD_CREATE:
            TRY(event_object.add("type", "thread_create"));
            TRY(event_object.add("parent_tid", static_cast<u64>(event.data.thread_create.parent_tid)));
            break;
        case PERF_EVENT_THREAD_EXIT:
            TRY(event_object.add("type", "thread_exit"));
            break;
        case PERF_EVENT_CONTEXT_SWITCH:
            TRY(event_object.add("type", "context_switch"));
            TRY(event_object.add("next_pid", static_cast<u64>(event.data.context_switch.next_pid)));
            TRY(event_object.add("next_tid", static_cast<u64>(event.data.context_switch.next_tid)));
            break;
        case PERF_EVENT_KMALLOC:
            TRY(event_object.add("type", "kmalloc"));
            TRY(event_object.add("ptr", static_cast<u64>(event.data.kmalloc.ptr)));
            TRY(event_object.add("size", static_cast<u64>(event.data.kmalloc.size)));
            break;
        case PERF_EVENT_KFREE:
            TRY(event_object.add("type", "kfree"));
            TRY(event_object.add("ptr", static_cast<u64>(event.data.kfree.ptr)));
            TRY(event_object.add("size", static_cast<u64>(event.data.kfree.size)));
            break;
        case PERF_EVENT_PAGE_FAULT:
            TRY(event_object.add("type", "page_fault"));
            break;
        case PERF_EVENT_SYSCALL:
            TRY(event_object.add("type", "syscall"));
            break;
        case PERF_EVENT_SIGNPOST:
            TRY(event_object.add("type"sv, "signpost"sv));
            TRY(event_object.add("arg1"sv, event.data.signpost.arg1));
            TRY(event_object.add("arg2"sv, event.data.signpost.arg2));
            break;
        case PERF_EVENT_READ:
            TRY(event_object.add("type", "read"));
            TRY(event_object.add("fd", event.data.read.fd));
            TRY(event_object.add("size"sv, event.data.read.size));
            TRY(event_object.add("filename_index"sv, event.data.read.filename_index));
            TRY(event_object.add("start_timestamp"sv, event.data.read.start_timestamp));
            TRY(event_object.add("success"sv, event.data.read.success));
            break;
        }

        TRY(event_object.add("pid", event.pid));
        TRY(event_object.add("tid", event.tid));
        TRY(event_object.add("timestamp", event.timestamp));
        TRY(event_object.add("lost_samples", seen_first_sample ? event.lost_samples : 0));
        if (event.type == PERF_EVENT_SAMPLE)
            seen_first_sample = true;

        auto stack_array = TRY(event_object.add_array("stack"));
        for (size_t j = 0; j < event.stack_size; ++j) {
            auto address = event.stack[j];
            if (!show_kernel_addresses && !Memory::is_user_address(VirtualAddress { address }))
                address = 0xdeadc0de;
            TRY(stack_array.add(address));
        }
        TRY(stack_array.finish());
        TRY(event_object.finish());
    }
    TRY(array.finish());
    TRY(object.finish());
    return {};
}
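
// Public entry point: wrap the KBufferBuilder in a JSON object serializer and
// emit the buffer contents through to_json_impl().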
ErrorOr<void> PerformanceEventBuffer::to_json(KBufferBuilder& builder) const
{
    auto object = TRY(JsonObjectSerializer<>::try_create(builder));
    return to_json_impl(object);
}
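
// Eagerly allocates the backing KBuffer; returns a null OwnPtr on allocation
// failure instead of propagating an error.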
OwnPtr<PerformanceEventBuffer> PerformanceEventBuffer::try_create_with_size(size_t buffer_size)
{
    auto buffer_or_error = KBuffer::try_create_with_size(buffer_size, Memory::Region::Access::ReadWrite, "Performance events", AllocationStrategy::AllocateNow);
    if (buffer_or_error.is_error())
        return {};
    return adopt_own_if_nonnull(new (nothrow) PerformanceEventBuffer(buffer_or_error.release_value()));
}
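
// Emit synthetic events describing an already-running process: its create or
// exec event, one THREAD_CREATE per live thread, and one MMAP per mapped
// region, so profiles started mid-run still have full context.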
ErrorOr<void> PerformanceEventBuffer::add_process(Process const& process, ProcessEventType event_type)
{
    SpinlockLocker locker(process.address_space().get_lock());

    OwnPtr<KString> executable;
    if (process.executable())
        executable = TRY(process.executable()->try_serialize_absolute_path());
    else
        executable = TRY(KString::formatted("<{}>", process.name()));

    TRY(append_with_ip_and_bp(process.pid(), 0, 0, 0,
        event_type == ProcessEventType::Create ? PERF_EVENT_PROCESS_CREATE : PERF_EVENT_PROCESS_EXEC,
        0, process.pid().value(), 0, executable->view()));

    ErrorOr<void> result;
    process.for_each_thread([&](auto& thread) {
        result = append_with_ip_and_bp(process.pid(), thread.tid().value(),
            0, 0, PERF_EVENT_THREAD_CREATE, 0, 0, 0, nullptr);
        return result.is_error() ? IterationDecision::Break : IterationDecision::Continue;
    });
    TRY(result);

    for (auto const& region : process.address_space().regions()) {
        TRY(append_with_ip_and_bp(process.pid(), 0,
            0, 0, PERF_EVENT_MMAP, 0, region.range().base().get(), region.range().size(), region.name()));
    }

    return {};
}
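
// Intern a string (e.g. a filename referenced by a read event) and return its
// index into the "strings" array emitted during serialization.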
ErrorOr<FlatPtr> PerformanceEventBuffer::register_string(NonnullOwnPtr<KString> string)
{
    auto it = m_strings.find(string);
    if (it != m_strings.end()) {
        return it->value;
    }

    auto new_index = m_strings.size();
    TRY(m_strings.try_set(move(string), move(new_index)));
    return new_index;
}

}