// PerformanceEventBuffer.cpp

/*
 * Copyright (c) 2020-2021, Andreas Kling <kling@serenityos.org>
 *
 * SPDX-License-Identifier: BSD-2-Clause
 */

#include <AK/JsonArraySerializer.h>
#include <AK/JsonObjectSerializer.h>
#include <AK/ScopeGuard.h>
#include <Kernel/Arch/RegisterState.h>
#include <Kernel/Arch/SafeMem.h>
#include <Kernel/Arch/SmapDisabler.h>
#include <Kernel/FileSystem/Custody.h>
#include <Kernel/KBufferBuilder.h>
#include <Kernel/PerformanceEventBuffer.h>
#include <Kernel/Tasks/Process.h>
#include <Kernel/Time/TimeManagement.h>
namespace Kernel {

PerformanceEventBuffer::PerformanceEventBuffer(NonnullOwnPtr<KBuffer> buffer)
    : m_buffer(move(buffer))
{
}
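
// Appends an event using the current call site as the origin of the recorded
// backtrace: the caller's frame pointer is captured here, and NEVER_INLINE
// keeps __builtin_frame_address(0) pointing at a real, distinct frame.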
NEVER_INLINE ErrorOr<void> PerformanceEventBuffer::append(int type, FlatPtr arg1, FlatPtr arg2, StringView arg3, Thread* current_thread, FlatPtr arg4, u64 arg5, ErrorOr<FlatPtr> const& arg6)
{
    FlatPtr base_pointer = (FlatPtr)__builtin_frame_address(0);
    return append_with_ip_and_bp(current_thread->pid(), current_thread->tid(), 0, base_pointer, type, 0, arg1, arg2, arg3, arg4, arg5, arg6);
}
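
// Walks the frame-pointer chain starting at bp, collecting return addresses
// until the chain ends, a frame becomes unreadable, or max_stack_frame_count
// entries have been gathered. safe_memcpy() is used so that a bad frame
// pointer faults gracefully instead of crashing the kernel.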
static Vector<FlatPtr, PerformanceEvent::max_stack_frame_count> raw_backtrace(FlatPtr bp, FlatPtr ip)
{
    Vector<FlatPtr, PerformanceEvent::max_stack_frame_count> backtrace;
    if (ip != 0)
        backtrace.unchecked_append(ip);
    FlatPtr stack_ptr_copy;
    FlatPtr stack_ptr = bp;
    // FIXME: Figure out how to remove this SmapDisabler without breaking profile stacks.
    SmapDisabler disabler;
    // NOTE: The stack should always have kernel frames first, followed by userspace frames.
    //       If a userspace frame points back into kernel memory, something is afoot.
    bool is_walking_userspace_stack = false;
    while (stack_ptr) {
        void* fault_at;
        if (!safe_memcpy(&stack_ptr_copy, (void*)stack_ptr, sizeof(FlatPtr), fault_at))
            break;
        if (!Memory::is_user_address(VirtualAddress { stack_ptr })) {
            if (is_walking_userspace_stack) {
                dbgln("SHENANIGANS! Userspace stack points back into kernel memory");
                break;
            }
        } else {
            is_walking_userspace_stack = true;
        }
        FlatPtr retaddr;
        if (!safe_memcpy(&retaddr, (void*)(stack_ptr + sizeof(FlatPtr)), sizeof(FlatPtr), fault_at))
            break;
        if (retaddr == 0)
            break;
        backtrace.unchecked_append(retaddr);
        if (backtrace.size() == PerformanceEvent::max_stack_frame_count)
            break;
        stack_ptr = stack_ptr_copy;
    }
    return backtrace;
}
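
// Convenience overload: extracts the instruction and base pointers from a
// captured RegisterState (e.g. taken at interrupt time) and forwards them.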
ErrorOr<void> PerformanceEventBuffer::append_with_ip_and_bp(ProcessID pid, ThreadID tid, RegisterState const& regs,
    int type, u32 lost_samples, FlatPtr arg1, FlatPtr arg2, StringView arg3, FlatPtr arg4, u64 arg5, ErrorOr<FlatPtr> const& arg6)
{
    return append_with_ip_and_bp(pid, tid, regs.ip(), regs.bp(), type, lost_samples, arg1, arg2, arg3, arg4, arg5, arg6);
}
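
// Core recording path: rejects the event if the buffer is full or the type is
// masked out, guards against reentrancy (an event fired while the thread is
// already inside the profiler is dropped), fills in the type-specific payload,
// captures a backtrace, and stamps the event with pid/tid/timestamp.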
ErrorOr<void> PerformanceEventBuffer::append_with_ip_and_bp(ProcessID pid, ThreadID tid,
    FlatPtr ip, FlatPtr bp, int type, u32 lost_samples, FlatPtr arg1, FlatPtr arg2, StringView arg3, FlatPtr arg4, u64 arg5, ErrorOr<FlatPtr> const& arg6)
{
    if (count() >= capacity())
        return ENOBUFS;

    if ((g_profiling_event_mask & type) == 0)
        return EINVAL;

    auto* current_thread = Thread::current();
    u32 enter_count = 0;
    if (current_thread)
        enter_count = current_thread->enter_profiler();
    ScopeGuard leave_profiler([&] {
        if (current_thread)
            current_thread->leave_profiler();
    });
    if (enter_count > 0)
        return EINVAL;

    PerformanceEvent event;
    event.type = type;
    event.lost_samples = lost_samples;

    switch (type) {
    case PERF_EVENT_SAMPLE:
        break;
    case PERF_EVENT_MALLOC:
        event.data.malloc.size = arg1;
        event.data.malloc.ptr = arg2;
        break;
    case PERF_EVENT_FREE:
        event.data.free.ptr = arg1;
        break;
    case PERF_EVENT_MMAP:
        event.data.mmap.ptr = arg1;
        event.data.mmap.size = arg2;
        memset(event.data.mmap.name, 0, sizeof(event.data.mmap.name));
        if (!arg3.is_empty())
            memcpy(event.data.mmap.name, arg3.characters_without_null_termination(), min(arg3.length(), sizeof(event.data.mmap.name) - 1));
        break;
    case PERF_EVENT_MUNMAP:
        event.data.munmap.ptr = arg1;
        event.data.munmap.size = arg2;
        break;
    case PERF_EVENT_PROCESS_CREATE:
        event.data.process_create.parent_pid = arg1;
        memset(event.data.process_create.executable, 0, sizeof(event.data.process_create.executable));
        if (!arg3.is_empty()) {
            memcpy(event.data.process_create.executable, arg3.characters_without_null_termination(),
                min(arg3.length(), sizeof(event.data.process_create.executable) - 1));
        }
        break;
    case PERF_EVENT_PROCESS_EXEC:
        memset(event.data.process_exec.executable, 0, sizeof(event.data.process_exec.executable));
        if (!arg3.is_empty()) {
            memcpy(event.data.process_exec.executable, arg3.characters_without_null_termination(),
                min(arg3.length(), sizeof(event.data.process_exec.executable) - 1));
        }
        break;
    case PERF_EVENT_PROCESS_EXIT:
        break;
    case PERF_EVENT_THREAD_CREATE:
        event.data.thread_create.parent_tid = arg1;
        break;
    case PERF_EVENT_THREAD_EXIT:
        break;
    case PERF_EVENT_CONTEXT_SWITCH:
        event.data.context_switch.next_pid = arg1;
        event.data.context_switch.next_tid = arg2;
        break;
    case PERF_EVENT_KMALLOC:
        event.data.kmalloc.size = arg1;
        event.data.kmalloc.ptr = arg2;
        break;
    case PERF_EVENT_KFREE:
        event.data.kfree.size = arg1;
        event.data.kfree.ptr = arg2;
        break;
    case PERF_EVENT_PAGE_FAULT:
        break;
    case PERF_EVENT_SYSCALL:
        break;
    case PERF_EVENT_SIGNPOST:
        event.data.signpost.arg1 = arg1;
        event.data.signpost.arg2 = arg2;
        break;
    case PERF_EVENT_READ:
        event.data.read.fd = arg1;
        event.data.read.size = arg2;
        event.data.read.filename_index = arg4;
        event.data.read.start_timestamp = arg5;
        event.data.read.success = !arg6.is_error();
        break;
    default:
        return EINVAL;
    }

    auto backtrace = raw_backtrace(bp, ip);
    event.stack_size = min(sizeof(event.stack) / sizeof(FlatPtr), static_cast<size_t>(backtrace.size()));
    memcpy(event.stack, backtrace.data(), event.stack_size * sizeof(FlatPtr));

    event.pid = pid.value();
    event.tid = tid.value();
    event.timestamp = TimeManagement::the().uptime_ms();
    at(m_count++) = event;
    return {};
}
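
// Returns a reference to the event slot at the given index; events live
// directly in the backing KBuffer as a flat array of PerformanceEvent.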
PerformanceEvent& PerformanceEventBuffer::at(size_t index)
{
    VERIFY(index < capacity());
    auto* events = reinterpret_cast<PerformanceEvent*>(m_buffer->data());
    return events[index];
}
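
// Serializes the buffer as JSON: first the registered string table in index
// order (so filename_index values in read events resolve correctly), then
// every event. Kernel-only events and kernel stack addresses are hidden from
// non-superuser callers.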
template<typename Serializer>
ErrorOr<void> PerformanceEventBuffer::to_json_impl(Serializer& object) const
{
    {
        auto strings = TRY(object.add_array("strings"sv));
        Vector<KString*> strings_sorted_by_index;
        TRY(strings_sorted_by_index.try_resize(m_strings.size()));
        for (auto& entry : m_strings) {
            strings_sorted_by_index[entry.value] = const_cast<Kernel::KString*>(entry.key.ptr());
        }
        for (size_t i = 0; i < m_strings.size(); i++) {
            TRY(strings.add(strings_sorted_by_index[i]->view()));
        }
        TRY(strings.finish());
    }

    auto current_process_credentials = Process::current().credentials();
    bool show_kernel_addresses = current_process_credentials->is_superuser();
    auto array = TRY(object.add_array("events"sv));
    bool seen_first_sample = false;
    for (size_t i = 0; i < m_count; ++i) {
        auto const& event = at(i);

        if (!show_kernel_addresses) {
            if (event.type == PERF_EVENT_KMALLOC || event.type == PERF_EVENT_KFREE)
                continue;
        }

        auto event_object = TRY(array.add_object());
        switch (event.type) {
        case PERF_EVENT_SAMPLE:
            TRY(event_object.add("type"sv, "sample"));
            break;
        case PERF_EVENT_MALLOC:
            TRY(event_object.add("type"sv, "malloc"));
            TRY(event_object.add("ptr"sv, static_cast<u64>(event.data.malloc.ptr)));
            TRY(event_object.add("size"sv, static_cast<u64>(event.data.malloc.size)));
            break;
        case PERF_EVENT_FREE:
            TRY(event_object.add("type"sv, "free"));
            TRY(event_object.add("ptr"sv, static_cast<u64>(event.data.free.ptr)));
            break;
        case PERF_EVENT_MMAP:
            TRY(event_object.add("type"sv, "mmap"));
            TRY(event_object.add("ptr"sv, static_cast<u64>(event.data.mmap.ptr)));
            TRY(event_object.add("size"sv, static_cast<u64>(event.data.mmap.size)));
            TRY(event_object.add("name"sv, event.data.mmap.name));
            break;
        case PERF_EVENT_MUNMAP:
            TRY(event_object.add("type"sv, "munmap"));
            TRY(event_object.add("ptr"sv, static_cast<u64>(event.data.munmap.ptr)));
            TRY(event_object.add("size"sv, static_cast<u64>(event.data.munmap.size)));
            break;
        case PERF_EVENT_PROCESS_CREATE:
            TRY(event_object.add("type"sv, "process_create"));
            TRY(event_object.add("parent_pid"sv, static_cast<u64>(event.data.process_create.parent_pid)));
            TRY(event_object.add("executable"sv, event.data.process_create.executable));
            break;
        case PERF_EVENT_PROCESS_EXEC:
            TRY(event_object.add("type"sv, "process_exec"));
            TRY(event_object.add("executable"sv, event.data.process_exec.executable));
            break;
        case PERF_EVENT_PROCESS_EXIT:
            TRY(event_object.add("type"sv, "process_exit"));
            break;
        case PERF_EVENT_THREAD_CREATE:
            TRY(event_object.add("type"sv, "thread_create"));
            TRY(event_object.add("parent_tid"sv, static_cast<u64>(event.data.thread_create.parent_tid)));
            break;
        case PERF_EVENT_THREAD_EXIT:
            TRY(event_object.add("type"sv, "thread_exit"));
            break;
        case PERF_EVENT_CONTEXT_SWITCH:
            TRY(event_object.add("type"sv, "context_switch"));
            TRY(event_object.add("next_pid"sv, static_cast<u64>(event.data.context_switch.next_pid)));
            TRY(event_object.add("next_tid"sv, static_cast<u64>(event.data.context_switch.next_tid)));
            break;
        case PERF_EVENT_KMALLOC:
            TRY(event_object.add("type"sv, "kmalloc"));
            TRY(event_object.add("ptr"sv, static_cast<u64>(event.data.kmalloc.ptr)));
            TRY(event_object.add("size"sv, static_cast<u64>(event.data.kmalloc.size)));
            break;
        case PERF_EVENT_KFREE:
            TRY(event_object.add("type"sv, "kfree"));
            TRY(event_object.add("ptr"sv, static_cast<u64>(event.data.kfree.ptr)));
            TRY(event_object.add("size"sv, static_cast<u64>(event.data.kfree.size)));
            break;
        case PERF_EVENT_PAGE_FAULT:
            TRY(event_object.add("type"sv, "page_fault"));
            break;
        case PERF_EVENT_SYSCALL:
            TRY(event_object.add("type"sv, "syscall"));
            break;
        case PERF_EVENT_SIGNPOST:
            TRY(event_object.add("type"sv, "signpost"sv));
            TRY(event_object.add("arg1"sv, event.data.signpost.arg1));
            TRY(event_object.add("arg2"sv, event.data.signpost.arg2));
            break;
        case PERF_EVENT_READ:
            TRY(event_object.add("type"sv, "read"));
            TRY(event_object.add("fd"sv, event.data.read.fd));
            TRY(event_object.add("size"sv, event.data.read.size));
            TRY(event_object.add("filename_index"sv, event.data.read.filename_index));
            TRY(event_object.add("start_timestamp"sv, event.data.read.start_timestamp));
            TRY(event_object.add("success"sv, event.data.read.success));
            break;
        }

        TRY(event_object.add("pid"sv, event.pid));
        TRY(event_object.add("tid"sv, event.tid));
        TRY(event_object.add("timestamp"sv, event.timestamp));
        TRY(event_object.add("lost_samples"sv, seen_first_sample ? event.lost_samples : 0));
        if (event.type == PERF_EVENT_SAMPLE)
            seen_first_sample = true;

        auto stack_array = TRY(event_object.add_array("stack"sv));
        for (size_t j = 0; j < event.stack_size; ++j) {
            auto address = event.stack[j];
            if (!show_kernel_addresses && !Memory::is_user_address(VirtualAddress { address }))
                address = 0xdeadc0de;
            TRY(stack_array.add(address));
        }
        TRY(stack_array.finish());
        TRY(event_object.finish());
    }
    TRY(array.finish());
    TRY(object.finish());
    return {};
}
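
// Public entry point: serializes the whole buffer as a JSON object into the
// supplied KBufferBuilder.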
ErrorOr<void> PerformanceEventBuffer::to_json(KBufferBuilder& builder) const
{
    auto object = TRY(JsonObjectSerializer<>::try_create(builder));
    return to_json_impl(object);
}
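
// Allocates the backing KBuffer eagerly (AllocationStrategy::AllocateNow) so
// that recording events never has to allocate; returns null on failure.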
OwnPtr<PerformanceEventBuffer> PerformanceEventBuffer::try_create_with_size(size_t buffer_size)
{
    auto buffer_or_error = KBuffer::try_create_with_size("Performance events"sv, buffer_size, Memory::Region::Access::ReadWrite, AllocationStrategy::AllocateNow);
    if (buffer_or_error.is_error())
        return {};
    return adopt_own_if_nonnull(new (nothrow) PerformanceEventBuffer(buffer_or_error.release_value()));
}
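
// Seeds the buffer with synthetic events describing an already-running
// process: a create/exec event carrying its executable path, one
// thread_create event per live thread, and one mmap event per memory region,
// so the profile has full context before the first real sample arrives.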
ErrorOr<void> PerformanceEventBuffer::add_process(Process const& process, ProcessEventType event_type)
{
    OwnPtr<KString> executable;
    if (process.executable()) {
        executable = TRY(process.executable()->try_serialize_absolute_path());
    } else {
        executable = TRY(process.name().with([&](auto& process_name) {
            return KString::formatted("<{}>", process_name->view());
        }));
    }

    TRY(append_with_ip_and_bp(process.pid(), 0, 0, 0,
        event_type == ProcessEventType::Create ? PERF_EVENT_PROCESS_CREATE : PERF_EVENT_PROCESS_EXEC,
        0, process.pid().value(), 0, executable->view()));

    ErrorOr<void> result;
    process.for_each_thread([&](auto& thread) {
        result = append_with_ip_and_bp(process.pid(), thread.tid().value(),
            0, 0, PERF_EVENT_THREAD_CREATE, 0, 0, 0, {});
        return result.is_error() ? IterationDecision::Break : IterationDecision::Continue;
    });
    TRY(result);

    return process.address_space().with([&](auto& space) -> ErrorOr<void> {
        for (auto const& region : space->region_tree().regions()) {
            TRY(append_with_ip_and_bp(process.pid(), 0,
                0, 0, PERF_EVENT_MMAP, 0, region.range().base().get(), region.range().size(), region.name()));
        }
        return {};
    });
}
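
// Interns a string (e.g. a filename referenced by a read event) and returns
// its stable index into the "strings" array emitted by to_json_impl().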
ErrorOr<FlatPtr> PerformanceEventBuffer::register_string(NonnullOwnPtr<KString> string)
{
    auto it = m_strings.find(string);
    if (it != m_strings.end()) {
        return it->value;
    }

    auto new_index = m_strings.size();
    TRY(m_strings.try_set(move(string), new_index));
    return new_index;
}

}