// PerformanceEventBuffer.cpp (12 KB)
  1. /*
  2. * Copyright (c) 2020-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <AK/JsonArraySerializer.h>
  7. #include <AK/JsonObjectSerializer.h>
  8. #include <AK/ScopeGuard.h>
  9. #include <Kernel/Arch/RegisterState.h>
  10. #include <Kernel/Arch/SmapDisabler.h>
  11. #include <Kernel/FileSystem/Custody.h>
  12. #include <Kernel/KBufferBuilder.h>
  13. #include <Kernel/PerformanceEventBuffer.h>
  14. #include <Kernel/Process.h>
  15. namespace Kernel {
  16. PerformanceEventBuffer::PerformanceEventBuffer(NonnullOwnPtr<KBuffer> buffer)
  17. : m_buffer(move(buffer))
  18. {
  19. }
  20. NEVER_INLINE ErrorOr<void> PerformanceEventBuffer::append(int type, FlatPtr arg1, FlatPtr arg2, const StringView& arg3, Thread* current_thread)
  21. {
  22. FlatPtr ebp;
  23. asm volatile("movl %%ebp, %%eax"
  24. : "=a"(ebp));
  25. return append_with_ip_and_bp(current_thread->pid(), current_thread->tid(), 0, ebp, type, 0, arg1, arg2, arg3);
  26. }
  27. static Vector<FlatPtr, PerformanceEvent::max_stack_frame_count> raw_backtrace(FlatPtr bp, FlatPtr ip)
  28. {
  29. Vector<FlatPtr, PerformanceEvent::max_stack_frame_count> backtrace;
  30. if (ip != 0)
  31. backtrace.append(ip);
  32. FlatPtr stack_ptr_copy;
  33. FlatPtr stack_ptr = bp;
  34. // FIXME: Figure out how to remove this SmapDisabler without breaking profile stacks.
  35. SmapDisabler disabler;
  36. while (stack_ptr) {
  37. void* fault_at;
  38. if (!safe_memcpy(&stack_ptr_copy, (void*)stack_ptr, sizeof(FlatPtr), fault_at))
  39. break;
  40. FlatPtr retaddr;
  41. if (!safe_memcpy(&retaddr, (void*)(stack_ptr + sizeof(FlatPtr)), sizeof(FlatPtr), fault_at))
  42. break;
  43. if (retaddr == 0)
  44. break;
  45. backtrace.append(retaddr);
  46. if (backtrace.size() == PerformanceEvent::max_stack_frame_count)
  47. break;
  48. stack_ptr = stack_ptr_copy;
  49. }
  50. return backtrace;
  51. }
  52. ErrorOr<void> PerformanceEventBuffer::append_with_ip_and_bp(ProcessID pid, ThreadID tid, const RegisterState& regs,
  53. int type, u32 lost_samples, FlatPtr arg1, FlatPtr arg2, const StringView& arg3)
  54. {
  55. return append_with_ip_and_bp(pid, tid, regs.ip(), regs.bp(), type, lost_samples, arg1, arg2, arg3);
  56. }
  57. ErrorOr<void> PerformanceEventBuffer::append_with_ip_and_bp(ProcessID pid, ThreadID tid,
  58. FlatPtr ip, FlatPtr bp, int type, u32 lost_samples, FlatPtr arg1, FlatPtr arg2, const StringView& arg3)
  59. {
  60. if (count() >= capacity())
  61. return ENOBUFS;
  62. if ((g_profiling_event_mask & type) == 0)
  63. return EINVAL;
  64. auto current_thread = Thread::current();
  65. u32 enter_count = 0;
  66. if (current_thread)
  67. enter_count = current_thread->enter_profiler();
  68. ScopeGuard leave_profiler([&] {
  69. if (current_thread)
  70. current_thread->leave_profiler();
  71. });
  72. if (enter_count > 0)
  73. return EINVAL;
  74. PerformanceEvent event;
  75. event.type = type;
  76. event.lost_samples = lost_samples;
  77. switch (type) {
  78. case PERF_EVENT_SAMPLE:
  79. break;
  80. case PERF_EVENT_MALLOC:
  81. event.data.malloc.size = arg1;
  82. event.data.malloc.ptr = arg2;
  83. break;
  84. case PERF_EVENT_FREE:
  85. event.data.free.ptr = arg1;
  86. break;
  87. case PERF_EVENT_MMAP:
  88. event.data.mmap.ptr = arg1;
  89. event.data.mmap.size = arg2;
  90. memset(event.data.mmap.name, 0, sizeof(event.data.mmap.name));
  91. if (!arg3.is_empty())
  92. memcpy(event.data.mmap.name, arg3.characters_without_null_termination(), min(arg3.length(), sizeof(event.data.mmap.name) - 1));
  93. break;
  94. case PERF_EVENT_MUNMAP:
  95. event.data.munmap.ptr = arg1;
  96. event.data.munmap.size = arg2;
  97. break;
  98. case PERF_EVENT_PROCESS_CREATE:
  99. event.data.process_create.parent_pid = arg1;
  100. memset(event.data.process_create.executable, 0, sizeof(event.data.process_create.executable));
  101. if (!arg3.is_empty()) {
  102. memcpy(event.data.process_create.executable, arg3.characters_without_null_termination(),
  103. min(arg3.length(), sizeof(event.data.process_create.executable) - 1));
  104. }
  105. break;
  106. case PERF_EVENT_PROCESS_EXEC:
  107. memset(event.data.process_exec.executable, 0, sizeof(event.data.process_exec.executable));
  108. if (!arg3.is_empty()) {
  109. memcpy(event.data.process_exec.executable, arg3.characters_without_null_termination(),
  110. min(arg3.length(), sizeof(event.data.process_exec.executable) - 1));
  111. }
  112. break;
  113. case PERF_EVENT_PROCESS_EXIT:
  114. break;
  115. case PERF_EVENT_THREAD_CREATE:
  116. event.data.thread_create.parent_tid = arg1;
  117. break;
  118. case PERF_EVENT_THREAD_EXIT:
  119. break;
  120. case PERF_EVENT_CONTEXT_SWITCH:
  121. event.data.context_switch.next_pid = arg1;
  122. event.data.context_switch.next_tid = arg2;
  123. break;
  124. case PERF_EVENT_KMALLOC:
  125. event.data.kmalloc.size = arg1;
  126. event.data.kmalloc.ptr = arg2;
  127. break;
  128. case PERF_EVENT_KFREE:
  129. event.data.kfree.size = arg1;
  130. event.data.kfree.ptr = arg2;
  131. break;
  132. case PERF_EVENT_PAGE_FAULT:
  133. break;
  134. case PERF_EVENT_SYSCALL:
  135. break;
  136. case PERF_EVENT_SIGNPOST:
  137. event.data.signpost.arg1 = arg1;
  138. event.data.signpost.arg2 = arg2;
  139. break;
  140. default:
  141. return EINVAL;
  142. }
  143. auto backtrace = raw_backtrace(bp, ip);
  144. event.stack_size = min(sizeof(event.stack) / sizeof(FlatPtr), static_cast<size_t>(backtrace.size()));
  145. memcpy(event.stack, backtrace.data(), event.stack_size * sizeof(FlatPtr));
  146. event.pid = pid.value();
  147. event.tid = tid.value();
  148. event.timestamp = TimeManagement::the().uptime_ms();
  149. at(m_count++) = event;
  150. return {};
  151. }
  152. PerformanceEvent& PerformanceEventBuffer::at(size_t index)
  153. {
  154. VERIFY(index < capacity());
  155. auto* events = reinterpret_cast<PerformanceEvent*>(m_buffer->data());
  156. return events[index];
  157. }
  158. template<typename Serializer>
  159. ErrorOr<void> PerformanceEventBuffer::to_json_impl(Serializer& object) const
  160. {
  161. {
  162. auto strings = object.add_array("strings");
  163. for (auto& it : m_strings) {
  164. strings.add(it->view());
  165. }
  166. }
  167. auto array = object.add_array("events");
  168. bool seen_first_sample = false;
  169. for (size_t i = 0; i < m_count; ++i) {
  170. auto& event = at(i);
  171. auto event_object = array.add_object();
  172. switch (event.type) {
  173. case PERF_EVENT_SAMPLE:
  174. event_object.add("type", "sample");
  175. break;
  176. case PERF_EVENT_MALLOC:
  177. event_object.add("type", "malloc");
  178. event_object.add("ptr", static_cast<u64>(event.data.malloc.ptr));
  179. event_object.add("size", static_cast<u64>(event.data.malloc.size));
  180. break;
  181. case PERF_EVENT_FREE:
  182. event_object.add("type", "free");
  183. event_object.add("ptr", static_cast<u64>(event.data.free.ptr));
  184. break;
  185. case PERF_EVENT_MMAP:
  186. event_object.add("type", "mmap");
  187. event_object.add("ptr", static_cast<u64>(event.data.mmap.ptr));
  188. event_object.add("size", static_cast<u64>(event.data.mmap.size));
  189. event_object.add("name", event.data.mmap.name);
  190. break;
  191. case PERF_EVENT_MUNMAP:
  192. event_object.add("type", "munmap");
  193. event_object.add("ptr", static_cast<u64>(event.data.munmap.ptr));
  194. event_object.add("size", static_cast<u64>(event.data.munmap.size));
  195. break;
  196. case PERF_EVENT_PROCESS_CREATE:
  197. event_object.add("type", "process_create");
  198. event_object.add("parent_pid", static_cast<u64>(event.data.process_create.parent_pid));
  199. event_object.add("executable", event.data.process_create.executable);
  200. break;
  201. case PERF_EVENT_PROCESS_EXEC:
  202. event_object.add("type", "process_exec");
  203. event_object.add("executable", event.data.process_exec.executable);
  204. break;
  205. case PERF_EVENT_PROCESS_EXIT:
  206. event_object.add("type", "process_exit");
  207. break;
  208. case PERF_EVENT_THREAD_CREATE:
  209. event_object.add("type", "thread_create");
  210. event_object.add("parent_tid", static_cast<u64>(event.data.thread_create.parent_tid));
  211. break;
  212. case PERF_EVENT_THREAD_EXIT:
  213. event_object.add("type", "thread_exit");
  214. break;
  215. case PERF_EVENT_CONTEXT_SWITCH:
  216. event_object.add("type", "context_switch");
  217. event_object.add("next_pid", static_cast<u64>(event.data.context_switch.next_pid));
  218. event_object.add("next_tid", static_cast<u64>(event.data.context_switch.next_tid));
  219. break;
  220. case PERF_EVENT_KMALLOC:
  221. event_object.add("type", "kmalloc");
  222. event_object.add("ptr", static_cast<u64>(event.data.kmalloc.ptr));
  223. event_object.add("size", static_cast<u64>(event.data.kmalloc.size));
  224. break;
  225. case PERF_EVENT_KFREE:
  226. event_object.add("type", "kfree");
  227. event_object.add("ptr", static_cast<u64>(event.data.kfree.ptr));
  228. event_object.add("size", static_cast<u64>(event.data.kfree.size));
  229. break;
  230. case PERF_EVENT_PAGE_FAULT:
  231. event_object.add("type", "page_fault");
  232. break;
  233. case PERF_EVENT_SYSCALL:
  234. event_object.add("type", "syscall");
  235. break;
  236. case PERF_EVENT_SIGNPOST:
  237. event_object.add("type"sv, "signpost"sv);
  238. event_object.add("arg1"sv, event.data.signpost.arg1);
  239. event_object.add("arg2"sv, event.data.signpost.arg2);
  240. break;
  241. }
  242. event_object.add("pid", event.pid);
  243. event_object.add("tid", event.tid);
  244. event_object.add("timestamp", event.timestamp);
  245. event_object.add("lost_samples", seen_first_sample ? event.lost_samples : 0);
  246. if (event.type == PERF_EVENT_SAMPLE)
  247. seen_first_sample = true;
  248. auto stack_array = event_object.add_array("stack");
  249. for (size_t j = 0; j < event.stack_size; ++j) {
  250. stack_array.add(event.stack[j]);
  251. }
  252. stack_array.finish();
  253. event_object.finish();
  254. }
  255. array.finish();
  256. object.finish();
  257. return {};
  258. }
  259. ErrorOr<void> PerformanceEventBuffer::to_json(KBufferBuilder& builder) const
  260. {
  261. JsonObjectSerializer object(builder);
  262. return to_json_impl(object);
  263. }
  264. OwnPtr<PerformanceEventBuffer> PerformanceEventBuffer::try_create_with_size(size_t buffer_size)
  265. {
  266. auto buffer_or_error = KBuffer::try_create_with_size(buffer_size, Memory::Region::Access::ReadWrite, "Performance events", AllocationStrategy::AllocateNow);
  267. if (buffer_or_error.is_error())
  268. return {};
  269. return adopt_own_if_nonnull(new (nothrow) PerformanceEventBuffer(buffer_or_error.release_value()));
  270. }
  271. void PerformanceEventBuffer::add_process(const Process& process, ProcessEventType event_type)
  272. {
  273. SpinlockLocker locker(process.address_space().get_lock());
  274. String executable;
  275. if (process.executable())
  276. executable = process.executable()->absolute_path();
  277. else
  278. executable = String::formatted("<{}>", process.name());
  279. [[maybe_unused]] auto rc = append_with_ip_and_bp(process.pid(), 0, 0, 0,
  280. event_type == ProcessEventType::Create ? PERF_EVENT_PROCESS_CREATE : PERF_EVENT_PROCESS_EXEC,
  281. 0, process.pid().value(), 0, executable);
  282. process.for_each_thread([&](auto& thread) {
  283. [[maybe_unused]] auto rc = append_with_ip_and_bp(process.pid(), thread.tid().value(),
  284. 0, 0, PERF_EVENT_THREAD_CREATE, 0, 0, 0, nullptr);
  285. });
  286. for (auto& region : process.address_space().regions()) {
  287. [[maybe_unused]] auto rc = append_with_ip_and_bp(process.pid(), 0,
  288. 0, 0, PERF_EVENT_MMAP, 0, region->range().base().get(), region->range().size(), region->name());
  289. }
  290. }
  291. ErrorOr<FlatPtr> PerformanceEventBuffer::register_string(NonnullOwnPtr<KString> string)
  292. {
  293. FlatPtr string_id = m_strings.size();
  294. TRY(m_strings.try_set(move(string)));
  295. return string_id;
  296. }
  297. }