PerformanceEventBuffer.cpp 9.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253
  1. /*
  2. * Copyright (c) 2020-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <AK/JsonArraySerializer.h>
  7. #include <AK/JsonObject.h>
  8. #include <AK/JsonObjectSerializer.h>
  9. #include <Kernel/Arch/x86/SmapDisabler.h>
  10. #include <Kernel/FileSystem/Custody.h>
  11. #include <Kernel/KBufferBuilder.h>
  12. #include <Kernel/PerformanceEventBuffer.h>
  13. #include <Kernel/Process.h>
  14. namespace Kernel {
  15. PerformanceEventBuffer::PerformanceEventBuffer(NonnullOwnPtr<KBuffer> buffer)
  16. : m_buffer(move(buffer))
  17. {
  18. }
  19. NEVER_INLINE KResult PerformanceEventBuffer::append(int type, FlatPtr arg1, FlatPtr arg2, const StringView& arg3, Thread* current_thread)
  20. {
  21. FlatPtr ebp;
  22. asm volatile("movl %%ebp, %%eax"
  23. : "=a"(ebp));
  24. return append_with_eip_and_ebp(current_thread->pid(), current_thread->tid(), 0, ebp, type, 0, arg1, arg2, arg3);
  25. }
  26. static Vector<FlatPtr, PerformanceEvent::max_stack_frame_count> raw_backtrace(FlatPtr ebp, FlatPtr eip)
  27. {
  28. Vector<FlatPtr, PerformanceEvent::max_stack_frame_count> backtrace;
  29. if (eip != 0)
  30. backtrace.append(eip);
  31. FlatPtr stack_ptr_copy;
  32. FlatPtr stack_ptr = (FlatPtr)ebp;
  33. // FIXME: Figure out how to remove this SmapDisabler without breaking profile stacks.
  34. SmapDisabler disabler;
  35. while (stack_ptr) {
  36. void* fault_at;
  37. if (!safe_memcpy(&stack_ptr_copy, (void*)stack_ptr, sizeof(FlatPtr), fault_at))
  38. break;
  39. FlatPtr retaddr;
  40. if (!safe_memcpy(&retaddr, (void*)(stack_ptr + sizeof(FlatPtr)), sizeof(FlatPtr), fault_at))
  41. break;
  42. if (retaddr == 0)
  43. break;
  44. backtrace.append(retaddr);
  45. if (backtrace.size() == PerformanceEvent::max_stack_frame_count)
  46. break;
  47. stack_ptr = stack_ptr_copy;
  48. }
  49. return backtrace;
  50. }
  51. KResult PerformanceEventBuffer::append_with_eip_and_ebp(ProcessID pid, ThreadID tid,
  52. u32 eip, u32 ebp, int type, u32 lost_samples, FlatPtr arg1, FlatPtr arg2, const StringView& arg3)
  53. {
  54. if (count() >= capacity())
  55. return ENOBUFS;
  56. if ((g_profiling_event_mask & type) == 0)
  57. return EINVAL;
  58. PerformanceEvent event;
  59. event.type = type;
  60. event.lost_samples = lost_samples;
  61. switch (type) {
  62. case PERF_EVENT_SAMPLE:
  63. break;
  64. case PERF_EVENT_MALLOC:
  65. event.data.malloc.size = arg1;
  66. event.data.malloc.ptr = arg2;
  67. break;
  68. case PERF_EVENT_FREE:
  69. event.data.free.ptr = arg1;
  70. break;
  71. case PERF_EVENT_MMAP:
  72. event.data.mmap.ptr = arg1;
  73. event.data.mmap.size = arg2;
  74. memset(event.data.mmap.name, 0, sizeof(event.data.mmap.name));
  75. if (!arg3.is_empty())
  76. memcpy(event.data.mmap.name, arg3.characters_without_null_termination(), min(arg3.length(), sizeof(event.data.mmap.name) - 1));
  77. break;
  78. case PERF_EVENT_MUNMAP:
  79. event.data.munmap.ptr = arg1;
  80. event.data.munmap.size = arg2;
  81. break;
  82. case PERF_EVENT_PROCESS_CREATE:
  83. event.data.process_create.parent_pid = arg1;
  84. memset(event.data.process_create.executable, 0, sizeof(event.data.process_create.executable));
  85. if (!arg3.is_empty()) {
  86. memcpy(event.data.process_create.executable, arg3.characters_without_null_termination(),
  87. min(arg3.length(), sizeof(event.data.process_create.executable) - 1));
  88. }
  89. break;
  90. case PERF_EVENT_PROCESS_EXEC:
  91. memset(event.data.process_exec.executable, 0, sizeof(event.data.process_exec.executable));
  92. if (!arg3.is_empty()) {
  93. memcpy(event.data.process_exec.executable, arg3.characters_without_null_termination(),
  94. min(arg3.length(), sizeof(event.data.process_exec.executable) - 1));
  95. }
  96. break;
  97. case PERF_EVENT_PROCESS_EXIT:
  98. break;
  99. case PERF_EVENT_THREAD_CREATE:
  100. event.data.thread_create.parent_tid = arg1;
  101. break;
  102. case PERF_EVENT_THREAD_EXIT:
  103. break;
  104. case PERF_EVENT_CONTEXT_SWITCH:
  105. event.data.context_switch.next_pid = arg1;
  106. event.data.context_switch.next_tid = arg2;
  107. break;
  108. default:
  109. return EINVAL;
  110. }
  111. auto backtrace = raw_backtrace(ebp, eip);
  112. event.stack_size = min(sizeof(event.stack) / sizeof(FlatPtr), static_cast<size_t>(backtrace.size()));
  113. memcpy(event.stack, backtrace.data(), event.stack_size * sizeof(FlatPtr));
  114. event.pid = pid.value();
  115. event.tid = tid.value();
  116. event.timestamp = TimeManagement::the().uptime_ms();
  117. at(m_count++) = event;
  118. return KSuccess;
  119. }
  120. PerformanceEvent& PerformanceEventBuffer::at(size_t index)
  121. {
  122. VERIFY(index < capacity());
  123. auto* events = reinterpret_cast<PerformanceEvent*>(m_buffer->data());
  124. return events[index];
  125. }
  126. template<typename Serializer>
  127. bool PerformanceEventBuffer::to_json_impl(Serializer& object) const
  128. {
  129. auto array = object.add_array("events");
  130. bool seen_first_sample = false;
  131. for (size_t i = 0; i < m_count; ++i) {
  132. auto& event = at(i);
  133. auto event_object = array.add_object();
  134. switch (event.type) {
  135. case PERF_EVENT_SAMPLE:
  136. event_object.add("type", "sample");
  137. break;
  138. case PERF_EVENT_MALLOC:
  139. event_object.add("type", "malloc");
  140. event_object.add("ptr", static_cast<u64>(event.data.malloc.ptr));
  141. event_object.add("size", static_cast<u64>(event.data.malloc.size));
  142. break;
  143. case PERF_EVENT_FREE:
  144. event_object.add("type", "free");
  145. event_object.add("ptr", static_cast<u64>(event.data.free.ptr));
  146. break;
  147. case PERF_EVENT_MMAP:
  148. event_object.add("type", "mmap");
  149. event_object.add("ptr", static_cast<u64>(event.data.mmap.ptr));
  150. event_object.add("size", static_cast<u64>(event.data.mmap.size));
  151. event_object.add("name", event.data.mmap.name);
  152. break;
  153. case PERF_EVENT_MUNMAP:
  154. event_object.add("type", "munmap");
  155. event_object.add("ptr", static_cast<u64>(event.data.munmap.ptr));
  156. event_object.add("size", static_cast<u64>(event.data.munmap.size));
  157. break;
  158. case PERF_EVENT_PROCESS_CREATE:
  159. event_object.add("type", "process_create");
  160. event_object.add("parent_pid", static_cast<u64>(event.data.process_create.parent_pid));
  161. event_object.add("executable", event.data.process_create.executable);
  162. break;
  163. case PERF_EVENT_PROCESS_EXEC:
  164. event_object.add("type", "process_exec");
  165. event_object.add("executable", event.data.process_exec.executable);
  166. break;
  167. case PERF_EVENT_PROCESS_EXIT:
  168. event_object.add("type", "process_exit");
  169. break;
  170. case PERF_EVENT_THREAD_CREATE:
  171. event_object.add("type", "thread_create");
  172. event_object.add("parent_tid", static_cast<u64>(event.data.thread_create.parent_tid));
  173. break;
  174. case PERF_EVENT_THREAD_EXIT:
  175. event_object.add("type", "thread_exit");
  176. break;
  177. case PERF_EVENT_CONTEXT_SWITCH:
  178. event_object.add("type", "context_switch");
  179. event_object.add("next_pid", static_cast<u64>(event.data.context_switch.next_pid));
  180. event_object.add("next_tid", static_cast<u64>(event.data.context_switch.next_tid));
  181. break;
  182. }
  183. event_object.add("pid", event.pid);
  184. event_object.add("tid", event.tid);
  185. event_object.add("timestamp", event.timestamp);
  186. event_object.add("lost_samples", seen_first_sample ? event.lost_samples : 0);
  187. if (event.type == PERF_EVENT_SAMPLE)
  188. seen_first_sample = true;
  189. auto stack_array = event_object.add_array("stack");
  190. for (size_t j = 0; j < event.stack_size; ++j) {
  191. stack_array.add(event.stack[j]);
  192. }
  193. stack_array.finish();
  194. event_object.finish();
  195. }
  196. array.finish();
  197. object.finish();
  198. return true;
  199. }
  200. bool PerformanceEventBuffer::to_json(KBufferBuilder& builder) const
  201. {
  202. JsonObjectSerializer object(builder);
  203. return to_json_impl(object);
  204. }
  205. OwnPtr<PerformanceEventBuffer> PerformanceEventBuffer::try_create_with_size(size_t buffer_size)
  206. {
  207. auto buffer = KBuffer::try_create_with_size(buffer_size, Region::Access::Read | Region::Access::Write, "Performance events", AllocationStrategy::AllocateNow);
  208. if (!buffer)
  209. return {};
  210. return adopt_own(*new PerformanceEventBuffer(buffer.release_nonnull()));
  211. }
  212. void PerformanceEventBuffer::add_process(const Process& process, ProcessEventType event_type)
  213. {
  214. ScopedSpinLock locker(process.space().get_lock());
  215. String executable;
  216. if (process.executable())
  217. executable = process.executable()->absolute_path();
  218. else
  219. executable = String::formatted("<{}>", process.name());
  220. [[maybe_unused]] auto rc = append_with_eip_and_ebp(process.pid(), 0, 0, 0,
  221. event_type == ProcessEventType::Create ? PERF_EVENT_PROCESS_CREATE : PERF_EVENT_PROCESS_EXEC,
  222. 0, process.pid().value(), 0, executable);
  223. process.for_each_thread([&](auto& thread) {
  224. [[maybe_unused]] auto rc = append_with_eip_and_ebp(process.pid(), thread.tid().value(),
  225. 0, 0, PERF_EVENT_THREAD_CREATE, 0, 0, 0, nullptr);
  226. });
  227. for (auto& region : process.space().regions()) {
  228. [[maybe_unused]] auto rc = append_with_eip_and_ebp(process.pid(), 0,
  229. 0, 0, PERF_EVENT_MMAP, 0, region->range().base().get(), region->range().size(), region->name());
  230. }
  231. }
  232. }