mirror of
				https://github.com/RGBCube/serenity
				synced 2025-10-25 08:42:06 +00:00 
			
		
		
		
	 eb798d5538
			
		
	
	
		eb798d5538
		
	
	
	
	
		
			
			This turns the perfcore format into more of a log than it was before, which lets us properly log process, thread and region creation/destruction. This also makes it unnecessary to dump the process' regions every time it is scheduled like we did before. Incidentally this also fixes 'profile -c' because we previously ended up incorrectly dumping the parent's region map into the profile data. Log-based mmap support enables profiling shared libraries which are loaded at runtime, e.g. via dlopen(). This enables profiling both the parent and child process for programs which use execve(). Previously we'd discard the profiling data for the old process. The Profiler tool has been updated to not treat thread IDs as process IDs anymore. This enables support for processes with more than one thread. Also, there's a new widget to filter which process should be displayed.
		
			
				
	
	
		
			461 lines
		
	
	
	
		
			15 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			461 lines
		
	
	
	
		
			15 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
 | |
|  *
 | |
|  * SPDX-License-Identifier: BSD-2-Clause
 | |
|  */
 | |
| 
 | |
| #include "Profile.h"
 | |
| #include "DisassemblyModel.h"
 | |
| #include "ProfileModel.h"
 | |
| #include "SamplesModel.h"
 | |
| #include <AK/HashTable.h>
 | |
| #include <AK/LexicalPath.h>
 | |
| #include <AK/MappedFile.h>
 | |
| #include <AK/NonnullOwnPtrVector.h>
 | |
| #include <AK/QuickSort.h>
 | |
| #include <AK/RefPtr.h>
 | |
| #include <LibCore/File.h>
 | |
| #include <LibELF/Image.h>
 | |
| #include <sys/stat.h>
 | |
| 
 | |
| static void sort_profile_nodes(Vector<NonnullRefPtr<ProfileNode>>& nodes)
 | |
| {
 | |
|     quick_sort(nodes.begin(), nodes.end(), [](auto& a, auto& b) {
 | |
|         return a->event_count() >= b->event_count();
 | |
|     });
 | |
| 
 | |
|     for (auto& child : nodes)
 | |
|         child->sort_children();
 | |
| }
 | |
| 
 | |
| Profile::Profile(Vector<Process> processes, Vector<Event> events)
 | |
|     : m_processes(move(processes))
 | |
|     , m_events(move(events))
 | |
| {
 | |
|     m_first_timestamp = m_events.first().timestamp;
 | |
|     m_last_timestamp = m_events.last().timestamp;
 | |
| 
 | |
|     m_model = ProfileModel::create(*this);
 | |
|     m_samples_model = SamplesModel::create(*this);
 | |
| 
 | |
|     for (auto& event : m_events) {
 | |
|         m_deepest_stack_depth = max((u32)event.frames.size(), m_deepest_stack_depth);
 | |
|     }
 | |
| 
 | |
|     rebuild_tree();
 | |
| }
 | |
| 
 | |
| Profile::~Profile()
 | |
| {
 | |
| }
 | |
| 
 | |
| GUI::Model& Profile::model()
 | |
| {
 | |
|     return *m_model;
 | |
| }
 | |
| 
 | |
| GUI::Model& Profile::samples_model()
 | |
| {
 | |
|     return *m_samples_model;
 | |
| }
 | |
| 
 | |
| void Profile::rebuild_tree()
 | |
| {
 | |
|     Vector<NonnullRefPtr<ProfileNode>> roots;
 | |
| 
 | |
|     auto find_or_create_root = [&roots](FlyString object_name, String symbol, u32 address, u32 offset, u64 timestamp, pid_t pid) -> ProfileNode& {
 | |
|         for (auto root : roots) {
 | |
|             if (root->symbol() == symbol) {
 | |
|                 return root;
 | |
|             }
 | |
|         }
 | |
|         auto new_root = ProfileNode::create(move(object_name), move(symbol), address, offset, timestamp, pid);
 | |
|         roots.append(new_root);
 | |
|         return new_root;
 | |
|     };
 | |
| 
 | |
|     HashTable<FlatPtr> live_allocations;
 | |
| 
 | |
|     for_each_event_in_filter_range([&](auto& event) {
 | |
|         if (event.type == "malloc")
 | |
|             live_allocations.set(event.ptr);
 | |
|         else if (event.type == "free")
 | |
|             live_allocations.remove(event.ptr);
 | |
|     });
 | |
| 
 | |
|     m_filtered_event_indices.clear();
 | |
| 
 | |
|     for (size_t event_index = 0; event_index < m_events.size(); ++event_index) {
 | |
|         auto& event = m_events.at(event_index);
 | |
| 
 | |
|         if (has_timestamp_filter_range()) {
 | |
|             auto timestamp = event.timestamp;
 | |
|             if (timestamp < m_timestamp_filter_range_start || timestamp > m_timestamp_filter_range_end)
 | |
|                 continue;
 | |
|         }
 | |
| 
 | |
|         if (has_process_filter()) {
 | |
|             if (event.pid != m_process_filter_pid || event.timestamp < m_process_filter_start_valid || event.timestamp > m_process_filter_end_valid)
 | |
|                 continue;
 | |
|         }
 | |
| 
 | |
|         m_filtered_event_indices.append(event_index);
 | |
| 
 | |
|         if (event.type == "malloc" && !live_allocations.contains(event.ptr))
 | |
|             continue;
 | |
| 
 | |
|         if (event.type == "free")
 | |
|             continue;
 | |
| 
 | |
|         auto for_each_frame = [&]<typename Callback>(Callback callback) {
 | |
|             if (!m_inverted) {
 | |
|                 for (size_t i = 0; i < event.frames.size(); ++i) {
 | |
|                     if (callback(event.frames.at(i), i == event.frames.size() - 1) == IterationDecision::Break)
 | |
|                         break;
 | |
|                 }
 | |
|             } else {
 | |
|                 for (ssize_t i = event.frames.size() - 1; i >= 0; --i) {
 | |
|                     if (callback(event.frames.at(i), static_cast<size_t>(i) == event.frames.size() - 1) == IterationDecision::Break)
 | |
|                         break;
 | |
|                 }
 | |
|             }
 | |
|         };
 | |
| 
 | |
|         if (!m_show_top_functions) {
 | |
|             ProfileNode* node = nullptr;
 | |
|             for_each_frame([&](const Frame& frame, bool is_innermost_frame) {
 | |
|                 auto& object_name = frame.object_name;
 | |
|                 auto& symbol = frame.symbol;
 | |
|                 auto& address = frame.address;
 | |
|                 auto& offset = frame.offset;
 | |
| 
 | |
|                 if (symbol.is_empty())
 | |
|                     return IterationDecision::Break;
 | |
| 
 | |
|                 // FIXME: More cheating with intentional mixing of TID/PID here:
 | |
|                 if (!node)
 | |
|                     node = &find_or_create_root(object_name, symbol, address, offset, event.timestamp, event.pid);
 | |
|                 else
 | |
|                     node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
 | |
| 
 | |
|                 node->increment_event_count();
 | |
|                 if (is_innermost_frame) {
 | |
|                     node->add_event_address(address);
 | |
|                     node->increment_self_count();
 | |
|                 }
 | |
|                 return IterationDecision::Continue;
 | |
|             });
 | |
|         } else {
 | |
|             for (size_t i = 0; i < event.frames.size(); ++i) {
 | |
|                 ProfileNode* node = nullptr;
 | |
|                 ProfileNode* root = nullptr;
 | |
|                 for (size_t j = i; j < event.frames.size(); ++j) {
 | |
|                     auto& frame = event.frames.at(j);
 | |
|                     auto& object_name = frame.object_name;
 | |
|                     auto& symbol = frame.symbol;
 | |
|                     auto& address = frame.address;
 | |
|                     auto& offset = frame.offset;
 | |
|                     if (symbol.is_empty())
 | |
|                         break;
 | |
| 
 | |
|                     // FIXME: More PID/TID mixing cheats here:
 | |
|                     if (!node) {
 | |
|                         node = &find_or_create_root(object_name, symbol, address, offset, event.timestamp, event.pid);
 | |
|                         root = node;
 | |
|                         root->will_track_seen_events(m_events.size());
 | |
|                     } else {
 | |
|                         node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
 | |
|                     }
 | |
| 
 | |
|                     if (!root->has_seen_event(event_index)) {
 | |
|                         root->did_see_event(event_index);
 | |
|                         root->increment_event_count();
 | |
|                     } else if (node != root) {
 | |
|                         node->increment_event_count();
 | |
|                     }
 | |
| 
 | |
|                     if (j == event.frames.size() - 1) {
 | |
|                         node->add_event_address(address);
 | |
|                         node->increment_self_count();
 | |
|                     }
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     sort_profile_nodes(roots);
 | |
| 
 | |
|     m_roots = move(roots);
 | |
|     m_model->update();
 | |
| }
 | |
| 
 | |
| Result<NonnullOwnPtr<Profile>, String> Profile::load_from_perfcore_file(const StringView& path)
 | |
| {
 | |
|     auto file = Core::File::construct(path);
 | |
|     if (!file->open(Core::IODevice::ReadOnly))
 | |
|         return String::formatted("Unable to open {}, error: {}", path, file->error_string());
 | |
| 
 | |
|     auto json = JsonValue::from_string(file->read_all());
 | |
|     if (!json.has_value() || !json.value().is_object())
 | |
|         return String { "Invalid perfcore format (not a JSON object)" };
 | |
| 
 | |
|     auto& object = json.value().as_object();
 | |
| 
 | |
|     auto file_or_error = MappedFile::map("/boot/Kernel");
 | |
|     OwnPtr<ELF::Image> kernel_elf;
 | |
|     if (!file_or_error.is_error())
 | |
|         kernel_elf = make<ELF::Image>(file_or_error.value()->bytes());
 | |
| 
 | |
|     auto events_value = object.get("events");
 | |
|     if (!events_value.is_array())
 | |
|         return String { "Malformed profile (events is not an array)" };
 | |
| 
 | |
|     auto& perf_events = events_value.as_array();
 | |
| 
 | |
|     NonnullOwnPtrVector<Process> all_processes;
 | |
|     HashMap<pid_t, Process*> current_processes;
 | |
|     Vector<Event> events;
 | |
| 
 | |
|     for (auto& perf_event_value : perf_events.values()) {
 | |
|         auto& perf_event = perf_event_value.as_object();
 | |
| 
 | |
|         Event event;
 | |
| 
 | |
|         event.timestamp = perf_event.get("timestamp").to_number<u64>();
 | |
|         event.type = perf_event.get("type").to_string();
 | |
|         event.pid = perf_event.get("pid").to_i32();
 | |
|         event.tid = perf_event.get("tid").to_i32();
 | |
| 
 | |
|         if (event.type == "malloc") {
 | |
|             event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
 | |
|             event.size = perf_event.get("size").to_number<size_t>();
 | |
|         } else if (event.type == "free") {
 | |
|             event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
 | |
|         } else if (event.type == "mmap") {
 | |
|             event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
 | |
|             event.size = perf_event.get("size").to_number<size_t>();
 | |
|             event.name = perf_event.get("name").to_string();
 | |
| 
 | |
|             auto it = current_processes.find(event.pid);
 | |
|             if (it != current_processes.end())
 | |
|                 it->value->library_metadata.handle_mmap(event.ptr, event.size, event.name);
 | |
|             continue;
 | |
|         } else if (event.type == "munmap") {
 | |
|             event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
 | |
|             event.size = perf_event.get("size").to_number<size_t>();
 | |
|             continue;
 | |
|         } else if (event.type == "process_create") {
 | |
|             event.parent_pid = perf_event.get("parent_pid").to_number<FlatPtr>();
 | |
|             event.executable = perf_event.get("executable").to_string();
 | |
| 
 | |
|             auto sampled_process = adopt_own(*new Process {
 | |
|                 .pid = event.pid,
 | |
|                 .executable = event.executable,
 | |
|                 .start_valid = event.timestamp,
 | |
|             });
 | |
| 
 | |
|             current_processes.set(sampled_process->pid, sampled_process);
 | |
|             all_processes.append(move(sampled_process));
 | |
|             continue;
 | |
|         } else if (event.type == "process_exec") {
 | |
|             event.executable = perf_event.get("executable").to_string();
 | |
| 
 | |
|             auto old_process = current_processes.get(event.pid).value();
 | |
|             old_process->end_valid = event.timestamp - 1;
 | |
| 
 | |
|             current_processes.remove(event.pid);
 | |
| 
 | |
|             auto sampled_process = adopt_own(*new Process {
 | |
|                 .pid = event.pid,
 | |
|                 .executable = event.executable,
 | |
|                 .start_valid = event.timestamp });
 | |
| 
 | |
|             current_processes.set(sampled_process->pid, sampled_process);
 | |
|             all_processes.append(move(sampled_process));
 | |
|             continue;
 | |
|         } else if (event.type == "process_exit") {
 | |
|             auto old_process = current_processes.get(event.pid).value();
 | |
|             old_process->end_valid = event.timestamp - 1;
 | |
| 
 | |
|             current_processes.remove(event.pid);
 | |
|             continue;
 | |
|         } else if (event.type == "thread_create") {
 | |
|             event.parent_tid = perf_event.get("parent_tid").to_i32();
 | |
|             auto it = current_processes.find(event.pid);
 | |
|             if (it != current_processes.end())
 | |
|                 it->value->handle_thread_create(event.tid, event.timestamp);
 | |
|             continue;
 | |
|         } else if (event.type == "thread_exit") {
 | |
|             auto it = current_processes.find(event.pid);
 | |
|             if (it != current_processes.end())
 | |
|                 it->value->handle_thread_exit(event.tid, event.timestamp);
 | |
|             continue;
 | |
|         }
 | |
| 
 | |
|         auto stack_array = perf_event.get("stack").as_array();
 | |
|         for (ssize_t i = stack_array.values().size() - 1; i >= 0; --i) {
 | |
|             auto& frame = stack_array.at(i);
 | |
|             auto ptr = frame.to_number<u32>();
 | |
|             u32 offset = 0;
 | |
|             FlyString object_name;
 | |
|             String symbol;
 | |
| 
 | |
|             if (ptr >= 0xc0000000) {
 | |
|                 if (kernel_elf) {
 | |
|                     symbol = kernel_elf->symbolicate(ptr, &offset);
 | |
|                 } else {
 | |
|                     symbol = String::formatted("?? <{:p}>", ptr);
 | |
|                 }
 | |
|             } else {
 | |
|                 auto it = current_processes.find(event.pid);
 | |
|                 // FIXME: This logic is kinda gnarly, find a way to clean it up.
 | |
|                 LibraryMetadata* library_metadata {};
 | |
|                 if (it != current_processes.end())
 | |
|                     library_metadata = &it->value->library_metadata;
 | |
|                 if (auto* library = library_metadata ? library_metadata->library_containing(ptr) : nullptr) {
 | |
|                     object_name = library->name;
 | |
|                     symbol = library->symbolicate(ptr, &offset);
 | |
|                 } else {
 | |
|                     symbol = String::formatted("?? <{:p}>", ptr);
 | |
|                 }
 | |
|             }
 | |
| 
 | |
|             event.frames.append({ object_name, symbol, ptr, offset });
 | |
|         }
 | |
| 
 | |
|         if (event.frames.size() < 2)
 | |
|             continue;
 | |
| 
 | |
|         FlatPtr innermost_frame_address = event.frames.at(1).address;
 | |
|         event.in_kernel = innermost_frame_address >= 0xc0000000;
 | |
| 
 | |
|         events.append(move(event));
 | |
|     }
 | |
| 
 | |
|     if (events.is_empty())
 | |
|         return String { "No events captured (targeted process was never on CPU)" };
 | |
| 
 | |
|     quick_sort(all_processes, [](auto& a, auto& b) {
 | |
|         if (a.pid == b.pid)
 | |
|             return a.start_valid < b.start_valid;
 | |
|         else
 | |
|             return a.pid < b.pid;
 | |
|     });
 | |
| 
 | |
|     Vector<Process> processes;
 | |
|     for (auto& it : all_processes)
 | |
|         processes.append(move(it));
 | |
| 
 | |
|     return adopt_own(*new Profile(move(processes), move(events)));
 | |
| }
 | |
| 
 | |
| void ProfileNode::sort_children()
 | |
| {
 | |
|     sort_profile_nodes(m_children);
 | |
| }
 | |
| 
 | |
| void Profile::set_timestamp_filter_range(u64 start, u64 end)
 | |
| {
 | |
|     if (m_has_timestamp_filter_range && m_timestamp_filter_range_start == start && m_timestamp_filter_range_end == end)
 | |
|         return;
 | |
|     m_has_timestamp_filter_range = true;
 | |
| 
 | |
|     m_timestamp_filter_range_start = min(start, end);
 | |
|     m_timestamp_filter_range_end = max(start, end);
 | |
| 
 | |
|     rebuild_tree();
 | |
|     m_samples_model->update();
 | |
| }
 | |
| 
 | |
| void Profile::clear_timestamp_filter_range()
 | |
| {
 | |
|     if (!m_has_timestamp_filter_range)
 | |
|         return;
 | |
|     m_has_timestamp_filter_range = false;
 | |
|     rebuild_tree();
 | |
|     m_samples_model->update();
 | |
| }
 | |
| 
 | |
| void Profile::set_process_filter(pid_t pid, u64 start_valid, u64 end_valid)
 | |
| {
 | |
|     if (m_has_process_filter && m_process_filter_pid == pid && m_process_filter_start_valid == start_valid && m_process_filter_end_valid == end_valid)
 | |
|         return;
 | |
|     m_has_process_filter = true;
 | |
| 
 | |
|     m_process_filter_pid = pid;
 | |
|     m_process_filter_start_valid = start_valid;
 | |
|     m_process_filter_end_valid = end_valid;
 | |
| 
 | |
|     rebuild_tree();
 | |
|     if (m_disassembly_model)
 | |
|         m_disassembly_model->update();
 | |
|     m_samples_model->update();
 | |
| }
 | |
| void Profile::clear_process_filter()
 | |
| {
 | |
|     if (!m_has_process_filter)
 | |
|         return;
 | |
|     m_has_process_filter = false;
 | |
|     rebuild_tree();
 | |
|     if (m_disassembly_model)
 | |
|         m_disassembly_model->update();
 | |
|     m_samples_model->update();
 | |
| }
 | |
| 
 | |
| void Profile::set_inverted(bool inverted)
 | |
| {
 | |
|     if (m_inverted == inverted)
 | |
|         return;
 | |
|     m_inverted = inverted;
 | |
|     rebuild_tree();
 | |
| }
 | |
| 
 | |
| void Profile::set_show_top_functions(bool show)
 | |
| {
 | |
|     if (m_show_top_functions == show)
 | |
|         return;
 | |
|     m_show_top_functions = show;
 | |
|     rebuild_tree();
 | |
| }
 | |
| 
 | |
| void Profile::set_show_percentages(bool show_percentages)
 | |
| {
 | |
|     if (m_show_percentages == show_percentages)
 | |
|         return;
 | |
|     m_show_percentages = show_percentages;
 | |
| }
 | |
| 
 | |
| void Profile::set_disassembly_index(const GUI::ModelIndex& index)
 | |
| {
 | |
|     if (m_disassembly_index == index)
 | |
|         return;
 | |
|     m_disassembly_index = index;
 | |
|     auto* node = static_cast<ProfileNode*>(index.internal_data());
 | |
|     m_disassembly_model = DisassemblyModel::create(*this, *node);
 | |
| }
 | |
| 
 | |
| GUI::Model* Profile::disassembly_model()
 | |
| {
 | |
|     return m_disassembly_model;
 | |
| }
 | |
| 
 | |
| ProfileNode::ProfileNode(const String& object_name, String symbol, u32 address, u32 offset, u64 timestamp, pid_t pid)
 | |
|     : m_symbol(move(symbol))
 | |
|     , m_pid(pid)
 | |
|     , m_address(address)
 | |
|     , m_offset(offset)
 | |
|     , m_timestamp(timestamp)
 | |
| {
 | |
|     String object;
 | |
|     if (object_name.ends_with(": .text")) {
 | |
|         object = object_name.view().substring_view(0, object_name.length() - 7);
 | |
|     } else {
 | |
|         object = object_name;
 | |
|     }
 | |
|     m_object_name = LexicalPath(object).basename();
 | |
| }
 | |
| 
 | |
| const Process* ProfileNode::process(Profile& profile, u64 timestamp) const
 | |
| {
 | |
|     return profile.find_process(m_pid, timestamp);
 | |
| }
 |