mirror of
https://github.com/RGBCube/serenity
synced 2025-05-15 17:14:58 +00:00

Hiding those frames doesn't really make sense. They're a major contributor to a process's spent CPU time and show up in a lot of profiles. That, however, is because those processes really do spend quite a bit of time in the scheduler by doing lots of context switches, like WindowServer when responding to IPC calls. Instead of hiding these frames for aesthetic reasons, we should improve the scheduler.
491 lines
16 KiB
C++
491 lines
16 KiB
C++
/*
|
|
* Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
|
|
*
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
|
*/
|
|
|
|
#include "Profile.h"
|
|
#include "DisassemblyModel.h"
|
|
#include "ProfileModel.h"
|
|
#include "SamplesModel.h"
|
|
#include <AK/HashTable.h>
|
|
#include <AK/LexicalPath.h>
|
|
#include <AK/MappedFile.h>
|
|
#include <AK/NonnullOwnPtrVector.h>
|
|
#include <AK/QuickSort.h>
|
|
#include <AK/RefPtr.h>
|
|
#include <LibCore/File.h>
|
|
#include <LibELF/Image.h>
|
|
#include <sys/stat.h>
|
|
|
|
namespace Profiler {
|
|
|
|
// Sorts `nodes` by descending event count and then asks every node to sort its
// own children (ProfileNode::sort_children() calls back into this function).
static void sort_profile_nodes(Vector<NonnullRefPtr<ProfileNode>>& nodes)
{
    // The comparator has to be a strict ordering: with `>=`, two nodes with
    // equal counts would each be reported as ordered before the other.
    quick_sort(nodes.begin(), nodes.end(), [](auto& a, auto& b) {
        return a->event_count() > b->event_count();
    });

    for (auto& child : nodes)
        child->sort_children();
}
|
|
|
|
// Takes ownership of the loaded processes and events, records the first and
// last event timestamps and the deepest stack, creates the tree and samples
// models, and builds the initial tree.
// NOTE: first()/last() are read unconditionally, so `events` is presumably
// expected to be non-empty here.
Profile::Profile(Vector<Process> processes, Vector<Event> events)
    : m_processes(move(processes))
    , m_events(move(events))
{
    m_first_timestamp = m_events.first().timestamp;
    m_last_timestamp = m_events.last().timestamp;

    m_model = ProfileModel::create(*this);
    m_samples_model = SamplesModel::create(*this);

    // Remember the largest frame count seen in any event.
    for (auto& event : m_events) {
        auto const stack_depth = static_cast<u32>(event.frames.size());
        if (stack_depth > m_deepest_stack_depth)
            m_deepest_stack_depth = stack_depth;
    }

    rebuild_tree();
}
|
|
|
|
// Nothing to release by hand; the destructor is kept out of line in this file.
Profile::~Profile() = default;
|
|
|
|
// Returns the model created from ProfileModel::create() in the constructor.
GUI::Model& Profile::model()
{
    return *m_model;
}
|
|
|
|
// Returns the model created from SamplesModel::create() in the constructor.
GUI::Model& Profile::samples_model()
{
    return *m_samples_model;
}
|
|
|
|
void Profile::rebuild_tree()
|
|
{
|
|
Vector<NonnullRefPtr<ProfileNode>> roots;
|
|
|
|
auto find_or_create_root = [&roots](FlyString object_name, String symbol, u32 address, u32 offset, u64 timestamp, pid_t pid) -> ProfileNode& {
|
|
for (auto root : roots) {
|
|
if (root->symbol() == symbol) {
|
|
return root;
|
|
}
|
|
}
|
|
auto new_root = ProfileNode::create(move(object_name), move(symbol), address, offset, timestamp, pid);
|
|
roots.append(new_root);
|
|
return new_root;
|
|
};
|
|
|
|
HashTable<FlatPtr> live_allocations;
|
|
|
|
for_each_event_in_filter_range([&](auto& event) {
|
|
if (event.type == "malloc"sv)
|
|
live_allocations.set(event.ptr);
|
|
else if (event.type == "free"sv)
|
|
live_allocations.remove(event.ptr);
|
|
});
|
|
|
|
m_filtered_event_indices.clear();
|
|
|
|
for (size_t event_index = 0; event_index < m_events.size(); ++event_index) {
|
|
auto& event = m_events.at(event_index);
|
|
|
|
if (has_timestamp_filter_range()) {
|
|
auto timestamp = event.timestamp;
|
|
if (timestamp < m_timestamp_filter_range_start || timestamp > m_timestamp_filter_range_end)
|
|
continue;
|
|
}
|
|
|
|
if (!process_filter_contains(event.pid, event.timestamp))
|
|
continue;
|
|
|
|
m_filtered_event_indices.append(event_index);
|
|
|
|
if (event.type == "malloc"sv && !live_allocations.contains(event.ptr))
|
|
continue;
|
|
|
|
if (event.type == "free"sv)
|
|
continue;
|
|
|
|
auto for_each_frame = [&]<typename Callback>(Callback callback) {
|
|
if (!m_inverted) {
|
|
for (size_t i = 0; i < event.frames.size(); ++i) {
|
|
if (callback(event.frames.at(i), i == event.frames.size() - 1) == IterationDecision::Break)
|
|
break;
|
|
}
|
|
} else {
|
|
for (ssize_t i = event.frames.size() - 1; i >= 0; --i) {
|
|
if (callback(event.frames.at(i), static_cast<size_t>(i) == event.frames.size() - 1) == IterationDecision::Break)
|
|
break;
|
|
}
|
|
}
|
|
};
|
|
|
|
if (!m_show_top_functions) {
|
|
ProfileNode* node = nullptr;
|
|
for_each_frame([&](const Frame& frame, bool is_innermost_frame) {
|
|
auto& object_name = frame.object_name;
|
|
auto& symbol = frame.symbol;
|
|
auto& address = frame.address;
|
|
auto& offset = frame.offset;
|
|
|
|
if (symbol.is_empty())
|
|
return IterationDecision::Break;
|
|
|
|
// FIXME: More cheating with intentional mixing of TID/PID here:
|
|
if (!node)
|
|
node = &find_or_create_root(object_name, symbol, address, offset, event.timestamp, event.pid);
|
|
else
|
|
node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
|
|
|
|
node->increment_event_count();
|
|
if (is_innermost_frame) {
|
|
node->add_event_address(address);
|
|
node->increment_self_count();
|
|
}
|
|
return IterationDecision::Continue;
|
|
});
|
|
} else {
|
|
for (size_t i = 0; i < event.frames.size(); ++i) {
|
|
ProfileNode* node = nullptr;
|
|
ProfileNode* root = nullptr;
|
|
for (size_t j = i; j < event.frames.size(); ++j) {
|
|
auto& frame = event.frames.at(j);
|
|
auto& object_name = frame.object_name;
|
|
auto& symbol = frame.symbol;
|
|
auto& address = frame.address;
|
|
auto& offset = frame.offset;
|
|
if (symbol.is_empty())
|
|
break;
|
|
|
|
// FIXME: More PID/TID mixing cheats here:
|
|
if (!node) {
|
|
node = &find_or_create_root(object_name, symbol, address, offset, event.timestamp, event.pid);
|
|
root = node;
|
|
root->will_track_seen_events(m_events.size());
|
|
} else {
|
|
node = &node->find_or_create_child(object_name, symbol, address, offset, event.timestamp, event.pid);
|
|
}
|
|
|
|
if (!root->has_seen_event(event_index)) {
|
|
root->did_see_event(event_index);
|
|
root->increment_event_count();
|
|
} else if (node != root) {
|
|
node->increment_event_count();
|
|
}
|
|
|
|
if (j == event.frames.size() - 1) {
|
|
node->add_event_address(address);
|
|
node->increment_self_count();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
sort_profile_nodes(roots);
|
|
|
|
m_roots = move(roots);
|
|
m_model->update();
|
|
}
|
|
|
|
// Loads a perfcore file (a JSON object with an "events" array) from `path` and
// builds a Profile from it.
//
// Bookkeeping events (mmap, munmap, process_create/exec/exit,
// thread_create/exit) update the per-process state and are not stored; all
// other events have their stack symbolicated and are kept when they have at
// least two frames.
//
// Returns an error string when the file cannot be opened, the JSON is
// malformed, or no event was kept.
Result<NonnullOwnPtr<Profile>, String> Profile::load_from_perfcore_file(const StringView& path)
{
    // Addresses at or above this value are treated as kernel addresses.
    constexpr FlatPtr kernel_base = 0xc0000000;

    auto file = Core::File::construct(path);
    if (!file->open(Core::OpenMode::ReadOnly))
        return String::formatted("Unable to open {}, error: {}", path, file->error_string());

    auto json = JsonValue::from_string(file->read_all());
    if (!json.has_value() || !json.value().is_object())
        return String { "Invalid perfcore format (not a JSON object)" };

    auto& object = json.value().as_object();

    // Kernel symbols are optional: without a mappable /boot/Kernel, kernel frames stay unresolved.
    auto file_or_error = MappedFile::map("/boot/Kernel");
    OwnPtr<ELF::Image> kernel_elf;
    if (!file_or_error.is_error())
        kernel_elf = make<ELF::Image>(file_or_error.value()->bytes());

    auto events_value = object.get_ptr("events");
    if (!events_value || !events_value->is_array())
        return String { "Malformed profile (events is not an array)" };

    auto& perf_events = events_value->as_array();

    // all_processes owns every process incarnation; current_processes maps a PID to its live incarnation.
    NonnullOwnPtrVector<Process> all_processes;
    HashMap<pid_t, Process*> current_processes;
    Vector<Event> events;

    for (auto& perf_event_value : perf_events.values()) {
        // Report malformed entries through the Result instead of crashing in as_object().
        if (!perf_event_value.is_object())
            return String { "Malformed profile (event is not an object)" };
        auto& perf_event = perf_event_value.as_object();

        Event event;

        event.timestamp = perf_event.get("timestamp").to_number<u64>();
        event.lost_samples = perf_event.get("lost_samples").to_number<u32>();
        event.type = perf_event.get("type").to_string();
        event.pid = perf_event.get("pid").to_i32();
        event.tid = perf_event.get("tid").to_i32();

        if (event.type == "malloc"sv) {
            event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
            event.size = perf_event.get("size").to_number<size_t>();
        } else if (event.type == "free"sv) {
            event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
        } else if (event.type == "mmap"sv) {
            event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
            event.size = perf_event.get("size").to_number<size_t>();
            event.name = perf_event.get("name").to_string();

            auto it = current_processes.find(event.pid);
            if (it != current_processes.end())
                it->value->library_metadata.handle_mmap(event.ptr, event.size, event.name);
            continue;
        } else if (event.type == "munmap"sv) {
            event.ptr = perf_event.get("ptr").to_number<FlatPtr>();
            event.size = perf_event.get("size").to_number<size_t>();
            continue;
        } else if (event.type == "process_create"sv) {
            event.parent_pid = perf_event.get("parent_pid").to_number<FlatPtr>();
            event.executable = perf_event.get("executable").to_string();

            auto sampled_process = adopt_own(*new Process {
                .pid = event.pid,
                .executable = event.executable,
                .start_valid = event.timestamp,
            });

            current_processes.set(sampled_process->pid, sampled_process);
            all_processes.append(move(sampled_process));
            continue;
        } else if (event.type == "process_exec"sv) {
            event.executable = perf_event.get("executable").to_string();

            // Close the previous incarnation if we know it; an untracked PID is
            // tolerated like in the mmap/thread branches instead of crashing.
            auto it = current_processes.find(event.pid);
            if (it != current_processes.end()) {
                it->value->end_valid = event.timestamp - 1;
                current_processes.remove(event.pid);
            }

            auto sampled_process = adopt_own(*new Process {
                .pid = event.pid,
                .executable = event.executable,
                .start_valid = event.timestamp });

            current_processes.set(sampled_process->pid, sampled_process);
            all_processes.append(move(sampled_process));
            continue;
        } else if (event.type == "process_exit"sv) {
            // Same tolerance for untracked PIDs as above.
            auto it = current_processes.find(event.pid);
            if (it != current_processes.end()) {
                it->value->end_valid = event.timestamp - 1;
                current_processes.remove(event.pid);
            }
            continue;
        } else if (event.type == "thread_create"sv) {
            event.parent_tid = perf_event.get("parent_tid").to_i32();
            auto it = current_processes.find(event.pid);
            if (it != current_processes.end())
                it->value->handle_thread_create(event.tid, event.timestamp);
            continue;
        } else if (event.type == "thread_exit"sv) {
            auto it = current_processes.find(event.pid);
            if (it != current_processes.end())
                it->value->handle_thread_exit(event.tid, event.timestamp);
            continue;
        }

        // Everything that reaches this point must carry a stack.
        auto* stack = perf_event.get_ptr("stack");
        if (!stack || !stack->is_array())
            return String { "Malformed profile (event has no stack array)" };
        auto& stack_array = stack->as_array();

        // The stack is stored in reverse: the last JSON entry becomes frames[0].
        for (ssize_t i = stack_array.values().size() - 1; i >= 0; --i) {
            auto& frame = stack_array.at(i);
            auto ptr = frame.to_number<u32>();
            u32 offset = 0;
            FlyString object_name;
            String symbol;

            if (ptr >= kernel_base) {
                if (kernel_elf) {
                    symbol = kernel_elf->symbolicate(ptr, &offset);
                } else {
                    symbol = String::formatted("?? <{:p}>", ptr);
                }
            } else {
                auto it = current_processes.find(event.pid);
                // FIXME: This logic is kinda gnarly, find a way to clean it up.
                LibraryMetadata* library_metadata {};
                if (it != current_processes.end())
                    library_metadata = &it->value->library_metadata;
                if (auto* library = library_metadata ? library_metadata->library_containing(ptr) : nullptr) {
                    object_name = library->name;
                    symbol = library->symbolicate(ptr, &offset);
                } else {
                    symbol = String::formatted("?? <{:p}>", ptr);
                }
            }

            event.frames.append({ object_name, symbol, ptr, offset });
        }

        if (event.frames.size() < 2)
            continue;

        // NOTE(review): rebuild_tree() treats the *last* frame as the innermost one,
        // yet this reads frames[1] -- confirm which frame is intended.
        FlatPtr innermost_frame_address = event.frames.at(1).address;
        event.in_kernel = innermost_frame_address >= kernel_base;

        events.append(move(event));
    }

    if (events.is_empty())
        return String { "No events captured (targeted process was never on CPU)" };

    // Order processes by PID, and incarnations of the same PID by start time.
    quick_sort(all_processes, [](auto& a, auto& b) {
        if (a.pid == b.pid)
            return a.start_valid < b.start_valid;
        else
            return a.pid < b.pid;
    });

    Vector<Process> processes;
    for (auto& it : all_processes)
        processes.append(move(it));

    return adopt_own(*new Profile(move(processes), move(events)));
}
|
|
|
|
void ProfileNode::sort_children()
|
|
{
|
|
sort_profile_nodes(m_children);
|
|
}
|
|
|
|
// Restricts the profile to events whose timestamp lies within [start, end].
// The bounds may be given in either order. Rebuilds the tree and updates the
// samples model unless the same range is already active.
void Profile::set_timestamp_filter_range(u64 start, u64 end)
{
    // Normalize before comparing: the stored range is always (min, max), so a
    // reversed but otherwise identical range must also hit the early return.
    auto const range_start = min(start, end);
    auto const range_end = max(start, end);

    if (m_has_timestamp_filter_range && m_timestamp_filter_range_start == range_start && m_timestamp_filter_range_end == range_end)
        return;

    m_has_timestamp_filter_range = true;
    m_timestamp_filter_range_start = range_start;
    m_timestamp_filter_range_end = range_end;

    rebuild_tree();
    m_samples_model->update();
}
|
|
|
|
void Profile::clear_timestamp_filter_range()
|
|
{
|
|
if (!m_has_timestamp_filter_range)
|
|
return;
|
|
m_has_timestamp_filter_range = false;
|
|
rebuild_tree();
|
|
m_samples_model->update();
|
|
}
|
|
|
|
// Adds a (pid, start_valid, end_valid) process filter unless an equal one is
// already present, then rebuilds the tree and updates the dependent models.
void Profile::add_process_filter(pid_t pid, u64 start_valid, u64 end_valid)
{
    auto new_filter = ProcessFilter { pid, start_valid, end_valid };
    bool const already_present = m_process_filters.contains_slow(new_filter);
    if (already_present)
        return;

    m_process_filters.append(move(new_filter));
    rebuild_tree();

    // The disassembly model only exists once a disassembly index has been set.
    if (m_disassembly_model)
        m_disassembly_model->update();
    m_samples_model->update();
}
|
|
|
|
// Removes the first process filter equal to (pid, start_valid, end_valid), if
// there is one, then rebuilds the tree and updates the dependent models.
void Profile::remove_process_filter(pid_t pid, u64 start_valid, u64 end_valid)
{
    auto target = ProcessFilter { pid, start_valid, end_valid };
    bool const is_present = m_process_filters.contains_slow(target);
    if (!is_present)
        return;

    m_process_filters.remove_first_matching([&target](ProcessFilter const& candidate) {
        return candidate == target;
    });
    rebuild_tree();

    // The disassembly model only exists once a disassembly index has been set.
    if (m_disassembly_model)
        m_disassembly_model->update();
    m_samples_model->update();
}
|
|
|
|
void Profile::clear_process_filter()
|
|
{
|
|
if (m_process_filters.is_empty())
|
|
return;
|
|
m_process_filters.clear();
|
|
rebuild_tree();
|
|
if (m_disassembly_model)
|
|
m_disassembly_model->update();
|
|
m_samples_model->update();
|
|
}
|
|
|
|
// Returns true when no process filter is active, or when some filter matches
// `pid` and has `timestamp` within its [start_valid, end_valid] window.
// NOTE(review): `timestamp` is u32 here while event timestamps and filter
// bounds are u64 elsewhere in this file -- check whether the narrowing is intended.
bool Profile::process_filter_contains(pid_t pid, u32 timestamp)
{
    if (!has_process_filter())
        return true;

    for (auto const& process_filter : m_process_filters) {
        if (pid != process_filter.pid)
            continue;
        if (timestamp < process_filter.start_valid)
            continue;
        if (timestamp > process_filter.end_valid)
            continue;
        return true;
    }

    return false;
}
|
|
|
|
void Profile::set_inverted(bool inverted)
|
|
{
|
|
if (m_inverted == inverted)
|
|
return;
|
|
m_inverted = inverted;
|
|
rebuild_tree();
|
|
}
|
|
|
|
void Profile::set_show_top_functions(bool show)
|
|
{
|
|
if (m_show_top_functions == show)
|
|
return;
|
|
m_show_top_functions = show;
|
|
rebuild_tree();
|
|
}
|
|
|
|
void Profile::set_show_percentages(bool show_percentages)
|
|
{
|
|
if (m_show_percentages == show_percentages)
|
|
return;
|
|
m_show_percentages = show_percentages;
|
|
}
|
|
|
|
// Remembers `index` as the node to disassemble and (re)creates the disassembly
// model for the ProfileNode stored in the index's internal data. Does nothing
// when the index is unchanged.
void Profile::set_disassembly_index(const GUI::ModelIndex& index)
{
    if (m_disassembly_index == index)
        return;
    m_disassembly_index = index;

    auto* node = static_cast<ProfileNode*>(index.internal_data());
    // An index without a node has nothing to disassemble; reset the model
    // instead of dereferencing a null pointer.
    if (!node) {
        m_disassembly_model = nullptr;
        return;
    }
    m_disassembly_model = DisassemblyModel::create(*this, *node);
}
|
|
|
|
// Returns the current disassembly model; other methods in this file null-check
// it before use, so callers should expect that it may be null.
GUI::Model* Profile::disassembly_model()
{
    return m_disassembly_model;
}
|
|
|
|
// Creates a node for `symbol`. The stored object name is the basename of
// `object_name` after a trailing ": .text" has been dropped.
ProfileNode::ProfileNode(const String& object_name, String symbol, u32 address, u32 offset, u64 timestamp, pid_t pid)
    : m_symbol(move(symbol))
    , m_pid(pid)
    , m_address(address)
    , m_offset(offset)
    , m_timestamp(timestamp)
{
    // Number of characters in the ": .text" suffix.
    constexpr size_t text_suffix_length = 7;

    String object = object_name;
    if (object_name.ends_with(": .text"sv))
        object = object_name.view().substring_view(0, object_name.length() - text_suffix_length);

    m_object_name = LexicalPath(object).basename();
}
|
|
|
|
// Asks `profile` for the process with this node's PID at `timestamp`.
const Process* ProfileNode::process(Profile& profile, u64 timestamp) const
{
    return profile.find_process(m_pid, timestamp);
}
|
|
|
|
}
|