blob: 951472bca07936c47cc000baa46590bcbe70ea40 [file] [log] [blame]
/*
* Copyright (C) 2022 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "src/trace_processor/util/profile_builder.h"
#include <algorithm>
#include <cstdint>
#include <deque>
#include <iostream>
#include <iterator>
#include <optional>
#include <vector>
#include "perfetto/base/logging.h"
#include "perfetto/ext/base/string_utils.h"
#include "perfetto/ext/base/string_view.h"
#include "perfetto/ext/trace_processor/demangle.h"
#include "protos/third_party/pprof/profile.pbzero.h"
#include "src/trace_processor/containers/null_term_string_view.h"
#include "src/trace_processor/containers/string_pool.h"
#include "src/trace_processor/storage/trace_storage.h"
#include "src/trace_processor/types/trace_processor_context.h"
#include "src/trace_processor/util/annotated_callsites.h"
namespace perfetto {
namespace trace_processor {
namespace {
using protos::pbzero::Stack;
using third_party::perftools::profiles::pbzero::Profile;
using third_party::perftools::profiles::pbzero::Sample;
base::StringView ToString(CallsiteAnnotation annotation) {
switch (annotation) {
case CallsiteAnnotation::kNone:
return "";
case CallsiteAnnotation::kArtAot:
return "aot";
case CallsiteAnnotation::kArtInterpreted:
return "interp";
case CallsiteAnnotation::kArtJit:
return "jit";
case CallsiteAnnotation::kCommonFrame:
return "common-frame";
case CallsiteAnnotation::kCommonFrameInterp:
return "common-frame-interp";
}
PERFETTO_FATAL("For GCC");
}
} // namespace
GProfileBuilder::StringTable::StringTable(
protozero::HeapBuffered<third_party::perftools::profiles::pbzero::Profile>*
result,
const StringPool* string_pool)
: string_pool_(*string_pool), result_(*result) {
// String at index 0 of the string table must be the empty string (see
// profile.proto)
int64_t empty_index = WriteString("");
PERFETTO_CHECK(empty_index == kEmptyStringIndex);
}
int64_t GProfileBuilder::StringTable::InternString(base::StringView str) {
if (str.empty()) {
return kEmptyStringIndex;
}
auto hash = str.Hash();
auto it = seen_strings_.find(hash);
if (it != seen_strings_.end()) {
return it->second;
}
auto pool_id = string_pool_.GetId(str);
int64_t index = pool_id ? InternString(*pool_id) : WriteString(str);
seen_strings_.insert({hash, index});
return index;
}
int64_t GProfileBuilder::StringTable::InternString(
StringPool::Id string_pool_id) {
auto it = seen_string_pool_ids_.find(string_pool_id);
if (it != seen_string_pool_ids_.end()) {
return it->second;
}
NullTermStringView str = string_pool_.Get(string_pool_id);
int64_t index = str.empty() ? kEmptyStringIndex : WriteString(str);
seen_string_pool_ids_.insert({string_pool_id, index});
return index;
}
int64_t GProfileBuilder::StringTable::GetAnnotatedString(
StringPool::Id str,
CallsiteAnnotation annotation) {
if (str.is_null() || annotation == CallsiteAnnotation::kNone) {
return InternString(str);
}
return GetAnnotatedString(string_pool_.Get(str), annotation);
}
int64_t GProfileBuilder::StringTable::GetAnnotatedString(
base::StringView str,
CallsiteAnnotation annotation) {
if (str.empty() || annotation == CallsiteAnnotation::kNone) {
return InternString(str);
}
return InternString(base::StringView(
str.ToStdString() + " [" + ToString(annotation).ToStdString() + "]"));
}
int64_t GProfileBuilder::StringTable::WriteString(base::StringView str) {
result_->add_string_table(str.data(), str.size());
return next_index_++;
}
GProfileBuilder::MappingKey::MappingKey(
const tables::StackProfileMappingTable::ConstRowReference& mapping,
StringTable& string_table) {
size = static_cast<uint64_t>(mapping.end() - mapping.start());
file_offset = static_cast<uint64_t>(mapping.exact_offset());
build_id_or_filename = string_table.InternString(mapping.build_id());
if (build_id_or_filename == kEmptyStringIndex) {
build_id_or_filename = string_table.InternString(mapping.name());
}
}
GProfileBuilder::Mapping::Mapping(
const tables::StackProfileMappingTable::ConstRowReference& mapping,
const StringPool& string_pool,
StringTable& string_table)
: memory_start(static_cast<uint64_t>(mapping.start())),
memory_limit(static_cast<uint64_t>(mapping.end())),
file_offset(static_cast<uint64_t>(mapping.exact_offset())),
filename(string_table.InternString(mapping.name())),
build_id(string_table.InternString(mapping.build_id())),
filename_str(string_pool.Get(mapping.name()).ToStdString()) {}
// Do some very basic scoring.
int64_t GProfileBuilder::Mapping::ComputeMainBinaryScore() const {
constexpr const char* kBadSuffixes[] = {".so"};
constexpr const char* kBadPrefixes[] = {"/apex", "/system", "/[", "["};
int64_t score = 0;
if (build_id != kEmptyStringIndex) {
score += 10;
}
if (filename != kEmptyStringIndex) {
score += 10;
}
if (debug_info.has_functions) {
score += 10;
}
if (debug_info.has_filenames) {
score += 10;
}
if (debug_info.has_line_numbers) {
score += 10;
}
if (debug_info.has_inline_frames) {
score += 10;
}
if (memory_limit == memory_start) {
score -= 1000;
}
for (const char* suffix : kBadSuffixes) {
if (base::EndsWith(filename_str, suffix)) {
score -= 1000;
break;
}
}
for (const char* prefix : kBadPrefixes) {
if (base::StartsWith(filename_str, prefix)) {
score -= 1000;
break;
}
}
return score;
}
bool GProfileBuilder::SampleAggregator::AddSample(
const protozero::PackedVarInt& location_ids,
const std::vector<int64_t>& values) {
SerializedLocationId key(location_ids.data(),
location_ids.data() + location_ids.size());
std::vector<int64_t>* agg_values = samples_.Find(key);
if (!agg_values) {
samples_.Insert(std::move(key), values);
return true;
}
// All samples must have the same number of values.
if (values.size() != agg_values->size()) {
return false;
}
std::transform(values.begin(), values.end(), agg_values->begin(),
agg_values->begin(), std::plus<int64_t>());
return true;
}
void GProfileBuilder::SampleAggregator::WriteTo(Profile& profile) {
protozero::PackedVarInt values;
for (auto it = samples_.GetIterator(); it; ++it) {
values.Reset();
for (int64_t value : it.value()) {
values.Append(value);
}
Sample* sample = profile.add_sample();
sample->set_value(values);
// Map key is the serialized varint. Just append the bytes.
sample->AppendBytes(Sample::kLocationIdFieldNumber, it.key().data(),
it.key().size());
}
}
GProfileBuilder::GProfileBuilder(const TraceProcessorContext* context,
const std::vector<ValueType>& sample_types)
: context_(*context),
string_table_(&result_, &context->storage->string_pool()),
annotations_(context) {
// Make sure the empty function always gets id 0 which will be ignored
// when writing the proto file.
functions_.insert(
{Function{kEmptyStringIndex, kEmptyStringIndex, kEmptyStringIndex},
kNullFunctionId});
WriteSampleTypes(sample_types);
}
GProfileBuilder::~GProfileBuilder() = default;
void GProfileBuilder::WriteSampleTypes(
const std::vector<ValueType>& sample_types) {
for (const auto& value_type : sample_types) {
// Write strings first
int64_t type =
string_table_.InternString(base::StringView(value_type.type));
int64_t unit =
string_table_.InternString(base::StringView(value_type.unit));
// Add message later, remember protozero does not allow you to
// interleave these write calls.
auto* sample_type = result_->add_sample_type();
sample_type->set_type(type);
sample_type->set_unit(unit);
}
}
bool GProfileBuilder::AddSample(const Stack::Decoder& stack,
const std::vector<int64_t>& values) {
PERFETTO_CHECK(!finalized_);
auto it = stack.entries();
if (!it) {
return true;
}
auto next = it;
++next;
if (!next) {
Stack::Entry::Decoder entry(it->as_bytes());
if (entry.has_callsite_id() || entry.has_annotated_callsite_id()) {
bool annotated = entry.has_annotated_callsite_id();
uint32_t callsite_id = entry.has_callsite_id()
? entry.callsite_id()
: entry.annotated_callsite_id();
return samples_.AddSample(
GetLocationIdsForCallsite(CallsiteId(callsite_id), annotated),
values);
}
}
// Note pprof orders the stacks leafs first. That is also the ordering
// StackBlob uses for entries
protozero::PackedVarInt location_ids;
for (; it; ++it) {
Stack::Entry::Decoder entry(it->as_bytes());
if (entry.has_name()) {
location_ids.Append(
WriteFakeLocationIfNeeded(entry.name().ToStdString()));
} else if (entry.has_callsite_id() || entry.has_annotated_callsite_id()) {
bool annotated = entry.has_annotated_callsite_id();
uint32_t callsite_id = entry.has_callsite_id()
? entry.callsite_id()
: entry.annotated_callsite_id();
const protozero::PackedVarInt& ids =
GetLocationIdsForCallsite(CallsiteId(callsite_id), annotated);
for (auto* p = ids.data(); p < ids.data() + ids.size();) {
uint64_t location_id;
p = protozero::proto_utils::ParseVarInt(p, ids.data() + ids.size(),
&location_id);
location_ids.Append(location_id);
}
} else if (entry.has_frame_id()) {
location_ids.Append(WriteLocationIfNeeded(FrameId(entry.frame_id()),
CallsiteAnnotation::kNone));
}
}
return samples_.AddSample(location_ids, values);
}
void GProfileBuilder::Finalize() {
if (finalized_) {
return;
}
WriteMappings();
WriteFunctions();
WriteLocations();
samples_.WriteTo(*result_.get());
finalized_ = true;
}
std::string GProfileBuilder::Build() {
Finalize();
return result_.SerializeAsString();
}
const protozero::PackedVarInt& GProfileBuilder::GetLocationIdsForCallsite(
const CallsiteId& callsite_id,
bool annotated) {
auto it = cached_location_ids_.find({callsite_id, annotated});
if (it != cached_location_ids_.end()) {
return it->second;
}
protozero::PackedVarInt& location_ids =
cached_location_ids_[{callsite_id, annotated}];
const auto& cs_table = context_.storage->stack_profile_callsite_table();
std::optional<tables::StackProfileCallsiteTable::ConstRowReference>
start_ref = cs_table.FindById(callsite_id);
if (!start_ref) {
return location_ids;
}
location_ids.Append(WriteLocationIfNeeded(
start_ref->frame_id(), annotated ? annotations_.GetAnnotation(*start_ref)
: CallsiteAnnotation::kNone));
std::optional<CallsiteId> parent_id = start_ref->parent_id();
while (parent_id) {
auto parent_ref = cs_table.FindById(*parent_id);
location_ids.Append(WriteLocationIfNeeded(
parent_ref->frame_id(), annotated
? annotations_.GetAnnotation(*parent_ref)
: CallsiteAnnotation::kNone));
parent_id = parent_ref->parent_id();
}
return location_ids;
}
uint64_t GProfileBuilder::WriteLocationIfNeeded(FrameId frame_id,
CallsiteAnnotation annotation) {
AnnotatedFrameId key{frame_id, annotation};
auto it = seen_locations_.find(key);
if (it != seen_locations_.end()) {
return it->second;
}
auto& frames = context_.storage->stack_profile_frame_table();
auto frame = *frames.FindById(key.frame_id);
const auto& mappings = context_.storage->stack_profile_mapping_table();
auto mapping = *mappings.FindById(frame.mapping());
uint64_t mapping_id = WriteMappingIfNeeded(mapping);
uint64_t& id =
locations_[Location{mapping_id, static_cast<uint64_t>(frame.rel_pc()),
GetLines(frame, key.annotation, mapping_id)}];
if (id == 0) {
id = locations_.size();
}
seen_locations_.insert({key, id});
return id;
}
uint64_t GProfileBuilder::WriteFakeLocationIfNeeded(const std::string& name) {
int64_t name_id = string_table_.InternString(base::StringView(name));
auto it = seen_fake_locations_.find(name_id);
if (it != seen_fake_locations_.end()) {
return it->second;
}
uint64_t& id =
locations_[Location{0, 0, {{WriteFakeFunctionIfNeeded(name_id), 0}}}];
if (id == 0) {
id = locations_.size();
}
seen_fake_locations_.insert({name_id, id});
return id;
}
void GProfileBuilder::WriteLocations() {
for (const auto& entry : locations_) {
auto* location = result_->add_location();
location->set_id(entry.second);
location->set_mapping_id(entry.first.mapping_id);
if (entry.first.mapping_id != 0) {
location->set_address(entry.first.rel_pc +
GetMapping(entry.first.mapping_id).memory_start);
}
for (const Line& line : entry.first.lines) {
auto* l = location->add_line();
l->set_function_id(line.function_id);
if (line.line != 0) {
l->set_line(line.line);
}
}
}
}
std::vector<GProfileBuilder::Line> GProfileBuilder::GetLines(
const tables::StackProfileFrameTable::ConstRowReference& frame,
CallsiteAnnotation annotation,
uint64_t mapping_id) {
std::vector<Line> lines =
GetLinesForSymbolSetId(frame.symbol_set_id(), annotation, mapping_id);
if (!lines.empty()) {
return lines;
}
if (uint64_t function_id =
WriteFunctionIfNeeded(frame, annotation, mapping_id);
function_id != kNullFunctionId) {
lines.push_back({function_id, 0});
}
return lines;
}
std::vector<GProfileBuilder::Line> GProfileBuilder::GetLinesForSymbolSetId(
std::optional<uint32_t> symbol_set_id,
CallsiteAnnotation annotation,
uint64_t mapping_id) {
if (!symbol_set_id) {
return {};
}
auto& symbols = context_.storage->symbol_table();
using RowRef =
perfetto::trace_processor::tables::SymbolTable::ConstRowReference;
std::vector<RowRef> symbol_set;
for (auto it = symbols.FilterToIterator(
{symbols.symbol_set_id().eq(*symbol_set_id)});
it; ++it) {
symbol_set.push_back(it.row_reference());
}
std::sort(symbol_set.begin(), symbol_set.end(),
[](const RowRef& a, const RowRef& b) { return a.id() < b.id(); });
std::vector<GProfileBuilder::Line> lines;
for (const RowRef& symbol : symbol_set) {
if (uint64_t function_id =
WriteFunctionIfNeeded(symbol, annotation, mapping_id);
function_id != kNullFunctionId) {
lines.push_back({function_id, symbol.line_number()});
}
}
GetMapping(mapping_id).debug_info.has_inline_frames = true;
GetMapping(mapping_id).debug_info.has_line_numbers = true;
return lines;
}
uint64_t GProfileBuilder::WriteFakeFunctionIfNeeded(int64_t name_id) {
auto ins = functions_.insert(
{Function{name_id, kEmptyStringIndex, kEmptyStringIndex},
functions_.size() + 1});
return ins.first->second;
}
uint64_t GProfileBuilder::WriteFunctionIfNeeded(
const tables::SymbolTable::ConstRowReference& symbol,
CallsiteAnnotation annotation,
uint64_t mapping_id) {
int64_t name = string_table_.GetAnnotatedString(symbol.name(), annotation);
int64_t filename = string_table_.InternString(symbol.source_file());
auto ins = functions_.insert(
{Function{name, kEmptyStringIndex, filename}, functions_.size() + 1});
uint64_t id = ins.first->second;
if (ins.second) {
if (name != kEmptyStringIndex) {
GetMapping(mapping_id).debug_info.has_functions = true;
}
if (filename != kEmptyStringIndex) {
GetMapping(mapping_id).debug_info.has_filenames = true;
}
}
return id;
}
int64_t GProfileBuilder::GetNameForFrame(
const tables::StackProfileFrameTable::ConstRowReference& frame,
CallsiteAnnotation annotation) {
NullTermStringView system_name = context_.storage->GetString(frame.name());
int64_t name = kEmptyStringIndex;
if (frame.deobfuscated_name()) {
name = string_table_.GetAnnotatedString(*frame.deobfuscated_name(),
annotation);
} else if (!system_name.empty()) {
std::unique_ptr<char, base::FreeDeleter> demangled =
demangle::Demangle(system_name.c_str());
if (demangled) {
name = string_table_.GetAnnotatedString(demangled.get(), annotation);
} else {
// demangling failed, expected if the name wasn't mangled. In any case
// reuse the system_name as this is what UI will usually display.
name = string_table_.GetAnnotatedString(frame.name(), annotation);
}
}
return name;
}
int64_t GProfileBuilder::GetSystemNameForFrame(
const tables::StackProfileFrameTable::ConstRowReference& frame) {
return string_table_.InternString(frame.name());
}
uint64_t GProfileBuilder::WriteFunctionIfNeeded(
const tables::StackProfileFrameTable::ConstRowReference& frame,
CallsiteAnnotation annotation,
uint64_t mapping_id) {
AnnotatedFrameId key{frame.id(), annotation};
auto it = seen_functions_.find(key);
if (it != seen_functions_.end()) {
return it->second;
}
auto ins = functions_.insert(
{Function{GetNameForFrame(frame, annotation),
GetSystemNameForFrame(frame), kEmptyStringIndex},
functions_.size() + 1});
uint64_t id = ins.first->second;
seen_functions_.insert({key, id});
if (ins.second && (ins.first->first.name != kEmptyStringIndex ||
ins.first->first.system_name != kEmptyStringIndex)) {
GetMapping(mapping_id).debug_info.has_functions = true;
}
return id;
}
void GProfileBuilder::WriteFunctions() {
for (const auto& entry : functions_) {
if (entry.second == kNullFunctionId) {
continue;
}
auto* func = result_->add_function();
func->set_id(entry.second);
if (entry.first.name != 0) {
func->set_name(entry.first.name);
}
if (entry.first.system_name != 0) {
func->set_system_name(entry.first.system_name);
}
if (entry.first.filename != 0) {
func->set_filename(entry.first.filename);
}
}
}
uint64_t GProfileBuilder::WriteMappingIfNeeded(
const tables::StackProfileMappingTable::ConstRowReference& mapping_ref) {
auto it = seen_mappings_.find(mapping_ref.id());
if (it != seen_mappings_.end()) {
return it->second;
}
auto ins = mapping_keys_.insert(
{MappingKey(mapping_ref, string_table_), mapping_keys_.size() + 1});
if (ins.second) {
mappings_.push_back(
Mapping(mapping_ref, context_.storage->string_pool(), string_table_));
}
return ins.first->second;
}
void GProfileBuilder::WriteMapping(uint64_t mapping_id) {
const Mapping& mapping = GetMapping(mapping_id);
auto m = result_->add_mapping();
m->set_id(mapping_id);
m->set_memory_start(mapping.memory_start);
m->set_memory_limit(mapping.memory_limit);
m->set_file_offset(mapping.file_offset);
m->set_filename(mapping.filename);
m->set_build_id(mapping.build_id);
m->set_has_functions(mapping.debug_info.has_functions);
m->set_has_filenames(mapping.debug_info.has_filenames);
m->set_has_line_numbers(mapping.debug_info.has_line_numbers);
m->set_has_inline_frames(mapping.debug_info.has_inline_frames);
}
void GProfileBuilder::WriteMappings() {
// The convention in pprof files is to write the mapping for the main
// binary first. So lets do just that.
std::optional<uint64_t> main_mapping_id = GuessMainBinary();
if (main_mapping_id) {
WriteMapping(*main_mapping_id);
}
for (size_t i = 0; i < mappings_.size(); ++i) {
uint64_t mapping_id = i + 1;
if (main_mapping_id && *main_mapping_id == mapping_id) {
continue;
}
WriteMapping(mapping_id);
}
}
std::optional<uint64_t> GProfileBuilder::GuessMainBinary() const {
std::vector<int64_t> mapping_scores;
for (const auto& mapping : mappings_) {
mapping_scores.push_back(mapping.ComputeMainBinaryScore());
}
auto it = std::max_element(mapping_scores.begin(), mapping_scores.end());
if (it == mapping_scores.end()) {
return std::nullopt;
}
return static_cast<uint64_t>(std::distance(mapping_scores.begin(), it) + 1);
}
} // namespace trace_processor
} // namespace perfetto