src/profiling/perf/perf_producer.cc - third_party/perfetto - Git at Google

 /*
  * Copyright (C) 2019 The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 #include "src/profiling/perf/perf_producer.h"

 #include <utility>

 #include <unistd.h>

 #include <unwindstack/Error.h>
 #include <unwindstack/Unwinder.h>

 #include "perfetto/base/logging.h"
 #include "perfetto/base/task_runner.h"
 #include "perfetto/ext/base/metatrace.h"
 #include "perfetto/ext/base/weak_ptr.h"
 #include "perfetto/ext/tracing/core/basic_types.h"
 #include "perfetto/ext/tracing/core/producer.h"
 #include "perfetto/ext/tracing/core/tracing_service.h"
 #include "perfetto/ext/tracing/ipc/producer_ipc_client.h"
 #include "perfetto/tracing/core/data_source_config.h"
 #include "perfetto/tracing/core/data_source_descriptor.h"
 #include "src/profiling/common/callstack_trie.h"
 #include "src/profiling/common/proc_utils.h"
 #include "src/profiling/common/unwind_support.h"
 #include "src/profiling/perf/common_types.h"
 #include "src/profiling/perf/event_reader.h"

 #include "protos/perfetto/config/profiling/perf_event_config.pbzero.h"
 #include "protos/perfetto/trace/profiling/profile_packet.pbzero.h"
 #include "protos/perfetto/trace/trace_packet.pbzero.h"

 namespace perfetto {
 namespace profiling {
 namespace {

 constexpr uint32_t kReadTickPeriodMs = 200;
 // TODO(rsavitski): this is better calculated (at setup) from the buffer and
 // sample sizes.
 constexpr size_t kMaxSamplesPerCpuPerReadTick = 64;
 // TODO(rsavitski): make this part of the config (for slow test platforms).
 constexpr uint32_t kProcDescriptorTimeoutMs = 400;

 constexpr uint32_t kInitialConnectionBackoffMs = 100;
 constexpr uint32_t kMaxConnectionBackoffMs = 30 * 1000;

 constexpr char kProducerName[] = "perfetto.traced_perf";
 constexpr char kDataSourceName[] = "linux.perf";

 size_t NumberOfCpus() {
   return static_cast<size_t>(sysconf(_SC_NPROCESSORS_CONF));
 }

 uint64_t NowMs() {
   return static_cast<uint64_t>(base::GetWallTimeMs().count());
 }

 protos::pbzero::Profiling::CpuMode ToCpuModeEnum(uint16_t perf_cpu_mode) {
   using Profiling = protos::pbzero::Profiling;
   switch (perf_cpu_mode) {
     case PERF_RECORD_MISC_KERNEL:
       return Profiling::MODE_KERNEL;
     case PERF_RECORD_MISC_USER:
       return Profiling::MODE_USER;
     case PERF_RECORD_MISC_HYPERVISOR:
       return Profiling::MODE_HYPERVISOR;
     case PERF_RECORD_MISC_GUEST_KERNEL:
       return Profiling::MODE_GUEST_KERNEL;
     case PERF_RECORD_MISC_GUEST_USER:
       return Profiling::MODE_GUEST_USER;
     default:
       return Profiling::MODE_UNKNOWN;
   }
 }

 protos::pbzero::Profiling::StackUnwindError ToProtoEnum(
     unwindstack::ErrorCode error_code) {
   using Profiling = protos::pbzero::Profiling;
   switch (error_code) {
     case unwindstack::ERROR_NONE:
       return Profiling::UNWIND_ERROR_NONE;
     case unwindstack::ERROR_MEMORY_INVALID:
       return Profiling::UNWIND_ERROR_MEMORY_INVALID;
     case unwindstack::ERROR_UNWIND_INFO:
       return Profiling::UNWIND_ERROR_UNWIND_INFO;
     case unwindstack::ERROR_UNSUPPORTED:
       return Profiling::UNWIND_ERROR_UNSUPPORTED;
     case unwindstack::ERROR_INVALID_MAP:
       return Profiling::UNWIND_ERROR_INVALID_MAP;
     case unwindstack::ERROR_MAX_FRAMES_EXCEEDED:
       return Profiling::UNWIND_ERROR_MAX_FRAMES_EXCEEDED;
     case unwindstack::ERROR_REPEATED_FRAME:
       return Profiling::UNWIND_ERROR_REPEATED_FRAME;
     case unwindstack::ERROR_INVALID_ELF:
       return Profiling::UNWIND_ERROR_INVALID_ELF;
   }
   return Profiling::UNWIND_ERROR_UNKNOWN;
 }

 bool ShouldRejectDueToFilter(pid_t pid, const TargetFilter& filter) {
   bool reject_cmd = false;
   std::string cmdline;
   if (GetCmdlineForPID(pid, &cmdline)) {  // normalized form
     // reject if absent from non-empty whitelist, or present in blacklist
     reject_cmd = (filter.cmdlines.size() && !filter.cmdlines.count(cmdline)) ||
                  filter.exclude_cmdlines.count(cmdline);
   } else {
     PERFETTO_LOG("Failed to look up cmdline for pid [%d]",
                  static_cast<int>(pid));
     // reject only if there's a whitelist present
     reject_cmd = filter.cmdlines.size() > 0;
   }

   bool reject_pid = (filter.pids.size() && !filter.pids.count(pid)) ||
                     filter.exclude_pids.count(pid);

   if (reject_cmd || reject_pid) {
     PERFETTO_DLOG(
         "Rejecting samples for pid [%d] due to cmdline(%d) or pid(%d)",
         static_cast<int>(pid), reject_cmd, reject_pid);

     return true;
   }
   return false;
 }

 }  // namespace

 PerfProducer::PerfProducer(ProcDescriptorGetter* proc_fd_getter,
                            base::TaskRunner* task_runner)
     : task_runner_(task_runner),
       proc_fd_getter_(proc_fd_getter),
       unwinding_worker_(this),
       weak_factory_(this) {
   proc_fd_getter->SetDelegate(this);
 }

 // TODO(rsavitski): consider configure at setup + enable at start instead.
 void PerfProducer::SetupDataSource(DataSourceInstanceID,
                                    const DataSourceConfig&) {}

 void PerfProducer::StartDataSource(DataSourceInstanceID instance_id,
                                    const DataSourceConfig& config) {
   PERFETTO_LOG("StartDataSource(%zu, %s)", static_cast<size_t>(instance_id),
                config.name().c_str());

   if (config.name() == MetatraceWriter::kDataSourceName) {
     StartMetatraceSource(instance_id,
                          static_cast<BufferID>(config.target_buffer()));
     return;
   }

   // linux.perf data source
   if (config.name() != kDataSourceName)
     return;

   base::Optional<EventConfig> event_config = EventConfig::Create(config);
   if (!event_config.has_value()) {
     PERFETTO_ELOG("PerfEventConfig rejected.");
     return;
   }

   // TODO(rsavitski): consider supporting specific cpu subsets.
   if (!event_config->target_all_cpus()) {
     PERFETTO_ELOG("PerfEventConfig{all_cpus} required");
     return;
   }
   size_t num_cpus = NumberOfCpus();
   std::vector<EventReader> per_cpu_readers;
   for (uint32_t cpu = 0; cpu < num_cpus; cpu++) {
     base::Optional<EventReader> event_reader =
         EventReader::ConfigureEvents(cpu, event_config.value());
     if (!event_reader.has_value()) {
       PERFETTO_ELOG("Failed to set up perf events for cpu%" PRIu32
                     ", discarding data source.",
                     cpu);
       return;
     }
     per_cpu_readers.emplace_back(std::move(event_reader.value()));
   }

   auto buffer_id = static_cast<BufferID>(config.target_buffer());
   auto writer = endpoint_->CreateTraceWriter(buffer_id);

   // Construct the data source instance.
   std::map<DataSourceInstanceID, DataSourceState>::iterator ds_it;
   bool inserted;
   std::tie(ds_it, inserted) = data_sources_.emplace(
       std::piecewise_construct, std::forward_as_tuple(instance_id),
       std::forward_as_tuple(event_config.value(), std::move(writer),
                             std::move(per_cpu_readers)));
   PERFETTO_CHECK(inserted);

   // Write out a packet to initialize the incremental state for this sequence.
   InterningOutputTracker::WriteFixedInterningsPacket(
       ds_it->second.trace_writer.get());

   // Inform unwinder of the new data source instance.
   unwinding_worker_->PostStartDataSource(instance_id);

   // Kick off periodic read task.
   auto weak_this = weak_factory_.GetWeakPtr();
   task_runner_->PostDelayedTask(
       [weak_this, instance_id] {
         if (weak_this)
           weak_this->TickDataSourceRead(instance_id);
       },
       kReadTickPeriodMs - (NowMs() % kReadTickPeriodMs));
 }

 void PerfProducer::StopDataSource(DataSourceInstanceID instance_id) {
   PERFETTO_LOG("StopDataSource(%zu)", static_cast<size_t>(instance_id));

   // Metatrace: stop immediately (will miss the events from the
   // asynchronous shutdown of the primary data source).
   auto meta_it = metatrace_writers_.find(instance_id);
   if (meta_it != metatrace_writers_.end()) {
     meta_it->second.WriteAllAndFlushTraceWriter([] {});
     metatrace_writers_.erase(meta_it);
     return;
   }

   auto ds_it = data_sources_.find(instance_id);
   if (ds_it == data_sources_.end())
     return;

   // Start shutting down the reading frontend, which will propagate the stop
   // further as the intermediate buffers are cleared.
   DataSourceState& ds = ds_it->second;
   InitiateReaderStop(&ds);
 }

 // The perf data sources ignore flush requests, as flushing would be
 // unnecessarily complicated given out-of-order unwinding and proc-fd timeouts.
 // Instead of responding to explicit flushes, we can ensure that we're otherwise
 // well-behaved (do not reorder packets too much), and let the service scrape
 // the SMB.
 void PerfProducer::Flush(FlushRequestID flush_id,
                          const DataSourceInstanceID* data_source_ids,
                          size_t num_data_sources) {
   bool should_ack_flush = false;
   for (size_t i = 0; i < num_data_sources; i++) {
     auto ds_id = data_source_ids[i];
     PERFETTO_DLOG("Flush(%zu)", static_cast<size_t>(ds_id));

     auto meta_it = metatrace_writers_.find(ds_id);
     if (meta_it != metatrace_writers_.end()) {
       meta_it->second.WriteAllAndFlushTraceWriter([] {});
       should_ack_flush = true;
     }
     if (data_sources_.find(ds_id) != data_sources_.end()) {
       should_ack_flush = true;
     }
   }
   if (should_ack_flush)
     endpoint_->NotifyFlushComplete(flush_id);
 }

 void PerfProducer::TickDataSourceRead(DataSourceInstanceID ds_id) {
   auto it = data_sources_.find(ds_id);
   if (it == data_sources_.end()) {
     PERFETTO_DLOG("TickDataSourceRead(%zu): source gone",
                   static_cast<size_t>(ds_id));
     return;
   }
   DataSourceState& ds = it->second;

   PERFETTO_METATRACE_SCOPED(TAG_PRODUCER, PROFILER_READ_TICK);

   // Make a pass over all per-cpu readers.
   bool more_records_available = false;
   for (EventReader& reader : ds.per_cpu_readers) {
     if (ReadAndParsePerCpuBuffer(&reader, kMaxSamplesPerCpuPerReadTick, ds_id,
                                  &ds)) {
       more_records_available = true;
     }
   }

   // Wake up the unwinder as we've (likely) pushed samples into its queue.
   unwinding_worker_->PostProcessQueue();

   if (PERFETTO_UNLIKELY(ds.status == DataSourceState::Status::kShuttingDown) &&
       !more_records_available) {
     unwinding_worker_->PostInitiateDataSourceStop(ds_id);
   } else {
     // otherwise, keep reading
     auto weak_this = weak_factory_.GetWeakPtr();
     task_runner_->PostDelayedTask(
         [weak_this, ds_id] {
           if (weak_this)
             weak_this->TickDataSourceRead(ds_id);
         },
         kReadTickPeriodMs - (NowMs() % kReadTickPeriodMs));
   }
 }

 bool PerfProducer::ReadAndParsePerCpuBuffer(EventReader* reader,
                                             size_t max_samples,
                                             DataSourceInstanceID ds_id,
                                             DataSourceState* ds) {
   PERFETTO_METATRACE_SCOPED(TAG_PRODUCER, PROFILER_READ_CPU);

   // If the kernel ring buffer dropped data, record it in the trace.
   size_t cpu = reader->cpu();
   auto records_lost_callback = [this, ds_id, cpu](uint64_t records_lost) {
     auto weak_this = weak_factory_.GetWeakPtr();
     task_runner_->PostTask([weak_this, ds_id, cpu, records_lost] {
       if (weak_this)
         weak_this->EmitRingBufferLoss(ds_id, cpu, records_lost);
     });
   };

   for (size_t i = 0; i < max_samples; i++) {
     base::Optional<ParsedSample> sample =
         reader->ReadUntilSample(records_lost_callback);
     if (!sample) {
       return false;  // caught up to the writer
     }

     if (!sample->regs) {
       continue;  // skip kernel threads/workers
     }

     // Request proc-fds for the process if this is the first time we see it.
     pid_t pid = sample->pid;
     auto& process_state = ds->process_states[pid];  // insert if new

     if (process_state == ProcessTrackingStatus::kExpired) {
       PERFETTO_DLOG("Skipping sample for previously expired pid [%d]",
                     static_cast<int>(pid));
       PostEmitSkippedSample(ds_id, ProfilerStage::kRead,
                             std::move(sample.value()));
       continue;
     }

     // Previously failed the target filter check.
     if (process_state == ProcessTrackingStatus::kRejected) {
       PERFETTO_DLOG("Skipping sample for pid [%d] due to target filter",
                     static_cast<int>(pid));
       continue;
     }

     // Seeing pid for the first time.
     if (process_state == ProcessTrackingStatus::kInitial) {
       PERFETTO_DLOG("New pid: [%d]", static_cast<int>(pid));

       // Check whether samples for this new process should be
       // dropped due to the target whitelist/blacklist.
       const TargetFilter& filter = ds->event_cfg.filter();
       if (ShouldRejectDueToFilter(pid, filter)) {
         process_state = ProcessTrackingStatus::kRejected;
         continue;
       }

       // At this point, sampled process is known to be of interest, so start
       // resolving the proc-fds.
       process_state = ProcessTrackingStatus::kResolving;
       proc_fd_getter_->GetDescriptorsForPid(pid);  // response is async
       PostDescriptorLookupTimeout(ds_id, pid, kProcDescriptorTimeoutMs);
     }

     PERFETTO_CHECK(process_state == ProcessTrackingStatus::kResolved ||
                    process_state == ProcessTrackingStatus::kResolving);

     // Push the sample into the unwinding queue if there is room.
     // TODO(rsavitski): this can silently drop entries. We should either record
     // them (e.g. using |PostEmitSkippedSample|), or rearchitect the kernel
     // buffer reading s.t. we can retain the blocked samples (putting
     // back-pressure on the kernel ring buffer instead).
     auto& queue = unwinding_worker_->unwind_queue();
     WriteView write_view = queue.BeginWrite();
     if (write_view.valid) {
       queue.at(write_view.write_pos) =
           UnwindEntry{ds_id, std::move(sample.value())};
       queue.CommitWrite();
     }
   }

   // Most likely more events in the kernel buffer. Though we might be exactly on
   // the boundary due to |max_samples|.
   return true;
 }

 // Note: first-fit makes descriptor request fulfillment not true FIFO. But the
 // edge-cases where it matters are very unlikely.
 void PerfProducer::OnProcDescriptors(pid_t pid,
                                      base::ScopedFile maps_fd,
                                      base::ScopedFile mem_fd) {
   // Find first fit data source that is waiting on descriptors for the process.
   for (auto& it : data_sources_) {
     DataSourceState& ds = it.second;
     auto proc_status_it = ds.process_states.find(pid);
     if (proc_status_it != ds.process_states.end() &&
         proc_status_it->second == ProcessTrackingStatus::kResolving) {
       PERFETTO_DLOG("Handing off proc-fds for pid [%d] to DS [%zu]",
                     static_cast<int>(pid), static_cast<size_t>(it.first));

       proc_status_it->second = ProcessTrackingStatus::kResolved;
       unwinding_worker_->PostAdoptProcDescriptors(
           it.first, pid, std::move(maps_fd), std::move(mem_fd));
       return;  // done
     }
   }
   PERFETTO_DLOG(
       "Discarding proc-fds for pid [%d] as found no outstanding requests.",
       static_cast<int>(pid));
 }

 void PerfProducer::PostDescriptorLookupTimeout(DataSourceInstanceID ds_id,
                                                pid_t pid,
                                                uint32_t timeout_ms) {
   auto weak_this = weak_factory_.GetWeakPtr();
   task_runner_->PostDelayedTask(
       [weak_this, ds_id, pid] {
         if (weak_this)
           weak_this->DescriptorLookupTimeout(ds_id, pid);
       },
       timeout_ms);
 }

 void PerfProducer::DescriptorLookupTimeout(DataSourceInstanceID ds_id,
                                            pid_t pid) {
   auto ds_it = data_sources_.find(ds_id);
   if (ds_it == data_sources_.end())
     return;

   // If the request is still outstanding, poison the pid for this source.
   DataSourceState& ds = ds_it->second;
   auto proc_status_it = ds.process_states.find(pid);
   if (proc_status_it != ds.process_states.end() &&
       proc_status_it->second == ProcessTrackingStatus::kResolving) {
     PERFETTO_DLOG("Descriptor lookup timeout of pid [%d] for DS [%zu]",
                   static_cast<int>(pid), static_cast<size_t>(ds_it->first));

     proc_status_it->second = ProcessTrackingStatus::kExpired;
     // Also inform the unwinder of the state change (so that it can discard any
     // of the already-enqueued samples).
     unwinding_worker_->PostRecordTimedOutProcDescriptors(ds_id, pid);
   }
 }

 void PerfProducer::PostEmitSample(DataSourceInstanceID ds_id,
                                   CompletedSample sample) {
   // hack: c++11 lambdas can't be moved into, so stash the sample on the heap.
   CompletedSample* raw_sample = new CompletedSample(std::move(sample));
   auto weak_this = weak_factory_.GetWeakPtr();
   task_runner_->PostTask([weak_this, ds_id, raw_sample] {
     if (weak_this)
       weak_this->EmitSample(ds_id, std::move(*raw_sample));
     delete raw_sample;
   });
 }

 void PerfProducer::EmitSample(DataSourceInstanceID ds_id,
                               CompletedSample sample) {
   auto ds_it = data_sources_.find(ds_id);
   PERFETTO_CHECK(ds_it != data_sources_.end());
   DataSourceState& ds = ds_it->second;

   // intern callsite
   GlobalCallstackTrie::Node* callstack_root =
       callstack_trie_.CreateCallsite(sample.frames);
   uint64_t callstack_iid = callstack_root->id();

   // start packet
   auto packet = ds.trace_writer->NewTracePacket();
   packet->set_timestamp(sample.timestamp);

   // write new interning data (if any)
   protos::pbzero::InternedData* interned_out = packet->set_interned_data();
   ds.interning_output.WriteCallstack(callstack_root, &callstack_trie_,
                                      interned_out);

   // write the sample itself
   auto* perf_sample = packet->set_perf_sample();
   perf_sample->set_cpu(sample.cpu);
   perf_sample->set_pid(static_cast<uint32_t>(sample.pid));
   perf_sample->set_tid(static_cast<uint32_t>(sample.tid));
   perf_sample->set_cpu_mode(ToCpuModeEnum(sample.cpu_mode));
   perf_sample->set_callstack_iid(callstack_iid);
   if (sample.unwind_error != unwindstack::ERROR_NONE) {
     perf_sample->set_unwind_error(ToProtoEnum(sample.unwind_error));
   }
 }

 void PerfProducer::EmitRingBufferLoss(DataSourceInstanceID ds_id,
                                       size_t cpu,
                                       uint64_t records_lost) {
   auto ds_it = data_sources_.find(ds_id);
   PERFETTO_CHECK(ds_it != data_sources_.end());
   DataSourceState& ds = ds_it->second;
   PERFETTO_DLOG("DataSource(%zu): cpu%zu lost [%" PRIu64 "] records",
                 static_cast<size_t>(ds_id), cpu, records_lost);

   // The data loss record relates to a single ring buffer, and indicates loss
   // since the last successfully-written record in that buffer. Therefore the
   // data loss record itself has no timestamp.
   // We timestamp the packet with the boot clock for packet ordering purposes,
   // but it no longer has a (precise) interpretation relative to the sample
   // stream from that per-cpu buffer. See the proto comments for more details.
   auto packet = ds.trace_writer->NewTracePacket();
   packet->set_timestamp(static_cast<uint64_t>(base::GetBootTimeNs().count()));

   auto* perf_sample = packet->set_perf_sample();
   perf_sample->set_cpu(static_cast<uint32_t>(cpu));
   perf_sample->set_kernel_records_lost(records_lost);
 }

 void PerfProducer::PostEmitSkippedSample(DataSourceInstanceID ds_id,
                                          ProfilerStage stage,
                                          ParsedSample sample) {
   // hack: c++11 lambdas can't be moved into, so stash the sample on the heap.
   ParsedSample* raw_sample = new ParsedSample(std::move(sample));
   auto weak_this = weak_factory_.GetWeakPtr();
   task_runner_->PostTask([weak_this, ds_id, stage, raw_sample] {
     if (weak_this)
       weak_this->EmitSkippedSample(ds_id, stage, std::move(*raw_sample));
     delete raw_sample;
   });
 }

 void PerfProducer::EmitSkippedSample(DataSourceInstanceID ds_id,
                                      ProfilerStage stage,
                                      ParsedSample sample) {
   auto ds_it = data_sources_.find(ds_id);
   PERFETTO_CHECK(ds_it != data_sources_.end());
   DataSourceState& ds = ds_it->second;

   auto packet = ds.trace_writer->NewTracePacket();
   packet->set_timestamp(sample.timestamp);
   auto* perf_sample = packet->set_perf_sample();
   perf_sample->set_cpu(sample.cpu);
   perf_sample->set_pid(static_cast<uint32_t>(sample.pid));
   perf_sample->set_tid(static_cast<uint32_t>(sample.tid));
   perf_sample->set_cpu_mode(ToCpuModeEnum(sample.cpu_mode));

   using PerfSample = protos::pbzero::PerfSample;
   switch (stage) {
     case ProfilerStage::kRead:
       perf_sample->set_sample_skipped_reason(PerfSample::PROFILER_STAGE_READ);
       break;
     case ProfilerStage::kUnwind:
       perf_sample->set_sample_skipped_reason(PerfSample::PROFILER_STAGE_UNWIND);
       break;
   }
 }

 void PerfProducer::InitiateReaderStop(DataSourceState* ds) {
   PERFETTO_DLOG("InitiateReaderStop");
   PERFETTO_CHECK(ds->status != DataSourceState::Status::kShuttingDown);

   ds->status = DataSourceState::Status::kShuttingDown;
   for (auto& event_reader : ds->per_cpu_readers) {
     event_reader.PauseEvents();
   }
 }

 void PerfProducer::PostFinishDataSourceStop(DataSourceInstanceID ds_id) {
   auto weak_producer = weak_factory_.GetWeakPtr();
   task_runner_->PostTask([weak_producer, ds_id] {
     if (weak_producer)
       weak_producer->FinishDataSourceStop(ds_id);
   });
 }

 void PerfProducer::FinishDataSourceStop(DataSourceInstanceID ds_id) {
   PERFETTO_LOG("FinishDataSourceStop(%zu)", static_cast<size_t>(ds_id));
   auto ds_it = data_sources_.find(ds_id);
   PERFETTO_CHECK(ds_it != data_sources_.end());
   DataSourceState& ds = ds_it->second;
   PERFETTO_CHECK(ds.status == DataSourceState::Status::kShuttingDown);

   ds.trace_writer->Flush();
   data_sources_.erase(ds_it);

   endpoint_->NotifyDataSourceStopped(ds_id);

   // Clean up resources if there are no more active sources.
   if (data_sources_.empty()) {
     callstack_trie_.ClearTrie();  // purge internings
   }
 }

 void PerfProducer::StartMetatraceSource(DataSourceInstanceID ds_id,
                                         BufferID target_buffer) {
   auto writer = endpoint_->CreateTraceWriter(target_buffer);

   auto it_and_inserted = metatrace_writers_.emplace(
       std::piecewise_construct, std::make_tuple(ds_id), std::make_tuple());
   PERFETTO_DCHECK(it_and_inserted.second);
   // Note: only the first concurrent writer will actually be active.
   metatrace_writers_[ds_id].Enable(task_runner_, std::move(writer),
                                    metatrace::TAG_ANY);
 }

 void PerfProducer::ConnectWithRetries(const char* socket_name) {
   PERFETTO_DCHECK(state_ == kNotStarted);
   state_ = kNotConnected;

   ResetConnectionBackoff();
   producer_socket_name_ = socket_name;
   ConnectService();
 }

 void PerfProducer::ConnectService() {
   PERFETTO_DCHECK(state_ == kNotConnected);
   state_ = kConnecting;
   endpoint_ = ProducerIPCClient::Connect(
       producer_socket_name_, this, kProducerName, task_runner_,
       TracingService::ProducerSMBScrapingMode::kEnabled);
 }

 void PerfProducer::IncreaseConnectionBackoff() {
   connection_backoff_ms_ *= 2;
   if (connection_backoff_ms_ > kMaxConnectionBackoffMs)
     connection_backoff_ms_ = kMaxConnectionBackoffMs;
 }

 void PerfProducer::ResetConnectionBackoff() {
   connection_backoff_ms_ = kInitialConnectionBackoffMs;
 }

 void PerfProducer::OnConnect() {
   PERFETTO_DCHECK(state_ == kConnecting);
   state_ = kConnected;
   ResetConnectionBackoff();
   PERFETTO_LOG("Connected to the service");

   {
     // linux.perf
     DataSourceDescriptor desc;
     desc.set_name(kDataSourceName);
     desc.set_will_notify_on_stop(true);
     endpoint_->RegisterDataSource(desc);
   }
   {
     // metatrace
     DataSourceDescriptor desc;
     desc.set_name(MetatraceWriter::kDataSourceName);
     endpoint_->RegisterDataSource(desc);
   }
 }

 void PerfProducer::OnDisconnect() {
   PERFETTO_DCHECK(state_ == kConnected || state_ == kConnecting);
   PERFETTO_LOG("Disconnected from tracing service");

   auto weak_producer = weak_factory_.GetWeakPtr();
   if (state_ == kConnected)
     return task_runner_->PostTask([weak_producer] {
       if (weak_producer)
         weak_producer->Restart();
     });

   state_ = kNotConnected;
   IncreaseConnectionBackoff();
   task_runner_->PostDelayedTask(
       [weak_producer] {
         if (weak_producer)
           weak_producer->ConnectService();
       },
       connection_backoff_ms_);
 }

 void PerfProducer::Restart() {
   // We lost the connection with the tracing service. At this point we need
   // to reset all the data sources. Trying to handle that manually is going to
   // be error prone. What we do here is simply destroy the instance and
   // recreate it again.
   base::TaskRunner* task_runner = task_runner_;
   const char* socket_name = producer_socket_name_;
   ProcDescriptorGetter* proc_fd_getter = proc_fd_getter_;

   // Invoke destructor and then the constructor again.
   this->~PerfProducer();
   new (this) PerfProducer(proc_fd_getter, task_runner);

   ConnectWithRetries(socket_name);
 }

 }  // namespace profiling
 }  // namespace perfetto