blob: c309180e00d36b91560c01a1086b23b9f5e92daa [file] [log] [blame]
/*
 * Copyright (C) 2018 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
17#include "src/traced/probes/probes_producer.h"
18
19#include <stdio.h>
Anna Zappone4ea73c02018-03-09 16:01:21 +000020#include <sys/stat.h>
Primiano Tucci52526602018-03-29 22:53:10 +010021
22#include <algorithm>
Anna Zappone27ac99c2018-03-06 14:25:35 +000023#include <queue>
Isabelle Taylord404ea12018-02-19 17:28:01 +000024#include <string>
25
26#include "perfetto/base/logging.h"
Primiano Tuccifd8240d2018-08-01 09:34:54 +010027#include "perfetto/base/utils.h"
Hector Dearman0ff07c72018-03-15 09:54:46 +000028#include "perfetto/base/weak_ptr.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000029#include "perfetto/traced/traced.h"
30#include "perfetto/tracing/core/data_source_config.h"
31#include "perfetto/tracing/core/data_source_descriptor.h"
Hector Dearmana89cc572018-02-23 12:02:58 +000032#include "perfetto/tracing/core/ftrace_config.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000033#include "perfetto/tracing/core/trace_config.h"
34#include "perfetto/tracing/core/trace_packet.h"
Primiano Tuccic2eb5102018-05-15 10:40:01 +010035#include "perfetto/tracing/ipc/producer_ipc_client.h"
Anna Zappone2a6f9042018-03-14 13:26:07 +000036#include "src/traced/probes/filesystem/inode_file_data_source.h"
Primiano Tuccifd8240d2018-08-01 09:34:54 +010037#include "src/traced/probes/ftrace/ftrace_data_source.h"
38#include "src/traced/probes/probes_data_source.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000039
Anna Zappone27ac99c2018-03-06 14:25:35 +000040#include "perfetto/trace/filesystem/inode_file_map.pbzero.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000041#include "perfetto/trace/ftrace/ftrace_event_bundle.pbzero.h"
Hector Dearman3afb1e02018-04-27 16:46:52 +010042#include "perfetto/trace/ftrace/ftrace_stats.pbzero.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000043#include "perfetto/trace/trace_packet.pbzero.h"
44
45namespace perfetto {
namespace {

// Bounds, in milliseconds, of the delay between reconnection attempts.
// ResetConnectionBackoff() restores the initial value and
// IncreaseConnectionBackoff() doubles the delay up to the maximum.
constexpr uint32_t kInitialConnectionBackoffMs = 100;
constexpr uint32_t kMaxConnectionBackoffMs = 30 * 1000;

// Names of the data sources this producer registers in OnConnect() and
// matches against DataSourceConfig::name() in SetupDataSource().
constexpr char kFtraceSourceName[] = "linux.ftrace";
constexpr char kProcessStatsSourceName[] = "linux.process_stats";
constexpr char kInodeMapSourceName[] = "linux.inode_file_map";
constexpr char kSysStatsSourceName[] = "linux.sys_stats";

}  // namespace.
56
// State transition diagram:
//                    +----------------------------+
//                    v                            +
// NotStarted -> NotConnected -> Connecting -> Connected
//                    ^              +
//                    +--------------+
//
64
Primiano Tuccifd8240d2018-08-01 09:34:54 +010065ProbesProducer::ProbesProducer() : weak_factory_(this) {}
66ProbesProducer::~ProbesProducer() {
67 // The ftrace data sources must be deleted before the ftrace controller.
68 data_sources_.clear();
69 ftrace_.reset();
70}
Isabelle Taylord404ea12018-02-19 17:28:01 +000071
72void ProbesProducer::OnConnect() {
73 PERFETTO_DCHECK(state_ == kConnecting);
74 state_ = kConnected;
75 ResetConnectionBackoff();
76 PERFETTO_LOG("Connected to the service");
77
Primiano Tucci82a8bfd2018-09-19 11:33:04 +010078 {
79 DataSourceDescriptor desc;
80 desc.set_name(kFtraceSourceName);
81 endpoint_->RegisterDataSource(desc);
82 }
Isabelle Taylord404ea12018-02-19 17:28:01 +000083
Primiano Tucci82a8bfd2018-09-19 11:33:04 +010084 {
85 DataSourceDescriptor desc;
86 desc.set_name(kProcessStatsSourceName);
87 endpoint_->RegisterDataSource(desc);
88 }
Anna Zappone27ac99c2018-03-06 14:25:35 +000089
Primiano Tucci82a8bfd2018-09-19 11:33:04 +010090 {
91 DataSourceDescriptor desc;
92 desc.set_name(kInodeMapSourceName);
93 endpoint_->RegisterDataSource(desc);
94 }
95
96 {
97 DataSourceDescriptor desc;
98 desc.set_name(kSysStatsSourceName);
99 endpoint_->RegisterDataSource(desc);
100 }
Isabelle Taylord404ea12018-02-19 17:28:01 +0000101}
102
103void ProbesProducer::OnDisconnect() {
104 PERFETTO_DCHECK(state_ == kConnected || state_ == kConnecting);
Isabelle Taylord404ea12018-02-19 17:28:01 +0000105 PERFETTO_LOG("Disconnected from tracing service");
Primiano Tuccie56411c2018-03-30 01:15:02 +0100106 if (state_ == kConnected)
107 return task_runner_->PostTask([this] { this->Restart(); });
Isabelle Taylord404ea12018-02-19 17:28:01 +0000108
Primiano Tuccie56411c2018-03-30 01:15:02 +0100109 state_ = kNotConnected;
110 IncreaseConnectionBackoff();
Isabelle Taylord404ea12018-02-19 17:28:01 +0000111 task_runner_->PostDelayedTask([this] { this->Connect(); },
112 connection_backoff_ms_);
113}
114
Primiano Tuccie56411c2018-03-30 01:15:02 +0100115void ProbesProducer::Restart() {
116 // We lost the connection with the tracing service. At this point we need
117 // to reset all the data sources. Trying to handle that manually is going to
118 // be error prone. What we do here is simply desroying the instance and
119 // recreating it again.
120 // TODO(hjd): Add e2e test for this.
121
122 base::TaskRunner* task_runner = task_runner_;
123 const char* socket_name = socket_name_;
124
125 // Invoke destructor and then the constructor again.
126 this->~ProbesProducer();
127 new (this) ProbesProducer();
128
129 ConnectWithRetries(socket_name, task_runner);
130}
131
Primiano Tucci674076d2018-10-01 10:41:09 +0100132void ProbesProducer::SetupDataSource(DataSourceInstanceID instance_id,
Primiano Tucciafb72b52018-09-25 09:37:24 +0100133 const DataSourceConfig& config) {
Primiano Tucci674076d2018-10-01 10:41:09 +0100134 PERFETTO_DLOG("SetupDataSource(id=%" PRIu64 ", name=%s)", instance_id,
135 config.name().c_str());
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100136 PERFETTO_DCHECK(data_sources_.count(instance_id) == 0);
Primiano Tucci03de28f2018-08-01 11:29:46 +0100137 TracingSessionID session_id = config.tracing_session_id();
138 PERFETTO_CHECK(session_id > 0);
Hector Dearman0ff07c72018-03-15 09:54:46 +0000139
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100140 std::unique_ptr<ProbesDataSource> data_source;
Hector Dearman0ff07c72018-03-15 09:54:46 +0000141 if (config.name() == kFtraceSourceName) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100142 data_source = CreateFtraceDataSource(session_id, instance_id, config);
Hector Dearman0ff07c72018-03-15 09:54:46 +0000143 } else if (config.name() == kInodeMapSourceName) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100144 data_source = CreateInodeFileDataSource(session_id, instance_id, config);
Hector Dearman0ff07c72018-03-15 09:54:46 +0000145 } else if (config.name() == kProcessStatsSourceName) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100146 data_source = CreateProcessStatsDataSource(session_id, instance_id, config);
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100147 } else if (config.name() == kSysStatsSourceName) {
148 data_source = CreateSysStatsDataSource(session_id, instance_id, config);
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100149 }
150
151 if (!data_source) {
152 PERFETTO_ELOG("Failed to create data source '%s'", config.name().c_str());
Hector Dearman0ff07c72018-03-15 09:54:46 +0000153 return;
154 }
155
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100156 session_data_sources_.emplace(session_id, data_source.get());
157 data_sources_[instance_id] = std::move(data_source);
Primiano Tucci674076d2018-10-01 10:41:09 +0100158}
Hector Dearman0ff07c72018-03-15 09:54:46 +0000159
Primiano Tucci674076d2018-10-01 10:41:09 +0100160void ProbesProducer::StartDataSource(DataSourceInstanceID instance_id,
161 const DataSourceConfig& config) {
162 PERFETTO_DLOG("StartDataSource(id=%" PRIu64 ", name=%s)", instance_id,
163 config.name().c_str());
164 auto it = data_sources_.find(instance_id);
165 if (it == data_sources_.end()) {
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100166 // Can happen if SetupDataSource() failed (e.g. ftrace was busy).
Primiano Tucci674076d2018-10-01 10:41:09 +0100167 PERFETTO_ELOG("Data source id=%" PRIu64 " not found", instance_id);
168 return;
169 }
170 ProbesDataSource* data_source = it->second.get();
171 if (data_source->started)
172 return;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100173 if (config.trace_duration_ms() != 0) {
174 uint32_t timeout = 5000 + 2 * config.trace_duration_ms();
175 watchdogs_.emplace(
176 instance_id, base::Watchdog::GetInstance()->CreateFatalTimer(timeout));
Isabelle Taylord404ea12018-02-19 17:28:01 +0000177 }
Primiano Tucci674076d2018-10-01 10:41:09 +0100178 data_source->started = true;
179 data_source->Start();
Isabelle Taylord404ea12018-02-19 17:28:01 +0000180}
181
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100182std::unique_ptr<ProbesDataSource> ProbesProducer::CreateFtraceDataSource(
Hector Dearman0ff07c72018-03-15 09:54:46 +0000183 TracingSessionID session_id,
Isabelle Taylord404ea12018-02-19 17:28:01 +0000184 DataSourceInstanceID id,
Hector Dearman0ff07c72018-03-15 09:54:46 +0000185 const DataSourceConfig& config) {
Isabelle Taylord404ea12018-02-19 17:28:01 +0000186 // Don't retry if FtraceController::Create() failed once.
187 // This can legitimately happen on user builds where we cannot access the
188 // debug paths, e.g., because of SELinux rules.
189 if (ftrace_creation_failed_)
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100190 return nullptr;
Isabelle Taylord404ea12018-02-19 17:28:01 +0000191
192 // Lazily create on the first instance.
193 if (!ftrace_) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100194 ftrace_ = FtraceController::Create(task_runner_, this);
Isabelle Taylord404ea12018-02-19 17:28:01 +0000195
196 if (!ftrace_) {
197 PERFETTO_ELOG("Failed to create FtraceController");
198 ftrace_creation_failed_ = true;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100199 return nullptr;
Isabelle Taylord404ea12018-02-19 17:28:01 +0000200 }
201
202 ftrace_->DisableAllEvents();
203 ftrace_->ClearTrace();
204 }
205
Primiano Tucci674076d2018-10-01 10:41:09 +0100206 PERFETTO_LOG("Ftrace setup (id=%" PRIu64 ", target_buf=%" PRIu32 ")", id,
Hector Dearman0ff07c72018-03-15 09:54:46 +0000207 config.target_buffer());
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100208 const BufferID buffer_id = static_cast<BufferID>(config.target_buffer());
209 std::unique_ptr<FtraceDataSource> data_source(new FtraceDataSource(
210 ftrace_->GetWeakPtr(), session_id, config.ftrace_config(),
211 endpoint_->CreateTraceWriter(buffer_id)));
212 if (!ftrace_->AddDataSource(data_source.get())) {
213 PERFETTO_ELOG(
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100214 "Failed to setup tracing (too many concurrent sessions or ftrace is "
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100215 "already in use)");
216 return nullptr;
Hector Dearmanee3c49d2018-02-28 14:10:22 +0000217 }
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100218 return std::move(data_source);
Anna Zappone27ac99c2018-03-06 14:25:35 +0000219}
220
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100221std::unique_ptr<ProbesDataSource> ProbesProducer::CreateInodeFileDataSource(
Hector Dearman0ff07c72018-03-15 09:54:46 +0000222 TracingSessionID session_id,
Anna Zappone27ac99c2018-03-06 14:25:35 +0000223 DataSourceInstanceID id,
Primiano Tuccidae35652018-03-29 18:32:02 +0100224 DataSourceConfig source_config) {
Primiano Tucci674076d2018-10-01 10:41:09 +0100225 PERFETTO_LOG("Inode file map setup (id=%" PRIu64 ", target_buf=%" PRIu32 ")",
Anna Zappone27ac99c2018-03-06 14:25:35 +0000226 id, source_config.target_buffer());
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100227 auto buffer_id = static_cast<BufferID>(source_config.target_buffer());
Anna Zappone2a6f9042018-03-14 13:26:07 +0000228 if (system_inodes_.empty())
Hector Dearman7fabd702018-03-28 12:37:15 +0100229 CreateStaticDeviceToInodeMap("/system", &system_inodes_);
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100230 return std::unique_ptr<InodeFileDataSource>(new InodeFileDataSource(
231 std::move(source_config), task_runner_, session_id, &system_inodes_,
232 &cache_, endpoint_->CreateTraceWriter(buffer_id)));
Isabelle Taylord404ea12018-02-19 17:28:01 +0000233}
234
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100235std::unique_ptr<ProbesDataSource> ProbesProducer::CreateProcessStatsDataSource(
Hector Dearman0ff07c72018-03-15 09:54:46 +0000236 TracingSessionID session_id,
Hector Dearman77451692018-03-08 16:21:13 +0000237 DataSourceInstanceID id,
Hector Dearman0ff07c72018-03-15 09:54:46 +0000238 const DataSourceConfig& config) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100239 base::ignore_result(id);
240 auto buffer_id = static_cast<BufferID>(config.target_buffer());
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100241 return std::unique_ptr<ProcessStatsDataSource>(new ProcessStatsDataSource(
Primiano Tuccic9d4a8b2018-10-30 20:19:01 -0700242 task_runner_, session_id, endpoint_->CreateTraceWriter(buffer_id),
243 config));
Isabelle Taylord404ea12018-02-19 17:28:01 +0000244}
245
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100246std::unique_ptr<SysStatsDataSource> ProbesProducer::CreateSysStatsDataSource(
247 TracingSessionID session_id,
248 DataSourceInstanceID id,
249 const DataSourceConfig& config) {
250 base::ignore_result(id);
251 auto buffer_id = static_cast<BufferID>(config.target_buffer());
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100252 return std::unique_ptr<SysStatsDataSource>(
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100253 new SysStatsDataSource(task_runner_, session_id,
254 endpoint_->CreateTraceWriter(buffer_id), config));
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100255}
256
Primiano Tucciafb72b52018-09-25 09:37:24 +0100257void ProbesProducer::StopDataSource(DataSourceInstanceID id) {
Isabelle Taylord404ea12018-02-19 17:28:01 +0000258 PERFETTO_LOG("Producer stop (id=%" PRIu64 ")", id);
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100259 auto it = data_sources_.find(id);
260 if (it == data_sources_.end()) {
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100261 // Can happen if SetupDataSource() failed (e.g. ftrace was busy).
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100262 PERFETTO_ELOG("Cannot stop data source id=%" PRIu64 ", not found", id);
263 return;
264 }
265 ProbesDataSource* data_source = it->second.get();
266 TracingSessionID session_id = data_source->tracing_session_id;
267 auto range = session_data_sources_.equal_range(session_id);
268 for (auto kv = range.first; kv != range.second; kv++) {
269 if (kv->second != data_source)
270 continue;
271 session_data_sources_.erase(kv);
272 break;
273 }
274 data_sources_.erase(it);
Hector Dearman77451692018-03-08 16:21:13 +0000275 watchdogs_.erase(id);
Isabelle Taylord404ea12018-02-19 17:28:01 +0000276}
277
Primiano Tuccidca727d2018-04-04 11:31:55 +0200278void ProbesProducer::OnTracingSetup() {}
Isabelle Taylor69faa902018-03-21 15:42:03 +0000279
Primiano Tuccid52e6272018-04-06 19:06:53 +0200280void ProbesProducer::Flush(FlushRequestID flush_request_id,
281 const DataSourceInstanceID* data_source_ids,
282 size_t num_data_sources) {
283 for (size_t i = 0; i < num_data_sources; i++) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100284 auto it = data_sources_.find(data_source_ids[i]);
Primiano Tucci674076d2018-10-01 10:41:09 +0100285 if (it == data_sources_.end() || !it->second->started)
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100286 continue;
287 it->second->Flush();
Primiano Tuccid52e6272018-04-06 19:06:53 +0200288 }
289 endpoint_->NotifyFlushComplete(flush_request_id);
290}
291
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100292// This function is called by the FtraceController in batches, whenever it has
293// read one or more pages from one or more cpus and written that into the
294// userspace tracing buffer. If more than one ftrace data sources are active,
295// this call typically happens after writing for all session has been handled.
296void ProbesProducer::OnFtraceDataWrittenIntoDataSourceBuffers() {
297 TracingSessionID last_session_id = 0;
298 FtraceMetadata* metadata = nullptr;
299 InodeFileDataSource* inode_data_source = nullptr;
300 ProcessStatsDataSource* ps_data_source = nullptr;
301
302 // unordered_multimap guarantees that entries with the same key are contiguous
303 // in the iteration.
304 for (auto it = session_data_sources_.begin(); /* check below*/; it++) {
Primiano Tucci674076d2018-10-01 10:41:09 +0100305 // If this is the last iteration or the session id has changed,
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100306 // dispatch the metadata update to the linked data sources, if any.
307 if (it == session_data_sources_.end() || it->first != last_session_id) {
308 bool has_inodes = metadata && !metadata->inode_and_device.empty();
309 bool has_pids = metadata && !metadata->pids.empty();
310 if (has_inodes && inode_data_source)
311 inode_data_source->OnInodes(metadata->inode_and_device);
312 if (has_pids && ps_data_source)
313 ps_data_source->OnPids(metadata->pids);
314 if (metadata)
315 metadata->Clear();
316 metadata = nullptr;
317 inode_data_source = nullptr;
318 ps_data_source = nullptr;
319 if (it == session_data_sources_.end())
320 break;
321 last_session_id = it->first;
322 }
323 ProbesDataSource* ds = it->second;
Primiano Tucci674076d2018-10-01 10:41:09 +0100324 if (!ds->started)
325 continue;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100326 switch (ds->type_id) {
327 case FtraceDataSource::kTypeId:
328 metadata = static_cast<FtraceDataSource*>(ds)->mutable_metadata();
329 break;
330 case InodeFileDataSource::kTypeId:
331 inode_data_source = static_cast<InodeFileDataSource*>(ds);
332 break;
Primiano Tuccic9d4a8b2018-10-30 20:19:01 -0700333 case ProcessStatsDataSource::kTypeId: {
334 // A trace session might have declared more than one ps data source.
335 // In those cases we often use one for a full dump on startup (
336 // targeting a dedicated buffer) and another one for on-demand dumps
337 // targeting the main buffer.
338 // Only use the one that has on-demand dumps enabled, if any.
339 auto ps = static_cast<ProcessStatsDataSource*>(ds);
340 if (ps->on_demand_dumps_enabled())
341 ps_data_source = ps;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100342 break;
Primiano Tuccic9d4a8b2018-10-30 20:19:01 -0700343 }
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100344 case SysStatsDataSource::kTypeId:
345 break;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100346 default:
Florian Mayer6db99a92018-10-18 11:34:55 +0100347 PERFETTO_DFATAL("Invalid data source.");
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100348 } // switch (type_id)
349 } // for (session_data_sources_)
350}
351
Isabelle Taylord404ea12018-02-19 17:28:01 +0000352void ProbesProducer::ConnectWithRetries(const char* socket_name,
353 base::TaskRunner* task_runner) {
354 PERFETTO_DCHECK(state_ == kNotStarted);
355 state_ = kNotConnected;
356
357 ResetConnectionBackoff();
358 socket_name_ = socket_name;
359 task_runner_ = task_runner;
360 Connect();
361}
362
363void ProbesProducer::Connect() {
364 PERFETTO_DCHECK(state_ == kNotConnected);
365 state_ = kConnecting;
Isabelle Taylor86262cb2018-03-27 16:00:54 +0100366 endpoint_ = ProducerIPCClient::Connect(
Primiano Tucci578d7842018-03-29 15:27:05 +0100367 socket_name_, this, "perfetto.traced_probes", task_runner_);
Isabelle Taylord404ea12018-02-19 17:28:01 +0000368}
369
370void ProbesProducer::IncreaseConnectionBackoff() {
371 connection_backoff_ms_ *= 2;
372 if (connection_backoff_ms_ > kMaxConnectionBackoffMs)
373 connection_backoff_ms_ = kMaxConnectionBackoffMs;
374}
375
376void ProbesProducer::ResetConnectionBackoff() {
377 connection_backoff_ms_ = kInitialConnectionBackoffMs;
378}
379
Isabelle Taylord404ea12018-02-19 17:28:01 +0000380} // namespace perfetto