blob: 65c0890f6a54662af7792006d58834cf39183e71 [file] [log] [blame]
Isabelle Taylord404ea12018-02-19 17:28:01 +00001/*
2 * Copyright (C) 2018 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "src/traced/probes/probes_producer.h"
18
19#include <stdio.h>
Anna Zappone4ea73c02018-03-09 16:01:21 +000020#include <sys/stat.h>
Primiano Tucci52526602018-03-29 22:53:10 +010021
22#include <algorithm>
Anna Zappone27ac99c2018-03-06 14:25:35 +000023#include <queue>
Isabelle Taylord404ea12018-02-19 17:28:01 +000024#include <string>
25
26#include "perfetto/base/logging.h"
Primiano Tuccifd8240d2018-08-01 09:34:54 +010027#include "perfetto/base/utils.h"
Hector Dearman0ff07c72018-03-15 09:54:46 +000028#include "perfetto/base/weak_ptr.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000029#include "perfetto/traced/traced.h"
30#include "perfetto/tracing/core/data_source_config.h"
31#include "perfetto/tracing/core/data_source_descriptor.h"
Hector Dearmana89cc572018-02-23 12:02:58 +000032#include "perfetto/tracing/core/ftrace_config.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000033#include "perfetto/tracing/core/trace_config.h"
34#include "perfetto/tracing/core/trace_packet.h"
Primiano Tuccic2eb5102018-05-15 10:40:01 +010035#include "perfetto/tracing/ipc/producer_ipc_client.h"
Anna Zappone2a6f9042018-03-14 13:26:07 +000036#include "src/traced/probes/filesystem/inode_file_data_source.h"
Primiano Tuccifd8240d2018-08-01 09:34:54 +010037#include "src/traced/probes/ftrace/ftrace_data_source.h"
38#include "src/traced/probes/probes_data_source.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000039
Anna Zappone27ac99c2018-03-06 14:25:35 +000040#include "perfetto/trace/filesystem/inode_file_map.pbzero.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000041#include "perfetto/trace/ftrace/ftrace_event_bundle.pbzero.h"
Hector Dearman3afb1e02018-04-27 16:46:52 +010042#include "perfetto/trace/ftrace/ftrace_stats.pbzero.h"
Isabelle Taylord404ea12018-02-19 17:28:01 +000043#include "perfetto/trace/trace_packet.pbzero.h"
44
45namespace perfetto {
namespace {

// Bounds, in milliseconds, of the reconnection delay. The delay is reset to
// the initial value by ResetConnectionBackoff() and doubled, up to the max,
// by IncreaseConnectionBackoff().
constexpr uint32_t kInitialConnectionBackoffMs = 100;
constexpr uint32_t kMaxConnectionBackoffMs = 30 * 1000;

// Names of the data sources registered in OnConnect() and matched against
// DataSourceConfig::name() in SetupDataSource().
constexpr char kFtraceSourceName[] = "linux.ftrace";
constexpr char kProcessStatsSourceName[] = "linux.process_stats";
constexpr char kInodeMapSourceName[] = "linux.inode_file_map";
constexpr char kSysStatsSourceName[] = "linux.sys_stats";

}  // namespace.
56
// State transition diagram:
//                    +----------------------------+
//                    v                            +
// NotStarted -> NotConnected -> Connecting -> Connected
//                    ^              +
//                    +--------------+
//
64
Primiano Tuccifd8240d2018-08-01 09:34:54 +010065ProbesProducer::ProbesProducer() : weak_factory_(this) {}
66ProbesProducer::~ProbesProducer() {
67 // The ftrace data sources must be deleted before the ftrace controller.
68 data_sources_.clear();
69 ftrace_.reset();
70}
Isabelle Taylord404ea12018-02-19 17:28:01 +000071
72void ProbesProducer::OnConnect() {
73 PERFETTO_DCHECK(state_ == kConnecting);
74 state_ = kConnected;
75 ResetConnectionBackoff();
76 PERFETTO_LOG("Connected to the service");
77
Primiano Tucci82a8bfd2018-09-19 11:33:04 +010078 {
79 DataSourceDescriptor desc;
80 desc.set_name(kFtraceSourceName);
81 endpoint_->RegisterDataSource(desc);
82 }
Isabelle Taylord404ea12018-02-19 17:28:01 +000083
Primiano Tucci82a8bfd2018-09-19 11:33:04 +010084 {
85 DataSourceDescriptor desc;
86 desc.set_name(kProcessStatsSourceName);
87 endpoint_->RegisterDataSource(desc);
88 }
Anna Zappone27ac99c2018-03-06 14:25:35 +000089
Primiano Tucci82a8bfd2018-09-19 11:33:04 +010090 {
91 DataSourceDescriptor desc;
92 desc.set_name(kInodeMapSourceName);
93 endpoint_->RegisterDataSource(desc);
94 }
95
96 {
97 DataSourceDescriptor desc;
98 desc.set_name(kSysStatsSourceName);
99 endpoint_->RegisterDataSource(desc);
100 }
Isabelle Taylord404ea12018-02-19 17:28:01 +0000101}
102
103void ProbesProducer::OnDisconnect() {
104 PERFETTO_DCHECK(state_ == kConnected || state_ == kConnecting);
Isabelle Taylord404ea12018-02-19 17:28:01 +0000105 PERFETTO_LOG("Disconnected from tracing service");
Primiano Tuccie56411c2018-03-30 01:15:02 +0100106 if (state_ == kConnected)
107 return task_runner_->PostTask([this] { this->Restart(); });
Isabelle Taylord404ea12018-02-19 17:28:01 +0000108
Primiano Tuccie56411c2018-03-30 01:15:02 +0100109 state_ = kNotConnected;
110 IncreaseConnectionBackoff();
Isabelle Taylord404ea12018-02-19 17:28:01 +0000111 task_runner_->PostDelayedTask([this] { this->Connect(); },
112 connection_backoff_ms_);
113}
114
Primiano Tuccie56411c2018-03-30 01:15:02 +0100115void ProbesProducer::Restart() {
116 // We lost the connection with the tracing service. At this point we need
117 // to reset all the data sources. Trying to handle that manually is going to
118 // be error prone. What we do here is simply desroying the instance and
119 // recreating it again.
120 // TODO(hjd): Add e2e test for this.
121
122 base::TaskRunner* task_runner = task_runner_;
123 const char* socket_name = socket_name_;
124
125 // Invoke destructor and then the constructor again.
126 this->~ProbesProducer();
127 new (this) ProbesProducer();
128
129 ConnectWithRetries(socket_name, task_runner);
130}
131
Primiano Tucci674076d2018-10-01 10:41:09 +0100132void ProbesProducer::SetupDataSource(DataSourceInstanceID instance_id,
Primiano Tucciafb72b52018-09-25 09:37:24 +0100133 const DataSourceConfig& config) {
Primiano Tucci674076d2018-10-01 10:41:09 +0100134 PERFETTO_DLOG("SetupDataSource(id=%" PRIu64 ", name=%s)", instance_id,
135 config.name().c_str());
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100136 PERFETTO_DCHECK(data_sources_.count(instance_id) == 0);
Primiano Tucci03de28f2018-08-01 11:29:46 +0100137 TracingSessionID session_id = config.tracing_session_id();
138 PERFETTO_CHECK(session_id > 0);
Hector Dearman0ff07c72018-03-15 09:54:46 +0000139
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100140 std::unique_ptr<ProbesDataSource> data_source;
Hector Dearman0ff07c72018-03-15 09:54:46 +0000141 if (config.name() == kFtraceSourceName) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100142 data_source = CreateFtraceDataSource(session_id, instance_id, config);
Hector Dearman0ff07c72018-03-15 09:54:46 +0000143 } else if (config.name() == kInodeMapSourceName) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100144 data_source = CreateInodeFileDataSource(session_id, instance_id, config);
Hector Dearman0ff07c72018-03-15 09:54:46 +0000145 } else if (config.name() == kProcessStatsSourceName) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100146 data_source = CreateProcessStatsDataSource(session_id, instance_id, config);
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100147 } else if (config.name() == kSysStatsSourceName) {
148 data_source = CreateSysStatsDataSource(session_id, instance_id, config);
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100149 }
150
151 if (!data_source) {
152 PERFETTO_ELOG("Failed to create data source '%s'", config.name().c_str());
Hector Dearman0ff07c72018-03-15 09:54:46 +0000153 return;
154 }
155
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100156 session_data_sources_.emplace(session_id, data_source.get());
157 data_sources_[instance_id] = std::move(data_source);
Primiano Tucci674076d2018-10-01 10:41:09 +0100158}
Hector Dearman0ff07c72018-03-15 09:54:46 +0000159
Primiano Tucci674076d2018-10-01 10:41:09 +0100160void ProbesProducer::StartDataSource(DataSourceInstanceID instance_id,
161 const DataSourceConfig& config) {
162 PERFETTO_DLOG("StartDataSource(id=%" PRIu64 ", name=%s)", instance_id,
163 config.name().c_str());
164 auto it = data_sources_.find(instance_id);
165 if (it == data_sources_.end()) {
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100166 // Can happen if SetupDataSource() failed (e.g. ftrace was busy).
Primiano Tucci674076d2018-10-01 10:41:09 +0100167 PERFETTO_ELOG("Data source id=%" PRIu64 " not found", instance_id);
168 return;
169 }
170 ProbesDataSource* data_source = it->second.get();
171 if (data_source->started)
172 return;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100173 if (config.trace_duration_ms() != 0) {
174 uint32_t timeout = 5000 + 2 * config.trace_duration_ms();
175 watchdogs_.emplace(
176 instance_id, base::Watchdog::GetInstance()->CreateFatalTimer(timeout));
Isabelle Taylord404ea12018-02-19 17:28:01 +0000177 }
Primiano Tucci674076d2018-10-01 10:41:09 +0100178 data_source->started = true;
179 data_source->Start();
Isabelle Taylord404ea12018-02-19 17:28:01 +0000180}
181
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100182std::unique_ptr<ProbesDataSource> ProbesProducer::CreateFtraceDataSource(
Hector Dearman0ff07c72018-03-15 09:54:46 +0000183 TracingSessionID session_id,
Isabelle Taylord404ea12018-02-19 17:28:01 +0000184 DataSourceInstanceID id,
Hector Dearman0ff07c72018-03-15 09:54:46 +0000185 const DataSourceConfig& config) {
Isabelle Taylord404ea12018-02-19 17:28:01 +0000186 // Don't retry if FtraceController::Create() failed once.
187 // This can legitimately happen on user builds where we cannot access the
188 // debug paths, e.g., because of SELinux rules.
189 if (ftrace_creation_failed_)
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100190 return nullptr;
Isabelle Taylord404ea12018-02-19 17:28:01 +0000191
192 // Lazily create on the first instance.
193 if (!ftrace_) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100194 ftrace_ = FtraceController::Create(task_runner_, this);
Isabelle Taylord404ea12018-02-19 17:28:01 +0000195
196 if (!ftrace_) {
197 PERFETTO_ELOG("Failed to create FtraceController");
198 ftrace_creation_failed_ = true;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100199 return nullptr;
Isabelle Taylord404ea12018-02-19 17:28:01 +0000200 }
201
202 ftrace_->DisableAllEvents();
203 ftrace_->ClearTrace();
204 }
205
Primiano Tucci674076d2018-10-01 10:41:09 +0100206 PERFETTO_LOG("Ftrace setup (id=%" PRIu64 ", target_buf=%" PRIu32 ")", id,
Hector Dearman0ff07c72018-03-15 09:54:46 +0000207 config.target_buffer());
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100208 const BufferID buffer_id = static_cast<BufferID>(config.target_buffer());
209 std::unique_ptr<FtraceDataSource> data_source(new FtraceDataSource(
210 ftrace_->GetWeakPtr(), session_id, config.ftrace_config(),
211 endpoint_->CreateTraceWriter(buffer_id)));
212 if (!ftrace_->AddDataSource(data_source.get())) {
213 PERFETTO_ELOG(
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100214 "Failed to setup tracing (too many concurrent sessions or ftrace is "
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100215 "already in use)");
216 return nullptr;
Hector Dearmanee3c49d2018-02-28 14:10:22 +0000217 }
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100218 return std::move(data_source);
Anna Zappone27ac99c2018-03-06 14:25:35 +0000219}
220
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100221std::unique_ptr<ProbesDataSource> ProbesProducer::CreateInodeFileDataSource(
Hector Dearman0ff07c72018-03-15 09:54:46 +0000222 TracingSessionID session_id,
Anna Zappone27ac99c2018-03-06 14:25:35 +0000223 DataSourceInstanceID id,
Primiano Tuccidae35652018-03-29 18:32:02 +0100224 DataSourceConfig source_config) {
Primiano Tucci674076d2018-10-01 10:41:09 +0100225 PERFETTO_LOG("Inode file map setup (id=%" PRIu64 ", target_buf=%" PRIu32 ")",
Anna Zappone27ac99c2018-03-06 14:25:35 +0000226 id, source_config.target_buffer());
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100227 auto buffer_id = static_cast<BufferID>(source_config.target_buffer());
Anna Zappone2a6f9042018-03-14 13:26:07 +0000228 if (system_inodes_.empty())
Hector Dearman7fabd702018-03-28 12:37:15 +0100229 CreateStaticDeviceToInodeMap("/system", &system_inodes_);
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100230 return std::unique_ptr<InodeFileDataSource>(new InodeFileDataSource(
231 std::move(source_config), task_runner_, session_id, &system_inodes_,
232 &cache_, endpoint_->CreateTraceWriter(buffer_id)));
Isabelle Taylord404ea12018-02-19 17:28:01 +0000233}
234
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100235std::unique_ptr<ProbesDataSource> ProbesProducer::CreateProcessStatsDataSource(
Hector Dearman0ff07c72018-03-15 09:54:46 +0000236 TracingSessionID session_id,
Hector Dearman77451692018-03-08 16:21:13 +0000237 DataSourceInstanceID id,
Hector Dearman0ff07c72018-03-15 09:54:46 +0000238 const DataSourceConfig& config) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100239 base::ignore_result(id);
240 auto buffer_id = static_cast<BufferID>(config.target_buffer());
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100241 return std::unique_ptr<ProcessStatsDataSource>(new ProcessStatsDataSource(
242 session_id, endpoint_->CreateTraceWriter(buffer_id), config));
Isabelle Taylord404ea12018-02-19 17:28:01 +0000243}
244
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100245std::unique_ptr<SysStatsDataSource> ProbesProducer::CreateSysStatsDataSource(
246 TracingSessionID session_id,
247 DataSourceInstanceID id,
248 const DataSourceConfig& config) {
249 base::ignore_result(id);
250 auto buffer_id = static_cast<BufferID>(config.target_buffer());
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100251 return std::unique_ptr<SysStatsDataSource>(
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100252 new SysStatsDataSource(task_runner_, session_id,
253 endpoint_->CreateTraceWriter(buffer_id), config));
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100254}
255
Primiano Tucciafb72b52018-09-25 09:37:24 +0100256void ProbesProducer::StopDataSource(DataSourceInstanceID id) {
Isabelle Taylord404ea12018-02-19 17:28:01 +0000257 PERFETTO_LOG("Producer stop (id=%" PRIu64 ")", id);
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100258 auto it = data_sources_.find(id);
259 if (it == data_sources_.end()) {
Primiano Tucci8a0dc5d2018-10-02 12:51:11 +0100260 // Can happen if SetupDataSource() failed (e.g. ftrace was busy).
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100261 PERFETTO_ELOG("Cannot stop data source id=%" PRIu64 ", not found", id);
262 return;
263 }
264 ProbesDataSource* data_source = it->second.get();
265 TracingSessionID session_id = data_source->tracing_session_id;
266 auto range = session_data_sources_.equal_range(session_id);
267 for (auto kv = range.first; kv != range.second; kv++) {
268 if (kv->second != data_source)
269 continue;
270 session_data_sources_.erase(kv);
271 break;
272 }
273 data_sources_.erase(it);
Hector Dearman77451692018-03-08 16:21:13 +0000274 watchdogs_.erase(id);
Isabelle Taylord404ea12018-02-19 17:28:01 +0000275}
276
Primiano Tuccidca727d2018-04-04 11:31:55 +0200277void ProbesProducer::OnTracingSetup() {}
Isabelle Taylor69faa902018-03-21 15:42:03 +0000278
Primiano Tuccid52e6272018-04-06 19:06:53 +0200279void ProbesProducer::Flush(FlushRequestID flush_request_id,
280 const DataSourceInstanceID* data_source_ids,
281 size_t num_data_sources) {
282 for (size_t i = 0; i < num_data_sources; i++) {
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100283 auto it = data_sources_.find(data_source_ids[i]);
Primiano Tucci674076d2018-10-01 10:41:09 +0100284 if (it == data_sources_.end() || !it->second->started)
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100285 continue;
286 it->second->Flush();
Primiano Tuccid52e6272018-04-06 19:06:53 +0200287 }
288 endpoint_->NotifyFlushComplete(flush_request_id);
289}
290
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100291// This function is called by the FtraceController in batches, whenever it has
292// read one or more pages from one or more cpus and written that into the
293// userspace tracing buffer. If more than one ftrace data sources are active,
294// this call typically happens after writing for all session has been handled.
295void ProbesProducer::OnFtraceDataWrittenIntoDataSourceBuffers() {
296 TracingSessionID last_session_id = 0;
297 FtraceMetadata* metadata = nullptr;
298 InodeFileDataSource* inode_data_source = nullptr;
299 ProcessStatsDataSource* ps_data_source = nullptr;
300
301 // unordered_multimap guarantees that entries with the same key are contiguous
302 // in the iteration.
303 for (auto it = session_data_sources_.begin(); /* check below*/; it++) {
Primiano Tucci674076d2018-10-01 10:41:09 +0100304 // If this is the last iteration or the session id has changed,
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100305 // dispatch the metadata update to the linked data sources, if any.
306 if (it == session_data_sources_.end() || it->first != last_session_id) {
307 bool has_inodes = metadata && !metadata->inode_and_device.empty();
308 bool has_pids = metadata && !metadata->pids.empty();
309 if (has_inodes && inode_data_source)
310 inode_data_source->OnInodes(metadata->inode_and_device);
311 if (has_pids && ps_data_source)
312 ps_data_source->OnPids(metadata->pids);
313 if (metadata)
314 metadata->Clear();
315 metadata = nullptr;
316 inode_data_source = nullptr;
317 ps_data_source = nullptr;
318 if (it == session_data_sources_.end())
319 break;
320 last_session_id = it->first;
321 }
322 ProbesDataSource* ds = it->second;
Primiano Tucci674076d2018-10-01 10:41:09 +0100323 if (!ds->started)
324 continue;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100325 switch (ds->type_id) {
326 case FtraceDataSource::kTypeId:
327 metadata = static_cast<FtraceDataSource*>(ds)->mutable_metadata();
328 break;
329 case InodeFileDataSource::kTypeId:
330 inode_data_source = static_cast<InodeFileDataSource*>(ds);
331 break;
332 case ProcessStatsDataSource::kTypeId:
333 ps_data_source = static_cast<ProcessStatsDataSource*>(ds);
334 break;
Primiano Tucci82a8bfd2018-09-19 11:33:04 +0100335 case SysStatsDataSource::kTypeId:
336 break;
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100337 default:
Florian Mayer6db99a92018-10-18 11:34:55 +0100338 PERFETTO_DFATAL("Invalid data source.");
Primiano Tuccifd8240d2018-08-01 09:34:54 +0100339 } // switch (type_id)
340 } // for (session_data_sources_)
341}
342
Isabelle Taylord404ea12018-02-19 17:28:01 +0000343void ProbesProducer::ConnectWithRetries(const char* socket_name,
344 base::TaskRunner* task_runner) {
345 PERFETTO_DCHECK(state_ == kNotStarted);
346 state_ = kNotConnected;
347
348 ResetConnectionBackoff();
349 socket_name_ = socket_name;
350 task_runner_ = task_runner;
351 Connect();
352}
353
354void ProbesProducer::Connect() {
355 PERFETTO_DCHECK(state_ == kNotConnected);
356 state_ = kConnecting;
Isabelle Taylor86262cb2018-03-27 16:00:54 +0100357 endpoint_ = ProducerIPCClient::Connect(
Primiano Tucci578d7842018-03-29 15:27:05 +0100358 socket_name_, this, "perfetto.traced_probes", task_runner_);
Isabelle Taylord404ea12018-02-19 17:28:01 +0000359}
360
361void ProbesProducer::IncreaseConnectionBackoff() {
362 connection_backoff_ms_ *= 2;
363 if (connection_backoff_ms_ > kMaxConnectionBackoffMs)
364 connection_backoff_ms_ = kMaxConnectionBackoffMs;
365}
366
367void ProbesProducer::ResetConnectionBackoff() {
368 connection_backoff_ms_ = kInitialConnectionBackoffMs;
369}
370
Isabelle Taylord404ea12018-02-19 17:28:01 +0000371} // namespace perfetto