blob: 2b7e98c13fdd409363561977aef176bbef0db1c7 [file] [log] [blame]
Bertrand SIMONNET52e5b992015-08-10 15:18:00 -07001/*
2 * Copyright (C) 2015 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
Darin Petkov65b01462010-04-14 13:32:20 -070016
Bertrand SIMONNET4b915ae2015-07-28 15:38:14 -070017#include "metrics_daemon.h"
Darin Petkov65b01462010-04-14 13:32:20 -070018
Steve Funge86591e2014-12-01 13:38:21 -080019#include <sysexits.h>
Luigi Semenzato8accd332011-05-17 16:37:18 -070020#include <time.h>
Darin Petkov65b01462010-04-14 13:32:20 -070021
Bertrand SIMONNET4b915ae2015-07-28 15:38:14 -070022#include <base/bind.h>
Luigi Semenzato859b3f02014-02-05 15:33:19 -080023#include <base/files/file_path.h>
Ben Chan51bf92a2014-09-05 08:21:06 -070024#include <base/files/file_util.h>
Luigi Semenzato859b3f02014-02-05 15:33:19 -080025#include <base/hash.h>
Darin Petkov65b01462010-04-14 13:32:20 -070026#include <base/logging.h>
Ben Chan2e6543d2014-02-05 23:26:25 -080027#include <base/strings/string_number_conversions.h>
28#include <base/strings/string_split.h>
29#include <base/strings/string_util.h>
30#include <base/strings/stringprintf.h>
Bertrand SIMONNET26993622015-08-20 14:08:41 -070031#include <cutils/properties.h>
Steve Funge86591e2014-12-01 13:38:21 -080032#include <dbus/dbus.h>
33#include <dbus/message.h>
Bertrand SIMONNETbae5dcc2015-08-04 14:12:10 -070034
35#include "constants.h"
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -070036#include "uploader/upload_service.h"
Darin Petkov65b01462010-04-14 13:32:20 -070037
Ben Chan2e6543d2014-02-05 23:26:25 -080038using base::FilePath;
39using base::StringPrintf;
Darin Petkovf27f0362010-06-04 13:14:19 -070040using base::Time;
41using base::TimeDelta;
42using base::TimeTicks;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -080043using chromeos_metrics::PersistentInteger;
Bertrand SIMONNET59890e22015-10-02 16:45:18 -070044using com::android::Weave::CommandProxy;
45using com::android::Weave::ManagerProxy;
Luigi Semenzato8accd332011-05-17 16:37:18 -070046using std::map;
Darin Petkov38d5cb02010-06-24 12:10:26 -070047using std::string;
Luigi Semenzato8accd332011-05-17 16:37:18 -070048using std::vector;
49
namespace {

// D-Bus identifiers used to subscribe to crash_reporter's user-crash signal.
constexpr char kCrashReporterInterface[] = "org.chromium.CrashReporter";
constexpr char kCrashReporterUserCrashSignal[] = "UserCrash";
// printf-style template; filled with the interface and the signal name.
constexpr char kCrashReporterMatchRule[] =
    "type='signal',interface='%s',path='/',member='%s'";

// Time unit conversions.
constexpr int kSecondsPerMinute = 60;
constexpr int kMinutesPerHour = 60;
constexpr int kHoursPerDay = 24;
constexpr int kMinutesPerDay = kHoursPerDay * kMinutesPerHour;
constexpr int kSecondsPerDay = kSecondsPerMinute * kMinutesPerDay;
constexpr int kDaysPerWeek = 7;
constexpr int kSecondsPerWeek = kSecondsPerDay * kDaysPerWeek;

// Interval between calls to UpdateStats().
constexpr uint32_t kUpdateStatsIntervalMs = 300000;

// Marker files whose presence indicates that the previous session ended with
// a kernel crash or an unclean shutdown, respectively.
constexpr char kKernelCrashDetectedFile[] = "/var/run/kernel-crash-detected";
constexpr char kUncleanShutdownDetectedFile[] =
    "/var/run/unclean-shutdown-detected";

constexpr int kMetricMeminfoInterval = 30;  // seconds

// procfs files read by the daemon.
constexpr char kMetricsProcStatFileName[] = "/proc/stat";
constexpr char kMeminfoFileName[] = "/proc/meminfo";
constexpr char kVmStatFileName[] = "/proc/vmstat";
// Number of whitespace-separated items expected on the first line of
// /proc/stat.
constexpr int kMetricsProcStatFirstLineItemsCount = 11;

// Thermal CPU throttling.

constexpr char kMetricScaledCpuFrequencyName[] =
    "Platform.CpuFrequencyThermalScaling";

}  // namespace
85
Luigi Semenzato96360192014-06-04 10:53:35 -070086// Zram sysfs entries.
87
88const char MetricsDaemon::kComprDataSizeName[] = "compr_data_size";
89const char MetricsDaemon::kOrigDataSizeName[] = "orig_data_size";
90const char MetricsDaemon::kZeroPagesName[] = "zero_pages";
91
Luigi Semenzato8accd332011-05-17 16:37:18 -070092// Memory use stats collection intervals. We collect some memory use interval
93// at these intervals after boot, and we stop collecting after the last one,
94// with the assumption that in most cases the memory use won't change much
95// after that.
96static const int kMemuseIntervals[] = {
97 1 * kSecondsPerMinute, // 1 minute mark
98 4 * kSecondsPerMinute, // 5 minute mark
99 25 * kSecondsPerMinute, // 0.5 hour mark
100 120 * kSecondsPerMinute, // 2.5 hour mark
101 600 * kSecondsPerMinute, // 12.5 hour mark
102};
103
Darin Petkovf1e85e42010-06-10 15:59:53 -0700104MetricsDaemon::MetricsDaemon()
Steve Funge86591e2014-12-01 13:38:21 -0800105 : memuse_final_time_(0),
Luigi Semenzato8accd332011-05-17 16:37:18 -0700106 memuse_interval_index_(0),
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700107 ticks_per_second_(0),
108 latest_cpu_use_ticks_(0) {}
Darin Petkovf1e85e42010-06-10 15:59:53 -0700109
Ken Mixter4c5daa42010-08-26 18:35:06 -0700110MetricsDaemon::~MetricsDaemon() {
Ken Mixter4c5daa42010-08-26 18:35:06 -0700111}
112
Bertrand SIMONNET7a964052015-09-29 11:07:24 -0700113// static
Luigi Semenzato8accd332011-05-17 16:37:18 -0700114double MetricsDaemon::GetActiveTime() {
115 struct timespec ts;
116 int r = clock_gettime(CLOCK_MONOTONIC, &ts);
117 if (r < 0) {
118 PLOG(WARNING) << "clock_gettime(CLOCK_MONOTONIC) failed";
119 return 0;
120 } else {
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700121 return ts.tv_sec + static_cast<double>(ts.tv_nsec) / (1000 * 1000 * 1000);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700122 }
123}
124
Steve Funge86591e2014-12-01 13:38:21 -0800125int MetricsDaemon::Run() {
Ken Mixterccd84c02010-08-16 19:57:13 -0700126 if (CheckSystemCrash(kKernelCrashDetectedFile)) {
127 ProcessKernelCrash();
128 }
129
130 if (CheckSystemCrash(kUncleanShutdownDetectedFile)) {
131 ProcessUncleanShutdown();
132 }
133
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800134 // On OS version change, clear version stats (which are reported daily).
Ben Chanf05ab402014-08-07 00:54:59 -0700135 int32_t version = GetOsVersionHash();
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800136 if (version_cycle_->Get() != version) {
137 version_cycle_->Set(version);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800138 kernel_crashes_version_count_->Set(0);
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700139 version_cumulative_active_use_->Set(0);
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700140 version_cumulative_cpu_use_->Set(0);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800141 }
142
Alex Vakulenko74dc6242015-10-13 09:23:34 -0700143 return brillo::DBusDaemon::Run();
Darin Petkov65b01462010-04-14 13:32:20 -0700144}
145
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700146void MetricsDaemon::RunUploaderTest() {
Bertrand SIMONNET12531862015-08-31 11:11:57 -0700147 upload_service_.reset(new UploadService(
Bertrand SIMONNET2765d0a2015-09-09 10:38:20 -0700148 new SystemProfileCache(true, metrics_directory_),
Bertrand SIMONNET12531862015-08-31 11:11:57 -0700149 metrics_lib_,
150 server_));
Bertrand SIMONNET2765d0a2015-09-09 10:38:20 -0700151 upload_service_->Init(upload_interval_, metrics_directory_);
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700152 upload_service_->UploadEvent();
153}
154
Ben Chanf05ab402014-08-07 00:54:59 -0700155uint32_t MetricsDaemon::GetOsVersionHash() {
156 static uint32_t cached_version_hash = 0;
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800157 static bool version_hash_is_cached = false;
158 if (version_hash_is_cached)
159 return cached_version_hash;
160 version_hash_is_cached = true;
Bertrand SIMONNET26993622015-08-20 14:08:41 -0700161
162 char version[PROPERTY_VALUE_MAX];
Bertrand SIMONNETbae5dcc2015-08-04 14:12:10 -0700163 // The version might not be set for development devices. In this case, use the
164 // zero version.
Bertrand SIMONNET26993622015-08-20 14:08:41 -0700165 property_get(metrics::kProductVersionProperty, version,
166 metrics::kDefaultVersion);
167
Bertrand SIMONNETbae5dcc2015-08-04 14:12:10 -0700168 cached_version_hash = base::Hash(version);
169 if (testing_) {
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800170 cached_version_hash = 42; // return any plausible value for the hash
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800171 }
172 return cached_version_hash;
173}
174
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700175void MetricsDaemon::Init(bool testing,
176 bool uploader_active,
Bertrand SIMONNETfec4d2c2015-08-05 16:04:14 -0700177 bool dbus_enabled,
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700178 MetricsLibraryInterface* metrics_lib,
Bertrand SIMONNETebbe35c2015-09-08 10:13:35 -0700179 const string& diskstats_path,
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700180 const string& scaling_max_freq_path,
Steve Fung67906c62014-10-06 15:15:30 -0700181 const string& cpuinfo_max_freq_path,
Bertrand SIMONNETcac74e12014-10-09 10:14:13 -0700182 const base::TimeDelta& upload_interval,
Steve Fung67906c62014-10-06 15:15:30 -0700183 const string& server,
Bertrand SIMONNET2765d0a2015-09-09 10:38:20 -0700184 const base::FilePath& metrics_directory) {
Bertrand SIMONNET675a10c2015-08-25 14:11:43 -0700185 CHECK(metrics_lib);
Darin Petkov65b01462010-04-14 13:32:20 -0700186 testing_ = testing;
Steve Funge86591e2014-12-01 13:38:21 -0800187 uploader_active_ = uploader_active;
Bertrand SIMONNETfec4d2c2015-08-05 16:04:14 -0700188 dbus_enabled_ = dbus_enabled;
Bertrand SIMONNET2765d0a2015-09-09 10:38:20 -0700189 metrics_directory_ = metrics_directory;
Darin Petkovfc91b422010-05-12 13:05:45 -0700190 metrics_lib_ = metrics_lib;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700191
Bertrand SIMONNETcac74e12014-10-09 10:14:13 -0700192 upload_interval_ = upload_interval;
Steve Fung67906c62014-10-06 15:15:30 -0700193 server_ = server;
Steve Fung67906c62014-10-06 15:15:30 -0700194
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700195 // Get ticks per second (HZ) on this system.
196 // Sysconf cannot fail, so no sanity checks are needed.
197 ticks_per_second_ = sysconf(_SC_CLK_TCK);
198
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700199 daily_active_use_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700200 new PersistentInteger("Platform.UseTime.PerDay"));
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700201 version_cumulative_active_use_.reset(
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700202 new PersistentInteger("Platform.CumulativeUseTime"));
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700203 version_cumulative_cpu_use_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700204 new PersistentInteger("Platform.CumulativeCpuTime"));
Darin Petkov38d5cb02010-06-24 12:10:26 -0700205
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800206 kernel_crash_interval_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700207 new PersistentInteger("Platform.KernelCrashInterval"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800208 unclean_shutdown_interval_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700209 new PersistentInteger("Platform.UncleanShutdownInterval"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800210 user_crash_interval_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700211 new PersistentInteger("Platform.UserCrashInterval"));
Darin Petkov2ccef012010-05-05 16:06:37 -0700212
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800213 any_crashes_daily_count_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700214 new PersistentInteger("Platform.AnyCrashes.PerDay"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800215 any_crashes_weekly_count_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700216 new PersistentInteger("Platform.AnyCrashes.PerWeek"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800217 user_crashes_daily_count_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700218 new PersistentInteger("Platform.UserCrashes.PerDay"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800219 user_crashes_weekly_count_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700220 new PersistentInteger("Platform.UserCrashes.PerWeek"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800221 kernel_crashes_daily_count_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700222 new PersistentInteger("Platform.KernelCrashes.PerDay"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800223 kernel_crashes_weekly_count_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700224 new PersistentInteger("Platform.KernelCrashes.PerWeek"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800225 kernel_crashes_version_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700226 new PersistentInteger("Platform.KernelCrashesSinceUpdate"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800227 unclean_shutdowns_daily_count_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700228 new PersistentInteger("Platform.UncleanShutdown.PerDay"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800229 unclean_shutdowns_weekly_count_.reset(
Bertrand SIMONNET5066a452015-09-25 15:38:42 -0700230 new PersistentInteger("Platform.UncleanShutdowns.PerWeek"));
Darin Petkov38d5cb02010-06-24 12:10:26 -0700231
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800232 daily_cycle_.reset(new PersistentInteger("daily.cycle"));
233 weekly_cycle_.reset(new PersistentInteger("weekly.cycle"));
234 version_cycle_.reset(new PersistentInteger("version.cycle"));
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800235
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700236 scaling_max_freq_path_ = scaling_max_freq_path;
237 cpuinfo_max_freq_path_ = cpuinfo_max_freq_path;
Bertrand SIMONNET5658dc52015-09-18 13:38:10 -0700238 disk_usage_collector_.reset(new DiskUsageCollector(metrics_lib_));
Bertrand SIMONNET7a964052015-09-29 11:07:24 -0700239 averaged_stats_collector_.reset(
240 new AveragedStatisticsCollector(metrics_lib_, diskstats_path,
241 kVmStatFileName));
Steve Funge86591e2014-12-01 13:38:21 -0800242}
243
244int MetricsDaemon::OnInit() {
Alex Vakulenko74dc6242015-10-13 09:23:34 -0700245 int return_code = dbus_enabled_ ? brillo::DBusDaemon::OnInit() :
246 brillo::Daemon::OnInit();
Steve Funge86591e2014-12-01 13:38:21 -0800247 if (return_code != EX_OK)
248 return return_code;
249
Bertrand SIMONNETebbe35c2015-09-08 10:13:35 -0700250 StatsReporterInit();
251
252 // Start collecting meminfo stats.
253 ScheduleMeminfoCallback(kMetricMeminfoInterval);
254 memuse_final_time_ = GetActiveTime() + kMemuseIntervals[0];
255 ScheduleMemuseCallback(kMemuseIntervals[0]);
256
Steve Funge86591e2014-12-01 13:38:21 -0800257 if (testing_)
258 return EX_OK;
Darin Petkov65b01462010-04-14 13:32:20 -0700259
Bertrand SIMONNETfec4d2c2015-08-05 16:04:14 -0700260 if (dbus_enabled_) {
261 bus_->AssertOnDBusThread();
262 CHECK(bus_->SetUpAsyncOperations());
Darin Petkov65b01462010-04-14 13:32:20 -0700263
Bertrand SIMONNETfec4d2c2015-08-05 16:04:14 -0700264 if (bus_->is_connected()) {
265 const std::string match_rule =
266 base::StringPrintf(kCrashReporterMatchRule,
267 kCrashReporterInterface,
268 kCrashReporterUserCrashSignal);
Darin Petkov65b01462010-04-14 13:32:20 -0700269
Bertrand SIMONNETfec4d2c2015-08-05 16:04:14 -0700270 bus_->AddFilterFunction(&MetricsDaemon::MessageFilter, this);
Darin Petkov65b01462010-04-14 13:32:20 -0700271
Bertrand SIMONNETfec4d2c2015-08-05 16:04:14 -0700272 DBusError error;
273 dbus_error_init(&error);
274 bus_->AddMatch(match_rule, &error);
Darin Petkov65b01462010-04-14 13:32:20 -0700275
Bertrand SIMONNETfec4d2c2015-08-05 16:04:14 -0700276 if (dbus_error_is_set(&error)) {
277 LOG(ERROR) << "Failed to add match rule \"" << match_rule << "\". Got "
278 << error.name << ": " << error.message;
279 return EX_SOFTWARE;
280 }
281 } else {
282 LOG(ERROR) << "DBus isn't connected.";
283 return EX_UNAVAILABLE;
Steve Funge86591e2014-12-01 13:38:21 -0800284 }
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700285
Alex Vakulenko82b02de2015-10-09 20:07:47 -0700286 device_ = weaved::Device::CreateInstance(
287 bus_,
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700288 base::Bind(&MetricsDaemon::UpdateWeaveState, base::Unretained(this)));
Alex Vakulenko82b02de2015-10-09 20:07:47 -0700289 device_->AddCommandHandler(
290 "_metrics._enableAnalyticsReporting",
291 base::Bind(&MetricsDaemon::OnEnableMetrics, base::Unretained(this)));
292 device_->AddCommandHandler(
293 "_metrics._disableAnalyticsReporting",
294 base::Bind(&MetricsDaemon::OnDisableMetrics, base::Unretained(this)));
Darin Petkov703ec972010-04-27 11:02:18 -0700295 }
296
Bertrand SIMONNETebbe35c2015-09-08 10:13:35 -0700297 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
298 base::Bind(&MetricsDaemon::HandleUpdateStatsTimeout,
299 base::Unretained(this)),
300 base::TimeDelta::FromMilliseconds(kUpdateStatsIntervalMs));
301
Steve Funge86591e2014-12-01 13:38:21 -0800302 if (uploader_active_) {
Bertrand SIMONNETbae5dcc2015-08-04 14:12:10 -0700303 upload_service_.reset(
304 new UploadService(new SystemProfileCache(), metrics_lib_, server_));
Bertrand SIMONNET2765d0a2015-09-09 10:38:20 -0700305 upload_service_->Init(upload_interval_, metrics_directory_);
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700306 }
Steve Funge86591e2014-12-01 13:38:21 -0800307
308 return EX_OK;
Darin Petkov65b01462010-04-14 13:32:20 -0700309}
310
Steve Funge86591e2014-12-01 13:38:21 -0800311void MetricsDaemon::OnShutdown(int* return_code) {
Bertrand SIMONNETfec4d2c2015-08-05 16:04:14 -0700312 if (!testing_ && dbus_enabled_ && bus_->is_connected()) {
Steve Funge86591e2014-12-01 13:38:21 -0800313 const std::string match_rule =
314 base::StringPrintf(kCrashReporterMatchRule,
315 kCrashReporterInterface,
316 kCrashReporterUserCrashSignal);
317
318 bus_->RemoveFilterFunction(&MetricsDaemon::MessageFilter, this);
319
320 DBusError error;
321 dbus_error_init(&error);
322 bus_->RemoveMatch(match_rule, &error);
323
324 if (dbus_error_is_set(&error)) {
325 LOG(ERROR) << "Failed to remove match rule \"" << match_rule << "\". Got "
326 << error.name << ": " << error.message;
327 }
328 }
Alex Vakulenko74dc6242015-10-13 09:23:34 -0700329 brillo::DBusDaemon::OnShutdown(return_code);
Darin Petkov65b01462010-04-14 13:32:20 -0700330}
331
Alex Vakulenko82b02de2015-10-09 20:07:47 -0700332void MetricsDaemon::OnEnableMetrics(const std::weak_ptr<weaved::Command>& cmd) {
333 auto command = cmd.lock();
334 if (!command)
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700335 return;
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700336
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700337 if (base::WriteFile(metrics_directory_.Append(metrics::kConsentFileName),
338 "", 0) != 0) {
339 PLOG(ERROR) << "Could not create the consent file.";
Alex Vakulenko35f89632015-10-09 08:18:35 -0700340 command->Abort("metrics_error", "Could not create the consent file",
341 nullptr);
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700342 return;
343 }
344
Alex Vakulenko82b02de2015-10-09 20:07:47 -0700345 UpdateWeaveState();
Alex Vakulenko35f89632015-10-09 08:18:35 -0700346 command->Complete({}, nullptr);
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700347}
348
Alex Vakulenko82b02de2015-10-09 20:07:47 -0700349void MetricsDaemon::OnDisableMetrics(
350 const std::weak_ptr<weaved::Command>& cmd) {
351 auto command = cmd.lock();
352 if (!command)
353 return;
354
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700355 if (!base::DeleteFile(metrics_directory_.Append(metrics::kConsentFileName),
356 false)) {
Alex Vakulenko35f89632015-10-09 08:18:35 -0700357 PLOG(ERROR) << "Could not delete the consent file.";
358 command->Abort("metrics_error", "Could not delete the consent file",
359 nullptr);
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700360 return;
361 }
362
Alex Vakulenko82b02de2015-10-09 20:07:47 -0700363 UpdateWeaveState();
Alex Vakulenko35f89632015-10-09 08:18:35 -0700364 command->Complete({}, nullptr);
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700365}
366
Alex Vakulenko82b02de2015-10-09 20:07:47 -0700367void MetricsDaemon::UpdateWeaveState() {
368 if (!device_)
369 return;
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700370
Alex Vakulenko74dc6242015-10-13 09:23:34 -0700371 brillo::VariantDictionary state_change{
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700372 { "_metrics._AnalyticsReportingState",
373 metrics_lib_->AreMetricsEnabled() ? "enabled" : "disabled" }
374 };
375
Alex Vakulenko82b02de2015-10-09 20:07:47 -0700376 if (!device_->SetStateProperties(state_change, nullptr)) {
Bertrand SIMONNET59890e22015-10-02 16:45:18 -0700377 LOG(ERROR) << "failed to update weave's state";
378 }
379}
380
Darin Petkov703ec972010-04-27 11:02:18 -0700381// static
382DBusHandlerResult MetricsDaemon::MessageFilter(DBusConnection* connection,
383 DBusMessage* message,
384 void* user_data) {
Darin Petkov703ec972010-04-27 11:02:18 -0700385 int message_type = dbus_message_get_type(message);
386 if (message_type != DBUS_MESSAGE_TYPE_SIGNAL) {
Darin Petkov41e06232010-05-03 16:45:37 -0700387 DLOG(WARNING) << "unexpected message type " << message_type;
Darin Petkov703ec972010-04-27 11:02:18 -0700388 return DBUS_HANDLER_RESULT_NOT_YET_HANDLED;
389 }
390
391 // Signal messages always have interfaces.
Daniel Eratc83975a2014-04-04 08:53:44 -0700392 const std::string interface(dbus_message_get_interface(message));
393 const std::string member(dbus_message_get_member(message));
394 DLOG(INFO) << "Got " << interface << "." << member << " D-Bus signal";
Darin Petkov703ec972010-04-27 11:02:18 -0700395
396 MetricsDaemon* daemon = static_cast<MetricsDaemon*>(user_data);
397
398 DBusMessageIter iter;
399 dbus_message_iter_init(message, &iter);
Daniel Eratc83975a2014-04-04 08:53:44 -0700400 if (interface == kCrashReporterInterface) {
401 CHECK_EQ(member, kCrashReporterUserCrashSignal);
Darin Petkov1bb904e2010-06-16 15:58:06 -0700402 daemon->ProcessUserCrash();
Darin Petkov703ec972010-04-27 11:02:18 -0700403 } else {
Daniel Eratc83975a2014-04-04 08:53:44 -0700404 // Ignore messages from the bus itself.
Darin Petkov703ec972010-04-27 11:02:18 -0700405 return DBUS_HANDLER_RESULT_NOT_YET_HANDLED;
406 }
407
408 return DBUS_HANDLER_RESULT_HANDLED;
Darin Petkov65b01462010-04-14 13:32:20 -0700409}
410
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700411// One might argue that parts of this should go into
412// chromium/src/base/sys_info_chromeos.c instead, but put it here for now.
413
414TimeDelta MetricsDaemon::GetIncrementalCpuUse() {
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700415 FilePath proc_stat_path = FilePath(kMetricsProcStatFileName);
416 std::string proc_stat_string;
417 if (!base::ReadFileToString(proc_stat_path, &proc_stat_string)) {
418 LOG(WARNING) << "cannot open " << kMetricsProcStatFileName;
419 return TimeDelta();
420 }
421
422 std::vector<std::string> proc_stat_lines;
423 base::SplitString(proc_stat_string, '\n', &proc_stat_lines);
424 if (proc_stat_lines.empty()) {
425 LOG(WARNING) << "cannot parse " << kMetricsProcStatFileName
426 << ": " << proc_stat_string;
427 return TimeDelta();
428 }
429 std::vector<std::string> proc_stat_totals;
430 base::SplitStringAlongWhitespace(proc_stat_lines[0], &proc_stat_totals);
431
Ben Chanf05ab402014-08-07 00:54:59 -0700432 uint64_t user_ticks, user_nice_ticks, system_ticks;
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700433 if (proc_stat_totals.size() != kMetricsProcStatFirstLineItemsCount ||
434 proc_stat_totals[0] != "cpu" ||
435 !base::StringToUint64(proc_stat_totals[1], &user_ticks) ||
436 !base::StringToUint64(proc_stat_totals[2], &user_nice_ticks) ||
437 !base::StringToUint64(proc_stat_totals[3], &system_ticks)) {
438 LOG(WARNING) << "cannot parse first line: " << proc_stat_lines[0];
439 return TimeDelta(base::TimeDelta::FromSeconds(0));
440 }
441
Ben Chanf05ab402014-08-07 00:54:59 -0700442 uint64_t total_cpu_use_ticks = user_ticks + user_nice_ticks + system_ticks;
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700443
444 // Sanity check.
445 if (total_cpu_use_ticks < latest_cpu_use_ticks_) {
446 LOG(WARNING) << "CPU time decreasing from " << latest_cpu_use_ticks_
447 << " to " << total_cpu_use_ticks;
448 return TimeDelta();
449 }
450
Ben Chanf05ab402014-08-07 00:54:59 -0700451 uint64_t diff = total_cpu_use_ticks - latest_cpu_use_ticks_;
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700452 latest_cpu_use_ticks_ = total_cpu_use_ticks;
453 // Use microseconds to avoid significant truncations.
454 return base::TimeDelta::FromMicroseconds(
455 diff * 1000 * 1000 / ticks_per_second_);
456}
457
Darin Petkov1bb904e2010-06-16 15:58:06 -0700458void MetricsDaemon::ProcessUserCrash() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700459 // Counts the active time up to now.
460 UpdateStats(TimeTicks::Now(), Time::Now());
Darin Petkov1bb904e2010-06-16 15:58:06 -0700461
462 // Reports the active use time since the last crash and resets it.
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700463 SendAndResetCrashIntervalSample(user_crash_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700464
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800465 any_crashes_daily_count_->Add(1);
466 any_crashes_weekly_count_->Add(1);
467 user_crashes_daily_count_->Add(1);
468 user_crashes_weekly_count_->Add(1);
Darin Petkov1bb904e2010-06-16 15:58:06 -0700469}
470
Darin Petkov38d5cb02010-06-24 12:10:26 -0700471void MetricsDaemon::ProcessKernelCrash() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700472 // Counts the active time up to now.
473 UpdateStats(TimeTicks::Now(), Time::Now());
Darin Petkov38d5cb02010-06-24 12:10:26 -0700474
475 // Reports the active use time since the last crash and resets it.
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700476 SendAndResetCrashIntervalSample(kernel_crash_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700477
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800478 any_crashes_daily_count_->Add(1);
479 any_crashes_weekly_count_->Add(1);
480 kernel_crashes_daily_count_->Add(1);
481 kernel_crashes_weekly_count_->Add(1);
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800482
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800483 kernel_crashes_version_count_->Add(1);
Darin Petkov38d5cb02010-06-24 12:10:26 -0700484}
485
Ken Mixterccd84c02010-08-16 19:57:13 -0700486void MetricsDaemon::ProcessUncleanShutdown() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700487 // Counts the active time up to now.
488 UpdateStats(TimeTicks::Now(), Time::Now());
Ken Mixterccd84c02010-08-16 19:57:13 -0700489
490 // Reports the active use time since the last crash and resets it.
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700491 SendAndResetCrashIntervalSample(unclean_shutdown_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700492
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800493 unclean_shutdowns_daily_count_->Add(1);
494 unclean_shutdowns_weekly_count_->Add(1);
495 any_crashes_daily_count_->Add(1);
496 any_crashes_weekly_count_->Add(1);
Ken Mixterccd84c02010-08-16 19:57:13 -0700497}
498
Luigi Semenzato8accd332011-05-17 16:37:18 -0700499bool MetricsDaemon::CheckSystemCrash(const string& crash_file) {
Darin Petkov38d5cb02010-06-24 12:10:26 -0700500 FilePath crash_detected(crash_file);
Ben Chan2e6543d2014-02-05 23:26:25 -0800501 if (!base::PathExists(crash_detected))
Ken Mixterccd84c02010-08-16 19:57:13 -0700502 return false;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700503
504 // Deletes the crash-detected file so that the daemon doesn't report
505 // another kernel crash in case it's restarted.
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800506 base::DeleteFile(crash_detected, false); // not recursive
Ken Mixterccd84c02010-08-16 19:57:13 -0700507 return true;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700508}
509
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700510void MetricsDaemon::StatsReporterInit() {
Bertrand SIMONNET5658dc52015-09-18 13:38:10 -0700511 disk_usage_collector_->Schedule();
Bertrand SIMONNET7a964052015-09-29 11:07:24 -0700512
513 // Don't start a collection cycle during the first run to avoid delaying the
514 // boot.
515 averaged_stats_collector_->ScheduleWait();
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800516}
517
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800518
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700519bool MetricsDaemon::ReadFreqToInt(const string& sysfs_file_name, int* value) {
Luigi Semenzatod92d18c2013-06-04 13:24:21 -0700520 const FilePath sysfs_path(sysfs_file_name);
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700521 string value_string;
Ben Chan2e6543d2014-02-05 23:26:25 -0800522 if (!base::ReadFileToString(sysfs_path, &value_string)) {
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700523 LOG(WARNING) << "cannot read " << sysfs_path.value().c_str();
524 return false;
525 }
Ben Chan2e6543d2014-02-05 23:26:25 -0800526 if (!base::RemoveChars(value_string, "\n", &value_string)) {
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700527 LOG(WARNING) << "no newline in " << value_string;
528 // Continue even though the lack of newline is suspicious.
529 }
530 if (!base::StringToInt(value_string, value)) {
531 LOG(WARNING) << "cannot convert " << value_string << " to int";
532 return false;
533 }
534 return true;
535}
536
537void MetricsDaemon::SendCpuThrottleMetrics() {
538 // |max_freq| is 0 only the first time through.
539 static int max_freq = 0;
540 if (max_freq == -1)
541 // Give up, as sysfs did not report max_freq correctly.
542 return;
543 if (max_freq == 0 || testing_) {
544 // One-time initialization of max_freq. (Every time when testing.)
545 if (!ReadFreqToInt(cpuinfo_max_freq_path_, &max_freq)) {
546 max_freq = -1;
547 return;
548 }
549 if (max_freq == 0) {
550 LOG(WARNING) << "sysfs reports 0 max CPU frequency\n";
551 max_freq = -1;
552 return;
553 }
554 if (max_freq % 10000 == 1000) {
555 // Special case: system has turbo mode, and max non-turbo frequency is
556 // max_freq - 1000. This relies on "normal" (non-turbo) frequencies
557 // being multiples of (at least) 10 MHz. Although there is no guarantee
558 // of this, it seems a fairly reasonable assumption. Otherwise we should
559 // read scaling_available_frequencies, sort the frequencies, compare the
560 // two highest ones, and check if they differ by 1000 (kHz) (and that's a
561 // hack too, no telling when it will change).
562 max_freq -= 1000;
563 }
564 }
565 int scaled_freq = 0;
566 if (!ReadFreqToInt(scaling_max_freq_path_, &scaled_freq))
567 return;
568 // Frequencies are in kHz. If scaled_freq > max_freq, turbo is on, but
569 // scaled_freq is not the actual turbo frequency. We indicate this situation
570 // with a 101% value.
571 int percent = scaled_freq > max_freq ? 101 : scaled_freq / (max_freq / 100);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800572 SendLinearSample(kMetricScaledCpuFrequencyName, percent, 101, 102);
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700573}
574
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700575void MetricsDaemon::ScheduleMeminfoCallback(int wait) {
576 if (testing_) {
577 return;
578 }
Steve Funge86591e2014-12-01 13:38:21 -0800579 base::TimeDelta waitDelta = base::TimeDelta::FromSeconds(wait);
580 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
581 base::Bind(&MetricsDaemon::MeminfoCallback, base::Unretained(this),
Steve Fung8ab89c52015-01-05 13:48:30 -0800582 waitDelta),
Steve Funge86591e2014-12-01 13:38:21 -0800583 waitDelta);
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700584}
585
Steve Funge86591e2014-12-01 13:38:21 -0800586void MetricsDaemon::MeminfoCallback(base::TimeDelta wait) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700587 string meminfo_raw;
Bertrand SIMONNET675a10c2015-08-25 14:11:43 -0700588 const FilePath meminfo_path(kMeminfoFileName);
Ben Chan2e6543d2014-02-05 23:26:25 -0800589 if (!base::ReadFileToString(meminfo_path, &meminfo_raw)) {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700590 LOG(WARNING) << "cannot read " << meminfo_path.value().c_str();
Steve Funge86591e2014-12-01 13:38:21 -0800591 return;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700592 }
Luigi Semenzato96360192014-06-04 10:53:35 -0700593 // Make both calls even if the first one fails.
Bertrand SIMONNETebbe35c2015-09-08 10:13:35 -0700594 if (ProcessMeminfo(meminfo_raw)) {
Steve Funge86591e2014-12-01 13:38:21 -0800595 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
596 base::Bind(&MetricsDaemon::MeminfoCallback, base::Unretained(this),
Steve Fung8ab89c52015-01-05 13:48:30 -0800597 wait),
Steve Funge86591e2014-12-01 13:38:21 -0800598 wait);
599 }
Luigi Semenzato96360192014-06-04 10:53:35 -0700600}
601
602// static
603bool MetricsDaemon::ReadFileToUint64(const base::FilePath& path,
Ben Chanf05ab402014-08-07 00:54:59 -0700604 uint64_t* value) {
Luigi Semenzato96360192014-06-04 10:53:35 -0700605 std::string content;
606 if (!base::ReadFileToString(path, &content)) {
607 PLOG(WARNING) << "cannot read " << path.MaybeAsASCII();
608 return false;
609 }
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700610 // Remove final newline.
611 base::TrimWhitespaceASCII(content, base::TRIM_TRAILING, &content);
Luigi Semenzato96360192014-06-04 10:53:35 -0700612 if (!base::StringToUint64(content, value)) {
613 LOG(WARNING) << "invalid integer: " << content;
614 return false;
615 }
616 return true;
617}
618
619bool MetricsDaemon::ReportZram(const base::FilePath& zram_dir) {
620 // Data sizes are in bytes. |zero_pages| is in number of pages.
Ben Chanf05ab402014-08-07 00:54:59 -0700621 uint64_t compr_data_size, orig_data_size, zero_pages;
Luigi Semenzato96360192014-06-04 10:53:35 -0700622 const size_t page_size = 4096;
623
624 if (!ReadFileToUint64(zram_dir.Append(kComprDataSizeName),
625 &compr_data_size) ||
626 !ReadFileToUint64(zram_dir.Append(kOrigDataSizeName), &orig_data_size) ||
627 !ReadFileToUint64(zram_dir.Append(kZeroPagesName), &zero_pages)) {
628 return false;
629 }
630
631 // |orig_data_size| does not include zero-filled pages.
632 orig_data_size += zero_pages * page_size;
633
634 const int compr_data_size_mb = compr_data_size >> 20;
635 const int savings_mb = (orig_data_size - compr_data_size) >> 20;
636 const int zero_ratio_percent = zero_pages * page_size * 100 / orig_data_size;
637
638 // Report compressed size in megabytes. 100 MB or less has little impact.
639 SendSample("Platform.ZramCompressedSize", compr_data_size_mb, 100, 4000, 50);
640 SendSample("Platform.ZramSavings", savings_mb, 100, 4000, 50);
641 // The compression ratio is multiplied by 100 for better resolution. The
642 // ratios of interest are between 1 and 6 (100% and 600% as reported). We
643 // don't want samples when very little memory is being compressed.
644 if (compr_data_size_mb >= 1) {
645 SendSample("Platform.ZramCompressionRatioPercent",
646 orig_data_size * 100 / compr_data_size, 100, 600, 50);
647 }
648 // The values of interest for zero_pages are between 1MB and 1GB. The units
649 // are number of pages.
650 SendSample("Platform.ZramZeroPages", zero_pages, 256, 256 * 1024, 50);
651 SendSample("Platform.ZramZeroRatioPercent", zero_ratio_percent, 1, 50, 50);
652
653 return true;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700654}
655
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700656bool MetricsDaemon::ProcessMeminfo(const string& meminfo_raw) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700657 static const MeminfoRecord fields_array[] = {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700658 { "MemTotal", "MemTotal" }, // SPECIAL CASE: total system memory
659 { "MemFree", "MemFree" },
660 { "Buffers", "Buffers" },
661 { "Cached", "Cached" },
662 // { "SwapCached", "SwapCached" },
663 { "Active", "Active" },
664 { "Inactive", "Inactive" },
665 { "ActiveAnon", "Active(anon)" },
666 { "InactiveAnon", "Inactive(anon)" },
667 { "ActiveFile" , "Active(file)" },
668 { "InactiveFile", "Inactive(file)" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800669 { "Unevictable", "Unevictable", kMeminfoOp_HistLog },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700670 // { "Mlocked", "Mlocked" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800671 { "SwapTotal", "SwapTotal", kMeminfoOp_SwapTotal },
672 { "SwapFree", "SwapFree", kMeminfoOp_SwapFree },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700673 // { "Dirty", "Dirty" },
674 // { "Writeback", "Writeback" },
675 { "AnonPages", "AnonPages" },
676 { "Mapped", "Mapped" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800677 { "Shmem", "Shmem", kMeminfoOp_HistLog },
678 { "Slab", "Slab", kMeminfoOp_HistLog },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700679 // { "SReclaimable", "SReclaimable" },
680 // { "SUnreclaim", "SUnreclaim" },
681 };
Luigi Semenzato8accd332011-05-17 16:37:18 -0700682 vector<MeminfoRecord> fields(fields_array,
683 fields_array + arraysize(fields_array));
684 if (!FillMeminfo(meminfo_raw, &fields)) {
685 return false;
686 }
687 int total_memory = fields[0].value;
688 if (total_memory == 0) {
689 // this "cannot happen"
690 LOG(WARNING) << "borked meminfo parser";
691 return false;
692 }
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800693 int swap_total = 0;
694 int swap_free = 0;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700695 // Send all fields retrieved, except total memory.
696 for (unsigned int i = 1; i < fields.size(); i++) {
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800697 string metrics_name = base::StringPrintf("Platform.Meminfo%s",
698 fields[i].name);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800699 int percent;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800700 switch (fields[i].op) {
701 case kMeminfoOp_HistPercent:
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800702 // report value as percent of total memory
703 percent = fields[i].value * 100 / total_memory;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800704 SendLinearSample(metrics_name, percent, 100, 101);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800705 break;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800706 case kMeminfoOp_HistLog:
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800707 // report value in kbytes, log scale, 4Gb max
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800708 SendSample(metrics_name, fields[i].value, 1, 4 * 1000 * 1000, 100);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800709 break;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800710 case kMeminfoOp_SwapTotal:
711 swap_total = fields[i].value;
712 case kMeminfoOp_SwapFree:
713 swap_free = fields[i].value;
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800714 break;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700715 }
716 }
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800717 if (swap_total > 0) {
718 int swap_used = swap_total - swap_free;
719 int swap_used_percent = swap_used * 100 / swap_total;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800720 SendSample("Platform.MeminfoSwapUsed", swap_used, 1, 8 * 1000 * 1000, 100);
Bertrand SIMONNET008fb7e2015-09-21 16:48:01 -0700721 SendLinearSample("Platform.MeminfoSwapUsed.Percent", swap_used_percent,
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800722 100, 101);
723 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700724 return true;
725}
726
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700727bool MetricsDaemon::FillMeminfo(const string& meminfo_raw,
728 vector<MeminfoRecord>* fields) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700729 vector<string> lines;
730 unsigned int nlines = Tokenize(meminfo_raw, "\n", &lines);
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700731
732 // Scan meminfo output and collect field values. Each field name has to
733 // match a meminfo entry (case insensitive) after removing non-alpha
734 // characters from the entry.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700735 unsigned int ifield = 0;
736 for (unsigned int iline = 0;
737 iline < nlines && ifield < fields->size();
738 iline++) {
739 vector<string> tokens;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700740 Tokenize(lines[iline], ": ", &tokens);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700741 if (strcmp((*fields)[ifield].match, tokens[0].c_str()) == 0) {
742 // Name matches. Parse value and save.
Bertrand SIMONNET675a10c2015-08-25 14:11:43 -0700743 if (!base::StringToInt(tokens[1], &(*fields)[ifield].value)) {
744 LOG(WARNING) << "Cound not convert " << tokens[1] << " to int";
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700745 return false;
746 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700747 ifield++;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700748 }
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700749 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700750 if (ifield < fields->size()) {
751 // End of input reached while scanning.
752 LOG(WARNING) << "cannot find field " << (*fields)[ifield].match
753 << " and following";
754 return false;
755 }
756 return true;
757}
758
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800759void MetricsDaemon::ScheduleMemuseCallback(double interval) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700760 if (testing_) {
761 return;
762 }
Steve Funge86591e2014-12-01 13:38:21 -0800763 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
764 base::Bind(&MetricsDaemon::MemuseCallback, base::Unretained(this)),
765 base::TimeDelta::FromSeconds(interval));
Luigi Semenzato8accd332011-05-17 16:37:18 -0700766}
767
768void MetricsDaemon::MemuseCallback() {
769 // Since we only care about active time (i.e. uptime minus sleep time) but
770 // the callbacks are driven by real time (uptime), we check if we should
771 // reschedule this callback due to intervening sleep periods.
772 double now = GetActiveTime();
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800773 // Avoid intervals of less than one second.
774 double remaining_time = ceil(memuse_final_time_ - now);
775 if (remaining_time > 0) {
776 ScheduleMemuseCallback(remaining_time);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700777 } else {
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800778 // Report stats and advance the measurement interval unless there are
779 // errors or we've completed the last interval.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700780 if (MemuseCallbackWork() &&
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800781 memuse_interval_index_ < arraysize(kMemuseIntervals)) {
782 double interval = kMemuseIntervals[memuse_interval_index_++];
783 memuse_final_time_ = now + interval;
784 ScheduleMemuseCallback(interval);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700785 }
786 }
787}
788
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700789bool MetricsDaemon::MemuseCallbackWork() {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700790 string meminfo_raw;
Bertrand SIMONNET675a10c2015-08-25 14:11:43 -0700791 const FilePath meminfo_path(kMeminfoFileName);
Ben Chan2e6543d2014-02-05 23:26:25 -0800792 if (!base::ReadFileToString(meminfo_path, &meminfo_raw)) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700793 LOG(WARNING) << "cannot read " << meminfo_path.value().c_str();
794 return false;
795 }
796 return ProcessMemuse(meminfo_raw);
797}
798
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700799bool MetricsDaemon::ProcessMemuse(const string& meminfo_raw) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700800 static const MeminfoRecord fields_array[] = {
801 { "MemTotal", "MemTotal" }, // SPECIAL CASE: total system memory
802 { "ActiveAnon", "Active(anon)" },
803 { "InactiveAnon", "Inactive(anon)" },
804 };
805 vector<MeminfoRecord> fields(fields_array,
806 fields_array + arraysize(fields_array));
807 if (!FillMeminfo(meminfo_raw, &fields)) {
808 return false;
809 }
810 int total = fields[0].value;
811 int active_anon = fields[1].value;
812 int inactive_anon = fields[2].value;
813 if (total == 0) {
814 // this "cannot happen"
815 LOG(WARNING) << "borked meminfo parser";
816 return false;
817 }
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800818 string metrics_name = base::StringPrintf("Platform.MemuseAnon%d",
819 memuse_interval_index_);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800820 SendLinearSample(metrics_name, (active_anon + inactive_anon) * 100 / total,
Luigi Semenzato8accd332011-05-17 16:37:18 -0700821 100, 101);
822 return true;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700823}
824
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800825void MetricsDaemon::SendSample(const string& name, int sample,
Darin Petkov11b8eb32010-05-18 11:00:59 -0700826 int min, int max, int nbuckets) {
Darin Petkovfc91b422010-05-12 13:05:45 -0700827 metrics_lib_->SendToUMA(name, sample, min, max, nbuckets);
Darin Petkov65b01462010-04-14 13:32:20 -0700828}
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700829
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700830void MetricsDaemon::SendKernelCrashesCumulativeCountStats() {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800831 // Report the number of crashes for this OS version, but don't clear the
832 // counter. It is cleared elsewhere on version change.
Ben Chanf05ab402014-08-07 00:54:59 -0700833 int64_t crashes_count = kernel_crashes_version_count_->Get();
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800834 SendSample(kernel_crashes_version_count_->Name(),
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700835 crashes_count,
836 1, // value of first bucket
837 500, // value of last bucket
838 100); // number of buckets
839
840
Ben Chanf05ab402014-08-07 00:54:59 -0700841 int64_t cpu_use_ms = version_cumulative_cpu_use_->Get();
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700842 SendSample(version_cumulative_cpu_use_->Name(),
843 cpu_use_ms / 1000, // stat is in seconds
844 1, // device may be used very little...
845 8 * 1000 * 1000, // ... or a lot (a little over 90 days)
846 100);
847
848 // On the first run after an autoupdate, cpu_use_ms and active_use_seconds
849 // can be zero. Avoid division by zero.
850 if (cpu_use_ms > 0) {
851 // Send the crash frequency since update in number of crashes per CPU year.
852 SendSample("Logging.KernelCrashesPerCpuYear",
853 crashes_count * kSecondsPerDay * 365 * 1000 / cpu_use_ms,
854 1,
855 1000 * 1000, // about one crash every 30s of CPU time
856 100);
857 }
858
Ben Chanf05ab402014-08-07 00:54:59 -0700859 int64_t active_use_seconds = version_cumulative_active_use_->Get();
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700860 if (active_use_seconds > 0) {
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700861 SendSample(version_cumulative_active_use_->Name(),
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700862 active_use_seconds,
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700863 1, // device may be used very little...
864 8 * 1000 * 1000, // ... or a lot (about 90 days)
865 100);
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700866 // Same as above, but per year of active time.
867 SendSample("Logging.KernelCrashesPerActiveYear",
868 crashes_count * kSecondsPerDay * 365 / active_use_seconds,
869 1,
870 1000 * 1000, // about one crash every 30s of active time
871 100);
872 }
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800873}
874
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700875void MetricsDaemon::SendAndResetDailyUseSample(
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700876 const scoped_ptr<PersistentInteger>& use) {
877 SendSample(use->Name(),
878 use->GetAndClear(),
879 1, // value of first bucket
880 kSecondsPerDay, // value of last bucket
881 50); // number of buckets
882}
883
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700884void MetricsDaemon::SendAndResetCrashIntervalSample(
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800885 const scoped_ptr<PersistentInteger>& interval) {
886 SendSample(interval->Name(),
887 interval->GetAndClear(),
888 1, // value of first bucket
889 4 * kSecondsPerWeek, // value of last bucket
890 50); // number of buckets
891}
892
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700893void MetricsDaemon::SendAndResetCrashFrequencySample(
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800894 const scoped_ptr<PersistentInteger>& frequency) {
895 SendSample(frequency->Name(),
896 frequency->GetAndClear(),
897 1, // value of first bucket
898 100, // value of last bucket
899 50); // number of buckets
900}
901
902void MetricsDaemon::SendLinearSample(const string& name, int sample,
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700903 int max, int nbuckets) {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700904 // TODO(semenzato): add a proper linear histogram to the Chrome external
905 // metrics API.
906 LOG_IF(FATAL, nbuckets != max + 1) << "unsupported histogram scale";
907 metrics_lib_->SendEnumToUMA(name, sample, max);
908}
Daniel Eratc83975a2014-04-04 08:53:44 -0700909
910void MetricsDaemon::UpdateStats(TimeTicks now_ticks,
911 Time now_wall_time) {
912 const int elapsed_seconds = (now_ticks - last_update_stats_time_).InSeconds();
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700913 daily_active_use_->Add(elapsed_seconds);
914 version_cumulative_active_use_->Add(elapsed_seconds);
Daniel Eratc83975a2014-04-04 08:53:44 -0700915 user_crash_interval_->Add(elapsed_seconds);
916 kernel_crash_interval_->Add(elapsed_seconds);
917 version_cumulative_cpu_use_->Add(GetIncrementalCpuUse().InMilliseconds());
918 last_update_stats_time_ = now_ticks;
919
920 const TimeDelta since_epoch = now_wall_time - Time::UnixEpoch();
921 const int day = since_epoch.InDays();
922 const int week = day / 7;
923
924 if (daily_cycle_->Get() != day) {
925 daily_cycle_->Set(day);
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700926 SendAndResetDailyUseSample(daily_active_use_);
927 SendAndResetCrashFrequencySample(any_crashes_daily_count_);
928 SendAndResetCrashFrequencySample(user_crashes_daily_count_);
929 SendAndResetCrashFrequencySample(kernel_crashes_daily_count_);
930 SendAndResetCrashFrequencySample(unclean_shutdowns_daily_count_);
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700931 SendKernelCrashesCumulativeCountStats();
Daniel Eratc83975a2014-04-04 08:53:44 -0700932 }
933
934 if (weekly_cycle_->Get() != week) {
935 weekly_cycle_->Set(week);
Bertrand SIMONNET2d037832015-09-16 17:11:51 -0700936 SendAndResetCrashFrequencySample(any_crashes_weekly_count_);
937 SendAndResetCrashFrequencySample(user_crashes_weekly_count_);
938 SendAndResetCrashFrequencySample(kernel_crashes_weekly_count_);
939 SendAndResetCrashFrequencySample(unclean_shutdowns_weekly_count_);
Daniel Eratc83975a2014-04-04 08:53:44 -0700940 }
941}
942
Steve Funge86591e2014-12-01 13:38:21 -0800943void MetricsDaemon::HandleUpdateStatsTimeout() {
944 UpdateStats(TimeTicks::Now(), Time::Now());
945 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
946 base::Bind(&MetricsDaemon::HandleUpdateStatsTimeout,
947 base::Unretained(this)),
948 base::TimeDelta::FromMilliseconds(kUpdateStatsIntervalMs));
Daniel Eratc83975a2014-04-04 08:53:44 -0700949}