blob: e8f0c6c19bdafeb71a318defe4acdf148ef84ce0 [file] [log] [blame]
Darin Petkov8032dd02011-05-09 16:33:19 -07001// Copyright (c) 2011 The Chromium OS Authors. All rights reserved.
Darin Petkov65b01462010-04-14 13:32:20 -07002// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
Luigi Semenzato4a6c9422014-06-30 18:12:28 -07005// For PRIu64 in inttypes.h, used by scanf. TODO(semenzato): replace
6// with libchromeos methods.
7#define __STDC_FORMAT_MACROS
8
9#include "metrics/metrics_daemon.h"
Darin Petkov65b01462010-04-14 13:32:20 -070010
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080011#include <fcntl.h>
Luigi Semenzato4a6c9422014-06-30 18:12:28 -070012#include <inttypes.h>
Luigi Semenzato8accd332011-05-17 16:37:18 -070013#include <math.h>
Ken Mixter4c5daa42010-08-26 18:35:06 -070014#include <string.h>
Luigi Semenzato8accd332011-05-17 16:37:18 -070015#include <time.h>
Darin Petkov65b01462010-04-14 13:32:20 -070016
Luigi Semenzato859b3f02014-02-05 15:33:19 -080017#include <base/at_exit.h>
Darin Petkov38d5cb02010-06-24 12:10:26 -070018#include <base/file_util.h>
Luigi Semenzato859b3f02014-02-05 15:33:19 -080019#include <base/files/file_path.h>
20#include <base/hash.h>
Darin Petkov65b01462010-04-14 13:32:20 -070021#include <base/logging.h>
Ben Chan2e6543d2014-02-05 23:26:25 -080022#include <base/strings/string_number_conversions.h>
23#include <base/strings/string_split.h>
24#include <base/strings/string_util.h>
25#include <base/strings/stringprintf.h>
Luigi Semenzato859b3f02014-02-05 15:33:19 -080026#include <base/sys_info.h>
Darin Petkov40f25732013-04-29 15:07:31 +020027#include <chromeos/dbus/service_constants.h>
Ken Mixter4c5daa42010-08-26 18:35:06 -070028#include <dbus/dbus-glib-lowlevel.h>
Darin Petkov65b01462010-04-14 13:32:20 -070029
Ben Chan2e6543d2014-02-05 23:26:25 -080030using base::FilePath;
31using base::StringPrintf;
Darin Petkovf27f0362010-06-04 13:14:19 -070032using base::Time;
33using base::TimeDelta;
34using base::TimeTicks;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -080035using chromeos_metrics::PersistentInteger;
Luigi Semenzato8accd332011-05-17 16:37:18 -070036using std::map;
Darin Petkov38d5cb02010-06-24 12:10:26 -070037using std::string;
Luigi Semenzato8accd332011-05-17 16:37:18 -070038using std::vector;
39
Daniel Eratc83975a2014-04-04 08:53:44 -070040namespace {
Darin Petkovf27f0362010-06-04 13:14:19 -070041
Darin Petkov703ec972010-04-27 11:02:18 -070042#define SAFE_MESSAGE(e) (e.message ? e.message : "unknown error")
Darin Petkov40f25732013-04-29 15:07:31 +020043
Daniel Eratc83975a2014-04-04 08:53:44 -070044const char kCrashReporterInterface[] = "org.chromium.CrashReporter";
45const char kCrashReporterUserCrashSignal[] = "UserCrash";
Darin Petkov41e06232010-05-03 16:45:37 -070046
Daniel Eratc83975a2014-04-04 08:53:44 -070047const int kSecondsPerMinute = 60;
48const int kMinutesPerHour = 60;
49const int kHoursPerDay = 24;
50const int kMinutesPerDay = kHoursPerDay * kMinutesPerHour;
51const int kSecondsPerDay = kSecondsPerMinute * kMinutesPerDay;
52const int kDaysPerWeek = 7;
53const int kSecondsPerWeek = kSecondsPerDay * kDaysPerWeek;
Darin Petkov41e06232010-05-03 16:45:37 -070054
Daniel Eratc83975a2014-04-04 08:53:44 -070055// Interval between calls to UpdateStats().
56const guint kUpdateStatsIntervalMs = 300000;
Darin Petkov65b01462010-04-14 13:32:20 -070057
Luigi Semenzatoc5a92342014-02-14 15:05:51 -080058const char kKernelCrashDetectedFile[] = "/var/run/kernel-crash-detected";
Daniel Eratc83975a2014-04-04 08:53:44 -070059const char kUncleanShutdownDetectedFile[] =
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -080060 "/var/run/unclean-shutdown-detected";
Ken Mixterccd84c02010-08-16 19:57:13 -070061
Daniel Eratc83975a2014-04-04 08:53:44 -070062} // namespace
63
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080064// disk stats metrics
65
66// The {Read,Write}Sectors numbers are in sectors/second.
67// A sector is usually 512 bytes.
68
69const char MetricsDaemon::kMetricReadSectorsLongName[] =
70 "Platform.ReadSectorsLong";
71const char MetricsDaemon::kMetricWriteSectorsLongName[] =
72 "Platform.WriteSectorsLong";
73const char MetricsDaemon::kMetricReadSectorsShortName[] =
74 "Platform.ReadSectorsShort";
75const char MetricsDaemon::kMetricWriteSectorsShortName[] =
76 "Platform.WriteSectorsShort";
77
Luigi Semenzato5bd764f2011-10-14 12:03:35 -070078const int MetricsDaemon::kMetricStatsShortInterval = 1; // seconds
79const int MetricsDaemon::kMetricStatsLongInterval = 30; // seconds
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080080
Luigi Semenzato29c7ef92011-04-12 14:12:35 -070081const int MetricsDaemon::kMetricMeminfoInterval = 30; // seconds
82
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080083// Assume a max rate of 250Mb/s for reads (worse for writes) and 512 byte
84// sectors.
85const int MetricsDaemon::kMetricSectorsIOMax = 500000; // sectors/second
86const int MetricsDaemon::kMetricSectorsBuckets = 50; // buckets
Luigi Semenzato5bd764f2011-10-14 12:03:35 -070087// Page size is 4k, sector size is 0.5k. We're not interested in page fault
88// rates that the disk cannot sustain.
89const int MetricsDaemon::kMetricPageFaultsMax = kMetricSectorsIOMax / 8;
90const int MetricsDaemon::kMetricPageFaultsBuckets = 50;
91
92// Major page faults, i.e. the ones that require data to be read from disk.
93
94const char MetricsDaemon::kMetricPageFaultsLongName[] =
95 "Platform.PageFaultsLong";
96const char MetricsDaemon::kMetricPageFaultsShortName[] =
97 "Platform.PageFaultsShort";
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080098
Sonny Rao4b8aebb2013-07-31 23:18:31 -070099// Swap in and Swap out
100
101const char MetricsDaemon::kMetricSwapInLongName[] =
102 "Platform.SwapInLong";
103const char MetricsDaemon::kMetricSwapInShortName[] =
104 "Platform.SwapInShort";
105
106const char MetricsDaemon::kMetricSwapOutLongName[] =
107 "Platform.SwapOutLong";
108const char MetricsDaemon::kMetricSwapOutShortName[] =
109 "Platform.SwapOutShort";
110
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700111const char MetricsDaemon::kMetricsProcStatFileName[] = "/proc/stat";
112const int MetricsDaemon::kMetricsProcStatFirstLineItemsCount = 11;
113
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700114// Thermal CPU throttling.
115
116const char MetricsDaemon::kMetricScaledCpuFrequencyName[] =
117 "Platform.CpuFrequencyThermalScaling";
118
Luigi Semenzato96360192014-06-04 10:53:35 -0700119// Zram sysfs entries.
120
121const char MetricsDaemon::kComprDataSizeName[] = "compr_data_size";
122const char MetricsDaemon::kOrigDataSizeName[] = "orig_data_size";
123const char MetricsDaemon::kZeroPagesName[] = "zero_pages";
124
Luigi Semenzato8accd332011-05-17 16:37:18 -0700125// Memory use stats collection intervals. We collect some memory use interval
126// at these intervals after boot, and we stop collecting after the last one,
127// with the assumption that in most cases the memory use won't change much
128// after that.
129static const int kMemuseIntervals[] = {
130 1 * kSecondsPerMinute, // 1 minute mark
131 4 * kSecondsPerMinute, // 5 minute mark
132 25 * kSecondsPerMinute, // 0.5 hour mark
133 120 * kSecondsPerMinute, // 2.5 hour mark
134 600 * kSecondsPerMinute, // 12.5 hour mark
135};
136
Darin Petkovf1e85e42010-06-10 15:59:53 -0700137MetricsDaemon::MetricsDaemon()
Daniel Eratc83975a2014-04-04 08:53:44 -0700138 : update_stats_timeout_id_(-1),
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800139 memuse_final_time_(0),
Luigi Semenzato8accd332011-05-17 16:37:18 -0700140 memuse_interval_index_(0),
141 read_sectors_(0),
142 write_sectors_(0),
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700143 vmstats_(),
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700144 stats_state_(kStatsShort),
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700145 stats_initial_time_(0),
146 ticks_per_second_(0),
147 latest_cpu_use_ticks_(0) {}
Darin Petkovf1e85e42010-06-10 15:59:53 -0700148
Ken Mixter4c5daa42010-08-26 18:35:06 -0700149MetricsDaemon::~MetricsDaemon() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700150 if (update_stats_timeout_id_ > -1)
151 g_source_remove(update_stats_timeout_id_);
Ken Mixter4c5daa42010-08-26 18:35:06 -0700152}
153
Luigi Semenzato8accd332011-05-17 16:37:18 -0700154double MetricsDaemon::GetActiveTime() {
155 struct timespec ts;
156 int r = clock_gettime(CLOCK_MONOTONIC, &ts);
157 if (r < 0) {
158 PLOG(WARNING) << "clock_gettime(CLOCK_MONOTONIC) failed";
159 return 0;
160 } else {
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700161 return ts.tv_sec + static_cast<double>(ts.tv_nsec) / (1000 * 1000 * 1000);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700162 }
163}
164
Darin Petkov2ccef012010-05-05 16:06:37 -0700165void MetricsDaemon::Run(bool run_as_daemon) {
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800166 base::AtExitManager at_exit_manager;
167
Darin Petkov38d5cb02010-06-24 12:10:26 -0700168 if (run_as_daemon && daemon(0, 0) != 0)
169 return;
170
Ken Mixterccd84c02010-08-16 19:57:13 -0700171 if (CheckSystemCrash(kKernelCrashDetectedFile)) {
172 ProcessKernelCrash();
173 }
174
175 if (CheckSystemCrash(kUncleanShutdownDetectedFile)) {
176 ProcessUncleanShutdown();
177 }
178
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800179 // On OS version change, clear version stats (which are reported daily).
180 int32 version = GetOsVersionHash();
181 if (version_cycle_->Get() != version) {
182 version_cycle_->Set(version);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800183 kernel_crashes_version_count_->Set(0);
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700184 version_cumulative_active_use_->Set(0);
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700185 version_cumulative_cpu_use_->Set(0);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800186 }
187
Darin Petkov38d5cb02010-06-24 12:10:26 -0700188 Loop();
Darin Petkov65b01462010-04-14 13:32:20 -0700189}
190
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800191uint32 MetricsDaemon::GetOsVersionHash() {
192 static uint32 cached_version_hash = 0;
193 static bool version_hash_is_cached = false;
194 if (version_hash_is_cached)
195 return cached_version_hash;
196 version_hash_is_cached = true;
197 std::string version;
198 if (base::SysInfo::GetLsbReleaseValue("CHROMEOS_RELEASE_VERSION", &version)) {
199 cached_version_hash = base::Hash(version);
200 } else if (testing_) {
201 cached_version_hash = 42; // return any plausible value for the hash
202 } else {
203 LOG(FATAL) << "could not find CHROMEOS_RELEASE_VERSION";
204 }
205 return cached_version_hash;
206}
207
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800208void MetricsDaemon::Init(bool testing, MetricsLibraryInterface* metrics_lib,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700209 const string& diskstats_path,
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700210 const string& vmstats_path,
211 const string& scaling_max_freq_path,
Daniel Eratc83975a2014-04-04 08:53:44 -0700212 const string& cpuinfo_max_freq_path) {
Darin Petkov65b01462010-04-14 13:32:20 -0700213 testing_ = testing;
Darin Petkovfc91b422010-05-12 13:05:45 -0700214 DCHECK(metrics_lib != NULL);
215 metrics_lib_ = metrics_lib;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700216
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700217 // Get ticks per second (HZ) on this system.
218 // Sysconf cannot fail, so no sanity checks are needed.
219 ticks_per_second_ = sysconf(_SC_CLK_TCK);
220
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700221 daily_active_use_.reset(
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800222 new PersistentInteger("Logging.DailyUseTime"));
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700223 version_cumulative_active_use_.reset(
224 new PersistentInteger("Logging.CumulativeDailyUseTime"));
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700225 version_cumulative_cpu_use_.reset(
226 new PersistentInteger("Logging.CumulativeCpuTime"));
Darin Petkov38d5cb02010-06-24 12:10:26 -0700227
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800228 kernel_crash_interval_.reset(
229 new PersistentInteger("Logging.KernelCrashInterval"));
230 unclean_shutdown_interval_.reset(
231 new PersistentInteger("Logging.UncleanShutdownInterval"));
232 user_crash_interval_.reset(
233 new PersistentInteger("Logging.UserCrashInterval"));
Darin Petkov2ccef012010-05-05 16:06:37 -0700234
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800235 any_crashes_daily_count_.reset(
236 new PersistentInteger("Logging.AnyCrashesDaily"));
237 any_crashes_weekly_count_.reset(
238 new PersistentInteger("Logging.AnyCrashesWeekly"));
239 user_crashes_daily_count_.reset(
240 new PersistentInteger("Logging.UserCrashesDaily"));
241 user_crashes_weekly_count_.reset(
242 new PersistentInteger("Logging.UserCrashesWeekly"));
243 kernel_crashes_daily_count_.reset(
244 new PersistentInteger("Logging.KernelCrashesDaily"));
245 kernel_crashes_weekly_count_.reset(
246 new PersistentInteger("Logging.KernelCrashesWeekly"));
247 kernel_crashes_version_count_.reset(
248 new PersistentInteger("Logging.KernelCrashesSinceUpdate"));
249 unclean_shutdowns_daily_count_.reset(
250 new PersistentInteger("Logging.UncleanShutdownsDaily"));
251 unclean_shutdowns_weekly_count_.reset(
252 new PersistentInteger("Logging.UncleanShutdownsWeekly"));
Darin Petkov38d5cb02010-06-24 12:10:26 -0700253
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800254 daily_cycle_.reset(new PersistentInteger("daily.cycle"));
255 weekly_cycle_.reset(new PersistentInteger("weekly.cycle"));
256 version_cycle_.reset(new PersistentInteger("version.cycle"));
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800257
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700258 diskstats_path_ = diskstats_path;
259 vmstats_path_ = vmstats_path;
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700260 scaling_max_freq_path_ = scaling_max_freq_path;
261 cpuinfo_max_freq_path_ = cpuinfo_max_freq_path;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700262 StatsReporterInit();
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800263
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700264 // Start collecting meminfo stats.
265 ScheduleMeminfoCallback(kMetricMeminfoInterval);
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800266 memuse_final_time_ = GetActiveTime() + kMemuseIntervals[0];
267 ScheduleMemuseCallback(kMemuseIntervals[0]);
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700268
Darin Petkov2ccef012010-05-05 16:06:37 -0700269 // Don't setup D-Bus and GLib in test mode.
270 if (testing)
271 return;
Darin Petkov65b01462010-04-14 13:32:20 -0700272
Darin Petkov703ec972010-04-27 11:02:18 -0700273 g_type_init();
Ben Chan6f598422013-06-22 06:29:36 -0700274 dbus_threads_init_default();
Darin Petkov65b01462010-04-14 13:32:20 -0700275
Darin Petkov703ec972010-04-27 11:02:18 -0700276 DBusError error;
277 dbus_error_init(&error);
Darin Petkov65b01462010-04-14 13:32:20 -0700278
David James3b3add52010-06-04 15:01:19 -0700279 DBusConnection* connection = dbus_bus_get(DBUS_BUS_SYSTEM, &error);
Darin Petkov703ec972010-04-27 11:02:18 -0700280 LOG_IF(FATAL, dbus_error_is_set(&error)) <<
281 "No D-Bus connection: " << SAFE_MESSAGE(error);
Darin Petkov65b01462010-04-14 13:32:20 -0700282
Darin Petkov703ec972010-04-27 11:02:18 -0700283 dbus_connection_setup_with_g_main(connection, NULL);
Darin Petkov65b01462010-04-14 13:32:20 -0700284
Darin Petkov40f25732013-04-29 15:07:31 +0200285 vector<string> matches;
286 matches.push_back(
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800287 base::StringPrintf("type='signal',interface='%s',path='/',member='%s'",
288 kCrashReporterInterface,
289 kCrashReporterUserCrashSignal));
Darin Petkov40f25732013-04-29 15:07:31 +0200290
Darin Petkov703ec972010-04-27 11:02:18 -0700291 // Registers D-Bus matches for the signals we would like to catch.
Darin Petkov40f25732013-04-29 15:07:31 +0200292 for (vector<string>::const_iterator it = matches.begin();
293 it != matches.end(); ++it) {
294 const char* match = it->c_str();
Darin Petkov41e06232010-05-03 16:45:37 -0700295 DLOG(INFO) << "adding dbus match: " << match;
Darin Petkov703ec972010-04-27 11:02:18 -0700296 dbus_bus_add_match(connection, match, &error);
297 LOG_IF(FATAL, dbus_error_is_set(&error)) <<
298 "unable to add a match: " << SAFE_MESSAGE(error);
299 }
300
301 // Adds the D-Bus filter routine to be called back whenever one of
302 // the registered D-Bus matches is successful. The daemon is not
303 // activated for D-Bus messages that don't match.
304 CHECK(dbus_connection_add_filter(connection, MessageFilter, this, NULL));
Daniel Eratc83975a2014-04-04 08:53:44 -0700305
306 update_stats_timeout_id_ =
307 g_timeout_add(kUpdateStatsIntervalMs, &HandleUpdateStatsTimeout, this);
Darin Petkov65b01462010-04-14 13:32:20 -0700308}
309
310void MetricsDaemon::Loop() {
Darin Petkov703ec972010-04-27 11:02:18 -0700311 GMainLoop* loop = g_main_loop_new(NULL, false);
312 g_main_loop_run(loop);
Darin Petkov65b01462010-04-14 13:32:20 -0700313}
314
Darin Petkov703ec972010-04-27 11:02:18 -0700315// static
316DBusHandlerResult MetricsDaemon::MessageFilter(DBusConnection* connection,
317 DBusMessage* message,
318 void* user_data) {
Darin Petkov703ec972010-04-27 11:02:18 -0700319 int message_type = dbus_message_get_type(message);
320 if (message_type != DBUS_MESSAGE_TYPE_SIGNAL) {
Darin Petkov41e06232010-05-03 16:45:37 -0700321 DLOG(WARNING) << "unexpected message type " << message_type;
Darin Petkov703ec972010-04-27 11:02:18 -0700322 return DBUS_HANDLER_RESULT_NOT_YET_HANDLED;
323 }
324
325 // Signal messages always have interfaces.
Daniel Eratc83975a2014-04-04 08:53:44 -0700326 const std::string interface(dbus_message_get_interface(message));
327 const std::string member(dbus_message_get_member(message));
328 DLOG(INFO) << "Got " << interface << "." << member << " D-Bus signal";
Darin Petkov703ec972010-04-27 11:02:18 -0700329
330 MetricsDaemon* daemon = static_cast<MetricsDaemon*>(user_data);
331
332 DBusMessageIter iter;
333 dbus_message_iter_init(message, &iter);
Daniel Eratc83975a2014-04-04 08:53:44 -0700334 if (interface == kCrashReporterInterface) {
335 CHECK_EQ(member, kCrashReporterUserCrashSignal);
Darin Petkov1bb904e2010-06-16 15:58:06 -0700336 daemon->ProcessUserCrash();
Darin Petkov703ec972010-04-27 11:02:18 -0700337 } else {
Daniel Eratc83975a2014-04-04 08:53:44 -0700338 // Ignore messages from the bus itself.
Darin Petkov703ec972010-04-27 11:02:18 -0700339 return DBUS_HANDLER_RESULT_NOT_YET_HANDLED;
340 }
341
342 return DBUS_HANDLER_RESULT_HANDLED;
Darin Petkov65b01462010-04-14 13:32:20 -0700343}
344
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700345// One might argue that parts of this should go into
346// chromium/src/base/sys_info_chromeos.c instead, but put it here for now.
347
348TimeDelta MetricsDaemon::GetIncrementalCpuUse() {
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700349 FilePath proc_stat_path = FilePath(kMetricsProcStatFileName);
350 std::string proc_stat_string;
351 if (!base::ReadFileToString(proc_stat_path, &proc_stat_string)) {
352 LOG(WARNING) << "cannot open " << kMetricsProcStatFileName;
353 return TimeDelta();
354 }
355
356 std::vector<std::string> proc_stat_lines;
357 base::SplitString(proc_stat_string, '\n', &proc_stat_lines);
358 if (proc_stat_lines.empty()) {
359 LOG(WARNING) << "cannot parse " << kMetricsProcStatFileName
360 << ": " << proc_stat_string;
361 return TimeDelta();
362 }
363 std::vector<std::string> proc_stat_totals;
364 base::SplitStringAlongWhitespace(proc_stat_lines[0], &proc_stat_totals);
365
366 uint64 user_ticks, user_nice_ticks, system_ticks;
367 if (proc_stat_totals.size() != kMetricsProcStatFirstLineItemsCount ||
368 proc_stat_totals[0] != "cpu" ||
369 !base::StringToUint64(proc_stat_totals[1], &user_ticks) ||
370 !base::StringToUint64(proc_stat_totals[2], &user_nice_ticks) ||
371 !base::StringToUint64(proc_stat_totals[3], &system_ticks)) {
372 LOG(WARNING) << "cannot parse first line: " << proc_stat_lines[0];
373 return TimeDelta(base::TimeDelta::FromSeconds(0));
374 }
375
376 uint64 total_cpu_use_ticks = user_ticks + user_nice_ticks + system_ticks;
377
378 // Sanity check.
379 if (total_cpu_use_ticks < latest_cpu_use_ticks_) {
380 LOG(WARNING) << "CPU time decreasing from " << latest_cpu_use_ticks_
381 << " to " << total_cpu_use_ticks;
382 return TimeDelta();
383 }
384
385 uint64 diff = total_cpu_use_ticks - latest_cpu_use_ticks_;
386 latest_cpu_use_ticks_ = total_cpu_use_ticks;
387 // Use microseconds to avoid significant truncations.
388 return base::TimeDelta::FromMicroseconds(
389 diff * 1000 * 1000 / ticks_per_second_);
390}
391
Darin Petkov1bb904e2010-06-16 15:58:06 -0700392void MetricsDaemon::ProcessUserCrash() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700393 // Counts the active time up to now.
394 UpdateStats(TimeTicks::Now(), Time::Now());
Darin Petkov1bb904e2010-06-16 15:58:06 -0700395
396 // Reports the active use time since the last crash and resets it.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800397 SendCrashIntervalSample(user_crash_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700398
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800399 any_crashes_daily_count_->Add(1);
400 any_crashes_weekly_count_->Add(1);
401 user_crashes_daily_count_->Add(1);
402 user_crashes_weekly_count_->Add(1);
Darin Petkov1bb904e2010-06-16 15:58:06 -0700403}
404
Darin Petkov38d5cb02010-06-24 12:10:26 -0700405void MetricsDaemon::ProcessKernelCrash() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700406 // Counts the active time up to now.
407 UpdateStats(TimeTicks::Now(), Time::Now());
Darin Petkov38d5cb02010-06-24 12:10:26 -0700408
409 // Reports the active use time since the last crash and resets it.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800410 SendCrashIntervalSample(kernel_crash_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700411
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800412 any_crashes_daily_count_->Add(1);
413 any_crashes_weekly_count_->Add(1);
414 kernel_crashes_daily_count_->Add(1);
415 kernel_crashes_weekly_count_->Add(1);
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800416
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800417 kernel_crashes_version_count_->Add(1);
Darin Petkov38d5cb02010-06-24 12:10:26 -0700418}
419
Ken Mixterccd84c02010-08-16 19:57:13 -0700420void MetricsDaemon::ProcessUncleanShutdown() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700421 // Counts the active time up to now.
422 UpdateStats(TimeTicks::Now(), Time::Now());
Ken Mixterccd84c02010-08-16 19:57:13 -0700423
424 // Reports the active use time since the last crash and resets it.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800425 SendCrashIntervalSample(unclean_shutdown_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700426
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800427 unclean_shutdowns_daily_count_->Add(1);
428 unclean_shutdowns_weekly_count_->Add(1);
429 any_crashes_daily_count_->Add(1);
430 any_crashes_weekly_count_->Add(1);
Ken Mixterccd84c02010-08-16 19:57:13 -0700431}
432
Luigi Semenzato8accd332011-05-17 16:37:18 -0700433bool MetricsDaemon::CheckSystemCrash(const string& crash_file) {
Darin Petkov38d5cb02010-06-24 12:10:26 -0700434 FilePath crash_detected(crash_file);
Ben Chan2e6543d2014-02-05 23:26:25 -0800435 if (!base::PathExists(crash_detected))
Ken Mixterccd84c02010-08-16 19:57:13 -0700436 return false;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700437
438 // Deletes the crash-detected file so that the daemon doesn't report
439 // another kernel crash in case it's restarted.
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800440 base::DeleteFile(crash_detected, false); // not recursive
Ken Mixterccd84c02010-08-16 19:57:13 -0700441 return true;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700442}
443
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700444void MetricsDaemon::StatsReporterInit() {
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800445 DiskStatsReadStats(&read_sectors_, &write_sectors_);
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700446 VmStatsReadStats(&vmstats_);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800447 // The first time around just run the long stat, so we don't delay boot.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700448 stats_state_ = kStatsLong;
449 stats_initial_time_ = GetActiveTime();
450 if (stats_initial_time_ < 0) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700451 LOG(WARNING) << "not collecting disk stats";
452 } else {
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700453 ScheduleStatsCallback(kMetricStatsLongInterval);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700454 }
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800455}
456
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700457void MetricsDaemon::ScheduleStatsCallback(int wait) {
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800458 if (testing_) {
459 return;
460 }
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700461 g_timeout_add_seconds(wait, StatsCallbackStatic, this);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800462}
463
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700464bool MetricsDaemon::DiskStatsReadStats(uint64* read_sectors,
465 uint64* write_sectors) {
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800466 int nchars;
467 int nitems;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700468 bool success = false;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800469 char line[200];
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700470 if (diskstats_path_.empty()) {
471 return false;
472 }
Luigi Semenzato0f132bb2011-02-28 11:17:43 -0800473 int file = HANDLE_EINTR(open(diskstats_path_.c_str(), O_RDONLY));
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800474 if (file < 0) {
475 PLOG(WARNING) << "cannot open " << diskstats_path_;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700476 return false;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800477 }
478 nchars = HANDLE_EINTR(read(file, line, sizeof(line)));
479 if (nchars < 0) {
480 PLOG(WARNING) << "cannot read from " << diskstats_path_;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700481 return false;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800482 } else {
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700483 LOG_IF(WARNING, nchars == sizeof(line))
484 << "line too long in " << diskstats_path_;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800485 line[nchars] = '\0';
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700486 nitems = sscanf(line, "%*d %*d %" PRIu64 "d %*d %*d %*d %" PRIu64 "d",
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800487 read_sectors, write_sectors);
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700488 if (nitems == 2) {
489 success = true;
490 } else {
491 LOG(WARNING) << "found " << nitems << " items in "
492 << diskstats_path_ << ", expected 2";
493 }
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800494 }
Mike Frysinger3e8a8512014-05-14 16:14:37 -0400495 IGNORE_EINTR(close(file));
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700496 return success;
497}
498
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700499bool MetricsDaemon::VmStatsParseStats(const char* stats,
500 struct VmstatRecord* record) {
501 // a mapping of string name to field in VmstatRecord and whether we found it
502 struct mapping {
503 const string name;
504 uint64_t* value_p;
505 bool found;
506 } map[] =
507 { { .name = "pgmajfault",
508 .value_p = &record->page_faults_,
509 .found = false },
510 { .name = "pswpin",
511 .value_p = &record->swap_in_,
512 .found = false },
513 { .name = "pswpout",
514 .value_p = &record->swap_out_,
515 .found = false }, };
516
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700517 // Each line in the file has the form
518 // <ID> <VALUE>
519 // for instance:
520 // nr_free_pages 213427
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700521 vector<string> lines;
522 Tokenize(stats, "\n", &lines);
523 for (vector<string>::iterator it = lines.begin();
524 it != lines.end(); ++it) {
525 vector<string> tokens;
526 base::SplitString(*it, ' ', &tokens);
527 if (tokens.size() == 2) {
528 for (unsigned int i = 0; i < sizeof(map)/sizeof(struct mapping); i++) {
529 if (!tokens[0].compare(map[i].name)) {
530 if (!base::StringToUint64(tokens[1], map[i].value_p))
531 return false;
532 map[i].found = true;
533 }
534 }
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700535 } else {
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700536 LOG(WARNING) << "unexpected vmstat format";
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700537 }
538 }
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700539 // make sure we got all the stats
540 for (unsigned i = 0; i < sizeof(map)/sizeof(struct mapping); i++) {
541 if (map[i].found == false) {
542 LOG(WARNING) << "vmstat missing " << map[i].name;
543 return false;
544 }
545 }
546 return true;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700547}
548
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700549bool MetricsDaemon::VmStatsReadStats(struct VmstatRecord* stats) {
550 string value_string;
551 FilePath* path = new FilePath(vmstats_path_);
Ben Chan2e6543d2014-02-05 23:26:25 -0800552 if (!base::ReadFileToString(*path, &value_string)) {
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700553 delete path;
554 LOG(WARNING) << "cannot read " << vmstats_path_;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700555 return false;
556 }
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700557 delete path;
558 return VmStatsParseStats(value_string.c_str(), stats);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800559}
560
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700561bool MetricsDaemon::ReadFreqToInt(const string& sysfs_file_name, int* value) {
Luigi Semenzatod92d18c2013-06-04 13:24:21 -0700562 const FilePath sysfs_path(sysfs_file_name);
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700563 string value_string;
Ben Chan2e6543d2014-02-05 23:26:25 -0800564 if (!base::ReadFileToString(sysfs_path, &value_string)) {
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700565 LOG(WARNING) << "cannot read " << sysfs_path.value().c_str();
566 return false;
567 }
Ben Chan2e6543d2014-02-05 23:26:25 -0800568 if (!base::RemoveChars(value_string, "\n", &value_string)) {
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700569 LOG(WARNING) << "no newline in " << value_string;
570 // Continue even though the lack of newline is suspicious.
571 }
572 if (!base::StringToInt(value_string, value)) {
573 LOG(WARNING) << "cannot convert " << value_string << " to int";
574 return false;
575 }
576 return true;
577}
578
579void MetricsDaemon::SendCpuThrottleMetrics() {
580 // |max_freq| is 0 only the first time through.
581 static int max_freq = 0;
582 if (max_freq == -1)
583 // Give up, as sysfs did not report max_freq correctly.
584 return;
585 if (max_freq == 0 || testing_) {
586 // One-time initialization of max_freq. (Every time when testing.)
587 if (!ReadFreqToInt(cpuinfo_max_freq_path_, &max_freq)) {
588 max_freq = -1;
589 return;
590 }
591 if (max_freq == 0) {
592 LOG(WARNING) << "sysfs reports 0 max CPU frequency\n";
593 max_freq = -1;
594 return;
595 }
596 if (max_freq % 10000 == 1000) {
597 // Special case: system has turbo mode, and max non-turbo frequency is
598 // max_freq - 1000. This relies on "normal" (non-turbo) frequencies
599 // being multiples of (at least) 10 MHz. Although there is no guarantee
600 // of this, it seems a fairly reasonable assumption. Otherwise we should
601 // read scaling_available_frequencies, sort the frequencies, compare the
602 // two highest ones, and check if they differ by 1000 (kHz) (and that's a
603 // hack too, no telling when it will change).
604 max_freq -= 1000;
605 }
606 }
607 int scaled_freq = 0;
608 if (!ReadFreqToInt(scaling_max_freq_path_, &scaled_freq))
609 return;
610 // Frequencies are in kHz. If scaled_freq > max_freq, turbo is on, but
611 // scaled_freq is not the actual turbo frequency. We indicate this situation
612 // with a 101% value.
613 int percent = scaled_freq > max_freq ? 101 : scaled_freq / (max_freq / 100);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800614 SendLinearSample(kMetricScaledCpuFrequencyName, percent, 101, 102);
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700615}
616
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800617// static
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700618gboolean MetricsDaemon::StatsCallbackStatic(void* handle) {
619 (static_cast<MetricsDaemon*>(handle))->StatsCallback();
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800620 return false; // one-time callback
621}
622
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700623// Collects disk and vm stats alternating over a short and a long interval.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700624
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700625void MetricsDaemon::StatsCallback() {
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700626 uint64 read_sectors_now, write_sectors_now;
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700627 struct VmstatRecord vmstats_now;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700628 double time_now = GetActiveTime();
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700629 double delta_time = time_now - stats_initial_time_;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700630 if (testing_) {
631 // Fake the time when testing.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700632 delta_time = stats_state_ == kStatsShort ?
633 kMetricStatsShortInterval : kMetricStatsLongInterval;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700634 }
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700635 bool diskstats_success = DiskStatsReadStats(&read_sectors_now,
636 &write_sectors_now);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700637 int delta_read = read_sectors_now - read_sectors_;
638 int delta_write = write_sectors_now - write_sectors_;
639 int read_sectors_per_second = delta_read / delta_time;
640 int write_sectors_per_second = delta_write / delta_time;
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700641 bool vmstats_success = VmStatsReadStats(&vmstats_now);
642 uint64_t delta_faults = vmstats_now.page_faults_ - vmstats_.page_faults_;
643 uint64_t delta_swap_in = vmstats_now.swap_in_ - vmstats_.swap_in_;
644 uint64_t delta_swap_out = vmstats_now.swap_out_ - vmstats_.swap_out_;
645 uint64_t page_faults_per_second = delta_faults / delta_time;
646 uint64_t swap_in_per_second = delta_swap_in / delta_time;
647 uint64_t swap_out_per_second = delta_swap_out / delta_time;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800648
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700649 switch (stats_state_) {
650 case kStatsShort:
651 if (diskstats_success) {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800652 SendSample(kMetricReadSectorsShortName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700653 read_sectors_per_second,
654 1,
655 kMetricSectorsIOMax,
656 kMetricSectorsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800657 SendSample(kMetricWriteSectorsShortName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700658 write_sectors_per_second,
659 1,
660 kMetricSectorsIOMax,
661 kMetricSectorsBuckets);
662 }
663 if (vmstats_success) {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800664 SendSample(kMetricPageFaultsShortName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700665 page_faults_per_second,
666 1,
667 kMetricPageFaultsMax,
668 kMetricPageFaultsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800669 SendSample(kMetricSwapInShortName,
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700670 swap_in_per_second,
671 1,
672 kMetricPageFaultsMax,
673 kMetricPageFaultsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800674 SendSample(kMetricSwapOutShortName,
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700675 swap_out_per_second,
676 1,
677 kMetricPageFaultsMax,
678 kMetricPageFaultsBuckets);
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700679 }
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800680 // Schedule long callback.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700681 stats_state_ = kStatsLong;
682 ScheduleStatsCallback(kMetricStatsLongInterval -
683 kMetricStatsShortInterval);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800684 break;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700685 case kStatsLong:
686 if (diskstats_success) {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800687 SendSample(kMetricReadSectorsLongName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700688 read_sectors_per_second,
689 1,
690 kMetricSectorsIOMax,
691 kMetricSectorsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800692 SendSample(kMetricWriteSectorsLongName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700693 write_sectors_per_second,
694 1,
695 kMetricSectorsIOMax,
696 kMetricSectorsBuckets);
697 // Reset sector counters.
698 read_sectors_ = read_sectors_now;
699 write_sectors_ = write_sectors_now;
700 }
701 if (vmstats_success) {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800702 SendSample(kMetricPageFaultsLongName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700703 page_faults_per_second,
704 1,
705 kMetricPageFaultsMax,
706 kMetricPageFaultsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800707 SendSample(kMetricSwapInLongName,
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700708 swap_in_per_second,
709 1,
710 kMetricPageFaultsMax,
711 kMetricPageFaultsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800712 SendSample(kMetricSwapOutLongName,
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700713 swap_out_per_second,
714 1,
715 kMetricPageFaultsMax,
716 kMetricPageFaultsBuckets);
717
718 vmstats_ = vmstats_now;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700719 }
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700720 SendCpuThrottleMetrics();
Luigi Semenzato8accd332011-05-17 16:37:18 -0700721 // Set start time for new cycle.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700722 stats_initial_time_ = time_now;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800723 // Schedule short callback.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700724 stats_state_ = kStatsShort;
725 ScheduleStatsCallback(kMetricStatsShortInterval);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800726 break;
727 default:
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700728 LOG(FATAL) << "Invalid stats state";
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800729 }
730}
731
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700732void MetricsDaemon::ScheduleMeminfoCallback(int wait) {
733 if (testing_) {
734 return;
735 }
736 g_timeout_add_seconds(wait, MeminfoCallbackStatic, this);
737}
738
739// static
740gboolean MetricsDaemon::MeminfoCallbackStatic(void* handle) {
741 return (static_cast<MetricsDaemon*>(handle))->MeminfoCallback();
742}
743
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700744bool MetricsDaemon::MeminfoCallback() {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700745 string meminfo_raw;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700746 const FilePath meminfo_path("/proc/meminfo");
Ben Chan2e6543d2014-02-05 23:26:25 -0800747 if (!base::ReadFileToString(meminfo_path, &meminfo_raw)) {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700748 LOG(WARNING) << "cannot read " << meminfo_path.value().c_str();
749 return false;
750 }
Luigi Semenzato96360192014-06-04 10:53:35 -0700751 // Make both calls even if the first one fails.
752 bool success = ProcessMeminfo(meminfo_raw);
753 return ReportZram(base::FilePath(FILE_PATH_LITERAL("/sys/block/zram0"))) &&
754 success;
755}
756
757// static
758bool MetricsDaemon::ReadFileToUint64(const base::FilePath& path,
759 uint64* value) {
760 std::string content;
761 if (!base::ReadFileToString(path, &content)) {
762 PLOG(WARNING) << "cannot read " << path.MaybeAsASCII();
763 return false;
764 }
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700765 // Remove final newline.
766 base::TrimWhitespaceASCII(content, base::TRIM_TRAILING, &content);
Luigi Semenzato96360192014-06-04 10:53:35 -0700767 if (!base::StringToUint64(content, value)) {
768 LOG(WARNING) << "invalid integer: " << content;
769 return false;
770 }
771 return true;
772}
773
774bool MetricsDaemon::ReportZram(const base::FilePath& zram_dir) {
775 // Data sizes are in bytes. |zero_pages| is in number of pages.
776 uint64 compr_data_size, orig_data_size, zero_pages;
777 const size_t page_size = 4096;
778
779 if (!ReadFileToUint64(zram_dir.Append(kComprDataSizeName),
780 &compr_data_size) ||
781 !ReadFileToUint64(zram_dir.Append(kOrigDataSizeName), &orig_data_size) ||
782 !ReadFileToUint64(zram_dir.Append(kZeroPagesName), &zero_pages)) {
783 return false;
784 }
785
786 // |orig_data_size| does not include zero-filled pages.
787 orig_data_size += zero_pages * page_size;
788
789 const int compr_data_size_mb = compr_data_size >> 20;
790 const int savings_mb = (orig_data_size - compr_data_size) >> 20;
791 const int zero_ratio_percent = zero_pages * page_size * 100 / orig_data_size;
792
793 // Report compressed size in megabytes. 100 MB or less has little impact.
794 SendSample("Platform.ZramCompressedSize", compr_data_size_mb, 100, 4000, 50);
795 SendSample("Platform.ZramSavings", savings_mb, 100, 4000, 50);
796 // The compression ratio is multiplied by 100 for better resolution. The
797 // ratios of interest are between 1 and 6 (100% and 600% as reported). We
798 // don't want samples when very little memory is being compressed.
799 if (compr_data_size_mb >= 1) {
800 SendSample("Platform.ZramCompressionRatioPercent",
801 orig_data_size * 100 / compr_data_size, 100, 600, 50);
802 }
803 // The values of interest for zero_pages are between 1MB and 1GB. The units
804 // are number of pages.
805 SendSample("Platform.ZramZeroPages", zero_pages, 256, 256 * 1024, 50);
806 SendSample("Platform.ZramZeroRatioPercent", zero_ratio_percent, 1, 50, 50);
807
808 return true;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700809}
810
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700811bool MetricsDaemon::ProcessMeminfo(const string& meminfo_raw) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700812 static const MeminfoRecord fields_array[] = {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700813 { "MemTotal", "MemTotal" }, // SPECIAL CASE: total system memory
814 { "MemFree", "MemFree" },
815 { "Buffers", "Buffers" },
816 { "Cached", "Cached" },
817 // { "SwapCached", "SwapCached" },
818 { "Active", "Active" },
819 { "Inactive", "Inactive" },
820 { "ActiveAnon", "Active(anon)" },
821 { "InactiveAnon", "Inactive(anon)" },
822 { "ActiveFile" , "Active(file)" },
823 { "InactiveFile", "Inactive(file)" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800824 { "Unevictable", "Unevictable", kMeminfoOp_HistLog },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700825 // { "Mlocked", "Mlocked" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800826 { "SwapTotal", "SwapTotal", kMeminfoOp_SwapTotal },
827 { "SwapFree", "SwapFree", kMeminfoOp_SwapFree },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700828 // { "Dirty", "Dirty" },
829 // { "Writeback", "Writeback" },
830 { "AnonPages", "AnonPages" },
831 { "Mapped", "Mapped" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800832 { "Shmem", "Shmem", kMeminfoOp_HistLog },
833 { "Slab", "Slab", kMeminfoOp_HistLog },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700834 // { "SReclaimable", "SReclaimable" },
835 // { "SUnreclaim", "SUnreclaim" },
836 };
Luigi Semenzato8accd332011-05-17 16:37:18 -0700837 vector<MeminfoRecord> fields(fields_array,
838 fields_array + arraysize(fields_array));
839 if (!FillMeminfo(meminfo_raw, &fields)) {
840 return false;
841 }
842 int total_memory = fields[0].value;
843 if (total_memory == 0) {
844 // this "cannot happen"
845 LOG(WARNING) << "borked meminfo parser";
846 return false;
847 }
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800848 int swap_total = 0;
849 int swap_free = 0;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700850 // Send all fields retrieved, except total memory.
851 for (unsigned int i = 1; i < fields.size(); i++) {
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800852 string metrics_name = base::StringPrintf("Platform.Meminfo%s",
853 fields[i].name);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800854 int percent;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800855 switch (fields[i].op) {
856 case kMeminfoOp_HistPercent:
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800857 // report value as percent of total memory
858 percent = fields[i].value * 100 / total_memory;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800859 SendLinearSample(metrics_name, percent, 100, 101);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800860 break;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800861 case kMeminfoOp_HistLog:
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800862 // report value in kbytes, log scale, 4Gb max
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800863 SendSample(metrics_name, fields[i].value, 1, 4 * 1000 * 1000, 100);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800864 break;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800865 case kMeminfoOp_SwapTotal:
866 swap_total = fields[i].value;
867 case kMeminfoOp_SwapFree:
868 swap_free = fields[i].value;
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800869 break;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700870 }
871 }
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800872 if (swap_total > 0) {
873 int swap_used = swap_total - swap_free;
874 int swap_used_percent = swap_used * 100 / swap_total;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800875 SendSample("Platform.MeminfoSwapUsed", swap_used, 1, 8 * 1000 * 1000, 100);
876 SendLinearSample("Platform.MeminfoSwapUsedPercent", swap_used_percent,
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800877 100, 101);
878 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700879 return true;
880}
881
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700882bool MetricsDaemon::FillMeminfo(const string& meminfo_raw,
883 vector<MeminfoRecord>* fields) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700884 vector<string> lines;
885 unsigned int nlines = Tokenize(meminfo_raw, "\n", &lines);
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700886
887 // Scan meminfo output and collect field values. Each field name has to
888 // match a meminfo entry (case insensitive) after removing non-alpha
889 // characters from the entry.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700890 unsigned int ifield = 0;
891 for (unsigned int iline = 0;
892 iline < nlines && ifield < fields->size();
893 iline++) {
894 vector<string> tokens;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700895 Tokenize(lines[iline], ": ", &tokens);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700896 if (strcmp((*fields)[ifield].match, tokens[0].c_str()) == 0) {
897 // Name matches. Parse value and save.
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700898 char* rest;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700899 (*fields)[ifield].value =
900 static_cast<int>(strtol(tokens[1].c_str(), &rest, 10));
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700901 if (*rest != '\0') {
902 LOG(WARNING) << "missing meminfo value";
903 return false;
904 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700905 ifield++;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700906 }
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700907 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700908 if (ifield < fields->size()) {
909 // End of input reached while scanning.
910 LOG(WARNING) << "cannot find field " << (*fields)[ifield].match
911 << " and following";
912 return false;
913 }
914 return true;
915}
916
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800917void MetricsDaemon::ScheduleMemuseCallback(double interval) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700918 if (testing_) {
919 return;
920 }
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800921 g_timeout_add_seconds(interval, MemuseCallbackStatic, this);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700922}
923
924// static
925gboolean MetricsDaemon::MemuseCallbackStatic(void* handle) {
926 MetricsDaemon* daemon = static_cast<MetricsDaemon*>(handle);
927 daemon->MemuseCallback();
928 return false;
929}
930
931void MetricsDaemon::MemuseCallback() {
932 // Since we only care about active time (i.e. uptime minus sleep time) but
933 // the callbacks are driven by real time (uptime), we check if we should
934 // reschedule this callback due to intervening sleep periods.
935 double now = GetActiveTime();
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800936 // Avoid intervals of less than one second.
937 double remaining_time = ceil(memuse_final_time_ - now);
938 if (remaining_time > 0) {
939 ScheduleMemuseCallback(remaining_time);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700940 } else {
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800941 // Report stats and advance the measurement interval unless there are
942 // errors or we've completed the last interval.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700943 if (MemuseCallbackWork() &&
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800944 memuse_interval_index_ < arraysize(kMemuseIntervals)) {
945 double interval = kMemuseIntervals[memuse_interval_index_++];
946 memuse_final_time_ = now + interval;
947 ScheduleMemuseCallback(interval);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700948 }
949 }
950}
951
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700952bool MetricsDaemon::MemuseCallbackWork() {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700953 string meminfo_raw;
954 const FilePath meminfo_path("/proc/meminfo");
Ben Chan2e6543d2014-02-05 23:26:25 -0800955 if (!base::ReadFileToString(meminfo_path, &meminfo_raw)) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700956 LOG(WARNING) << "cannot read " << meminfo_path.value().c_str();
957 return false;
958 }
959 return ProcessMemuse(meminfo_raw);
960}
961
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700962bool MetricsDaemon::ProcessMemuse(const string& meminfo_raw) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700963 static const MeminfoRecord fields_array[] = {
964 { "MemTotal", "MemTotal" }, // SPECIAL CASE: total system memory
965 { "ActiveAnon", "Active(anon)" },
966 { "InactiveAnon", "Inactive(anon)" },
967 };
968 vector<MeminfoRecord> fields(fields_array,
969 fields_array + arraysize(fields_array));
970 if (!FillMeminfo(meminfo_raw, &fields)) {
971 return false;
972 }
973 int total = fields[0].value;
974 int active_anon = fields[1].value;
975 int inactive_anon = fields[2].value;
976 if (total == 0) {
977 // this "cannot happen"
978 LOG(WARNING) << "borked meminfo parser";
979 return false;
980 }
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800981 string metrics_name = base::StringPrintf("Platform.MemuseAnon%d",
982 memuse_interval_index_);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800983 SendLinearSample(metrics_name, (active_anon + inactive_anon) * 100 / total,
Luigi Semenzato8accd332011-05-17 16:37:18 -0700984 100, 101);
985 return true;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700986}
987
Luigi Semenzato5ef2e392014-04-15 15:15:02 -0700988void MetricsDaemon::ReportDailyUse(int use_seconds) {
989 if (use_seconds <= 0)
Darin Petkov1bb904e2010-06-16 15:58:06 -0700990 return;
991
Luigi Semenzato5ef2e392014-04-15 15:15:02 -0700992 int minutes = (use_seconds + kSecondsPerMinute / 2) / kSecondsPerMinute;
993 SendSample("Logging.DailyUseTime",
994 minutes,
995 1,
996 kMinutesPerDay * 30 * 2, // cumulative---two months worth
997 50);
Darin Petkovf1e85e42010-06-10 15:59:53 -0700998}
999
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -08001000void MetricsDaemon::SendSample(const string& name, int sample,
Darin Petkov11b8eb32010-05-18 11:00:59 -07001001 int min, int max, int nbuckets) {
Darin Petkovfc91b422010-05-12 13:05:45 -07001002 metrics_lib_->SendToUMA(name, sample, min, max, nbuckets);
Darin Petkov65b01462010-04-14 13:32:20 -07001003}
Luigi Semenzato29c7ef92011-04-12 14:12:35 -07001004
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001005void MetricsDaemon::SendKernelCrashesCumulativeCountStats() {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -08001006 // Report the number of crashes for this OS version, but don't clear the
1007 // counter. It is cleared elsewhere on version change.
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -07001008 int64 crashes_count = kernel_crashes_version_count_->Get();
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -08001009 SendSample(kernel_crashes_version_count_->Name(),
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -07001010 crashes_count,
1011 1, // value of first bucket
1012 500, // value of last bucket
1013 100); // number of buckets
1014
1015
1016 int64 cpu_use_ms = version_cumulative_cpu_use_->Get();
1017 SendSample(version_cumulative_cpu_use_->Name(),
1018 cpu_use_ms / 1000, // stat is in seconds
1019 1, // device may be used very little...
1020 8 * 1000 * 1000, // ... or a lot (a little over 90 days)
1021 100);
1022
1023 // On the first run after an autoupdate, cpu_use_ms and active_use_seconds
1024 // can be zero. Avoid division by zero.
1025 if (cpu_use_ms > 0) {
1026 // Send the crash frequency since update in number of crashes per CPU year.
1027 SendSample("Logging.KernelCrashesPerCpuYear",
1028 crashes_count * kSecondsPerDay * 365 * 1000 / cpu_use_ms,
1029 1,
1030 1000 * 1000, // about one crash every 30s of CPU time
1031 100);
1032 }
1033
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001034 int64 active_use_seconds = version_cumulative_active_use_->Get();
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -07001035 if (active_use_seconds > 0) {
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001036 SendSample(version_cumulative_active_use_->Name(),
1037 active_use_seconds / 1000, // stat is in seconds
1038 1, // device may be used very little...
1039 8 * 1000 * 1000, // ... or a lot (about 90 days)
1040 100);
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -07001041 // Same as above, but per year of active time.
1042 SendSample("Logging.KernelCrashesPerActiveYear",
1043 crashes_count * kSecondsPerDay * 365 / active_use_seconds,
1044 1,
1045 1000 * 1000, // about one crash every 30s of active time
1046 100);
1047 }
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -08001048}
1049
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001050void MetricsDaemon::SendDailyUseSample(
1051 const scoped_ptr<PersistentInteger>& use) {
1052 SendSample(use->Name(),
1053 use->GetAndClear(),
1054 1, // value of first bucket
1055 kSecondsPerDay, // value of last bucket
1056 50); // number of buckets
1057}
1058
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -08001059void MetricsDaemon::SendCrashIntervalSample(
1060 const scoped_ptr<PersistentInteger>& interval) {
1061 SendSample(interval->Name(),
1062 interval->GetAndClear(),
1063 1, // value of first bucket
1064 4 * kSecondsPerWeek, // value of last bucket
1065 50); // number of buckets
1066}
1067
1068void MetricsDaemon::SendCrashFrequencySample(
1069 const scoped_ptr<PersistentInteger>& frequency) {
1070 SendSample(frequency->Name(),
1071 frequency->GetAndClear(),
1072 1, // value of first bucket
1073 100, // value of last bucket
1074 50); // number of buckets
1075}
1076
1077void MetricsDaemon::SendLinearSample(const string& name, int sample,
Luigi Semenzato29c7ef92011-04-12 14:12:35 -07001078 int max, int nbuckets) {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -07001079 // TODO(semenzato): add a proper linear histogram to the Chrome external
1080 // metrics API.
1081 LOG_IF(FATAL, nbuckets != max + 1) << "unsupported histogram scale";
1082 metrics_lib_->SendEnumToUMA(name, sample, max);
1083}
Daniel Eratc83975a2014-04-04 08:53:44 -07001084
1085void MetricsDaemon::UpdateStats(TimeTicks now_ticks,
1086 Time now_wall_time) {
1087 const int elapsed_seconds = (now_ticks - last_update_stats_time_).InSeconds();
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001088 daily_active_use_->Add(elapsed_seconds);
1089 version_cumulative_active_use_->Add(elapsed_seconds);
Daniel Eratc83975a2014-04-04 08:53:44 -07001090 user_crash_interval_->Add(elapsed_seconds);
1091 kernel_crash_interval_->Add(elapsed_seconds);
1092 version_cumulative_cpu_use_->Add(GetIncrementalCpuUse().InMilliseconds());
1093 last_update_stats_time_ = now_ticks;
1094
1095 const TimeDelta since_epoch = now_wall_time - Time::UnixEpoch();
1096 const int day = since_epoch.InDays();
1097 const int week = day / 7;
1098
1099 if (daily_cycle_->Get() != day) {
1100 daily_cycle_->Set(day);
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001101 SendDailyUseSample(daily_active_use_);
1102 SendDailyUseSample(version_cumulative_active_use_);
Daniel Eratc83975a2014-04-04 08:53:44 -07001103 SendCrashFrequencySample(any_crashes_daily_count_);
1104 SendCrashFrequencySample(user_crashes_daily_count_);
1105 SendCrashFrequencySample(kernel_crashes_daily_count_);
1106 SendCrashFrequencySample(unclean_shutdowns_daily_count_);
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001107 SendKernelCrashesCumulativeCountStats();
Daniel Eratc83975a2014-04-04 08:53:44 -07001108 }
1109
1110 if (weekly_cycle_->Get() != week) {
1111 weekly_cycle_->Set(week);
1112 SendCrashFrequencySample(any_crashes_weekly_count_);
1113 SendCrashFrequencySample(user_crashes_weekly_count_);
1114 SendCrashFrequencySample(kernel_crashes_weekly_count_);
1115 SendCrashFrequencySample(unclean_shutdowns_weekly_count_);
1116 }
1117}
1118
1119// static
1120gboolean MetricsDaemon::HandleUpdateStatsTimeout(gpointer data) {
1121 static_cast<MetricsDaemon*>(data)->UpdateStats(TimeTicks::Now(), Time::Now());
1122 return TRUE;
1123}