blob: 634027842f293696e732736b08460a65dcd48a0d [file] [log] [blame]
Darin Petkov8032dd02011-05-09 16:33:19 -07001// Copyright (c) 2011 The Chromium OS Authors. All rights reserved.
Darin Petkov65b01462010-04-14 13:32:20 -07002// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
Bertrand SIMONNET4b915ae2015-07-28 15:38:14 -07005#include "metrics_daemon.h"
Darin Petkov65b01462010-04-14 13:32:20 -07006
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -08007#include <fcntl.h>
Luigi Semenzato4a6c9422014-06-30 18:12:28 -07008#include <inttypes.h>
Luigi Semenzato8accd332011-05-17 16:37:18 -07009#include <math.h>
Ken Mixter4c5daa42010-08-26 18:35:06 -070010#include <string.h>
Steve Funge86591e2014-12-01 13:38:21 -080011#include <sysexits.h>
Luigi Semenzato8accd332011-05-17 16:37:18 -070012#include <time.h>
Darin Petkov65b01462010-04-14 13:32:20 -070013
Bertrand SIMONNET4b915ae2015-07-28 15:38:14 -070014#include <base/bind.h>
Luigi Semenzato859b3f02014-02-05 15:33:19 -080015#include <base/files/file_path.h>
Ben Chan51bf92a2014-09-05 08:21:06 -070016#include <base/files/file_util.h>
Luigi Semenzato859b3f02014-02-05 15:33:19 -080017#include <base/hash.h>
Darin Petkov65b01462010-04-14 13:32:20 -070018#include <base/logging.h>
Ben Chan2e6543d2014-02-05 23:26:25 -080019#include <base/strings/string_number_conversions.h>
20#include <base/strings/string_split.h>
21#include <base/strings/string_util.h>
22#include <base/strings/stringprintf.h>
Luigi Semenzato859b3f02014-02-05 15:33:19 -080023#include <base/sys_info.h>
Steve Funge86591e2014-12-01 13:38:21 -080024#include <dbus/dbus.h>
25#include <dbus/message.h>
Bertrand SIMONNETbae5dcc2015-08-04 14:12:10 -070026
27#include "constants.h"
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -070028#include "uploader/upload_service.h"
Darin Petkov65b01462010-04-14 13:32:20 -070029
Ben Chan2e6543d2014-02-05 23:26:25 -080030using base::FilePath;
31using base::StringPrintf;
Darin Petkovf27f0362010-06-04 13:14:19 -070032using base::Time;
33using base::TimeDelta;
34using base::TimeTicks;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -080035using chromeos_metrics::PersistentInteger;
Luigi Semenzato8accd332011-05-17 16:37:18 -070036using std::map;
Darin Petkov38d5cb02010-06-24 12:10:26 -070037using std::string;
Luigi Semenzato8accd332011-05-17 16:37:18 -070038using std::vector;
39
namespace {

// Yields the |message| member of the error object |e|, or the literal
// "unknown error" when that member is null.
#define SAFE_MESSAGE(e) (e.message ? e.message : "unknown error")

// D-Bus interface and signal name of the crash reporter, plus the printf-style
// template (interface, member) used to build the match rule for that signal.
const char kCrashReporterInterface[] = "org.chromium.CrashReporter";
const char kCrashReporterUserCrashSignal[] = "UserCrash";
const char kCrashReporterMatchRule[] =
    "type='signal',interface='%s',path='/',member='%s'";

// Calendar arithmetic helpers.
const int kSecondsPerMinute = 60;
const int kMinutesPerHour = 60;
const int kHoursPerDay = 24;
const int kMinutesPerDay = kHoursPerDay * kMinutesPerHour;
const int kSecondsPerDay = kSecondsPerMinute * kMinutesPerDay;
const int kDaysPerWeek = 7;
const int kSecondsPerWeek = kSecondsPerDay * kDaysPerWeek;

// Interval between calls to UpdateStats(), in milliseconds.
const uint32_t kUpdateStatsIntervalMs = 300000;

// Marker files whose presence is checked (and which are then deleted) at
// daemon start-up.
const char kKernelCrashDetectedFile[] = "/var/run/kernel-crash-detected";
const char kUncleanShutdownDetectedFile[] =
    "/var/run/unclean-shutdown-detected";

}  // namespace
65
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080066// disk stats metrics
67
68// The {Read,Write}Sectors numbers are in sectors/second.
69// A sector is usually 512 bytes.
70
71const char MetricsDaemon::kMetricReadSectorsLongName[] =
72 "Platform.ReadSectorsLong";
73const char MetricsDaemon::kMetricWriteSectorsLongName[] =
74 "Platform.WriteSectorsLong";
75const char MetricsDaemon::kMetricReadSectorsShortName[] =
76 "Platform.ReadSectorsShort";
77const char MetricsDaemon::kMetricWriteSectorsShortName[] =
78 "Platform.WriteSectorsShort";
79
Luigi Semenzato5bd764f2011-10-14 12:03:35 -070080const int MetricsDaemon::kMetricStatsShortInterval = 1; // seconds
81const int MetricsDaemon::kMetricStatsLongInterval = 30; // seconds
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080082
Luigi Semenzato29c7ef92011-04-12 14:12:35 -070083const int MetricsDaemon::kMetricMeminfoInterval = 30; // seconds
84
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080085// Assume a max rate of 250Mb/s for reads (worse for writes) and 512 byte
86// sectors.
87const int MetricsDaemon::kMetricSectorsIOMax = 500000; // sectors/second
88const int MetricsDaemon::kMetricSectorsBuckets = 50; // buckets
Luigi Semenzato5bd764f2011-10-14 12:03:35 -070089// Page size is 4k, sector size is 0.5k. We're not interested in page fault
90// rates that the disk cannot sustain.
91const int MetricsDaemon::kMetricPageFaultsMax = kMetricSectorsIOMax / 8;
92const int MetricsDaemon::kMetricPageFaultsBuckets = 50;
93
94// Major page faults, i.e. the ones that require data to be read from disk.
95
96const char MetricsDaemon::kMetricPageFaultsLongName[] =
97 "Platform.PageFaultsLong";
98const char MetricsDaemon::kMetricPageFaultsShortName[] =
99 "Platform.PageFaultsShort";
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800100
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700101// Swap in and Swap out
102
103const char MetricsDaemon::kMetricSwapInLongName[] =
104 "Platform.SwapInLong";
105const char MetricsDaemon::kMetricSwapInShortName[] =
106 "Platform.SwapInShort";
107
108const char MetricsDaemon::kMetricSwapOutLongName[] =
109 "Platform.SwapOutLong";
110const char MetricsDaemon::kMetricSwapOutShortName[] =
111 "Platform.SwapOutShort";
112
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700113const char MetricsDaemon::kMetricsProcStatFileName[] = "/proc/stat";
114const int MetricsDaemon::kMetricsProcStatFirstLineItemsCount = 11;
115
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700116// Thermal CPU throttling.
117
118const char MetricsDaemon::kMetricScaledCpuFrequencyName[] =
119 "Platform.CpuFrequencyThermalScaling";
120
Luigi Semenzato96360192014-06-04 10:53:35 -0700121// Zram sysfs entries.
122
123const char MetricsDaemon::kComprDataSizeName[] = "compr_data_size";
124const char MetricsDaemon::kOrigDataSizeName[] = "orig_data_size";
125const char MetricsDaemon::kZeroPagesName[] = "zero_pages";
126
Luigi Semenzato8accd332011-05-17 16:37:18 -0700127// Memory use stats collection intervals. We collect some memory use interval
128// at these intervals after boot, and we stop collecting after the last one,
129// with the assumption that in most cases the memory use won't change much
130// after that.
131static const int kMemuseIntervals[] = {
132 1 * kSecondsPerMinute, // 1 minute mark
133 4 * kSecondsPerMinute, // 5 minute mark
134 25 * kSecondsPerMinute, // 0.5 hour mark
135 120 * kSecondsPerMinute, // 2.5 hour mark
136 600 * kSecondsPerMinute, // 12.5 hour mark
137};
138
Darin Petkovf1e85e42010-06-10 15:59:53 -0700139MetricsDaemon::MetricsDaemon()
Steve Funge86591e2014-12-01 13:38:21 -0800140 : memuse_final_time_(0),
Luigi Semenzato8accd332011-05-17 16:37:18 -0700141 memuse_interval_index_(0),
142 read_sectors_(0),
143 write_sectors_(0),
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700144 vmstats_(),
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700145 stats_state_(kStatsShort),
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700146 stats_initial_time_(0),
147 ticks_per_second_(0),
148 latest_cpu_use_ticks_(0) {}
Darin Petkovf1e85e42010-06-10 15:59:53 -0700149
Ken Mixter4c5daa42010-08-26 18:35:06 -0700150MetricsDaemon::~MetricsDaemon() {
Ken Mixter4c5daa42010-08-26 18:35:06 -0700151}
152
Luigi Semenzato8accd332011-05-17 16:37:18 -0700153double MetricsDaemon::GetActiveTime() {
154 struct timespec ts;
155 int r = clock_gettime(CLOCK_MONOTONIC, &ts);
156 if (r < 0) {
157 PLOG(WARNING) << "clock_gettime(CLOCK_MONOTONIC) failed";
158 return 0;
159 } else {
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700160 return ts.tv_sec + static_cast<double>(ts.tv_nsec) / (1000 * 1000 * 1000);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700161 }
162}
163
Steve Funge86591e2014-12-01 13:38:21 -0800164int MetricsDaemon::Run() {
Ken Mixterccd84c02010-08-16 19:57:13 -0700165 if (CheckSystemCrash(kKernelCrashDetectedFile)) {
166 ProcessKernelCrash();
167 }
168
169 if (CheckSystemCrash(kUncleanShutdownDetectedFile)) {
170 ProcessUncleanShutdown();
171 }
172
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800173 // On OS version change, clear version stats (which are reported daily).
Ben Chanf05ab402014-08-07 00:54:59 -0700174 int32_t version = GetOsVersionHash();
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800175 if (version_cycle_->Get() != version) {
176 version_cycle_->Set(version);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800177 kernel_crashes_version_count_->Set(0);
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700178 version_cumulative_active_use_->Set(0);
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700179 version_cumulative_cpu_use_->Set(0);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800180 }
181
Steve Funge86591e2014-12-01 13:38:21 -0800182 return chromeos::DBusDaemon::Run();
Darin Petkov65b01462010-04-14 13:32:20 -0700183}
184
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700185void MetricsDaemon::RunUploaderTest() {
Bertrand SIMONNET71a62ef2014-10-07 11:26:25 -0700186 upload_service_.reset(new UploadService(new SystemProfileCache(true,
187 config_root_),
Bertrand SIMONNETe4fa61e2015-02-18 09:38:55 -0800188 metrics_lib_,
Bertrand SIMONNET71a62ef2014-10-07 11:26:25 -0700189 server_));
Bertrand SIMONNETcac74e12014-10-09 10:14:13 -0700190 upload_service_->Init(upload_interval_, metrics_file_);
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700191 upload_service_->UploadEvent();
192}
193
Ben Chanf05ab402014-08-07 00:54:59 -0700194uint32_t MetricsDaemon::GetOsVersionHash() {
195 static uint32_t cached_version_hash = 0;
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800196 static bool version_hash_is_cached = false;
197 if (version_hash_is_cached)
198 return cached_version_hash;
199 version_hash_is_cached = true;
Bertrand SIMONNETbae5dcc2015-08-04 14:12:10 -0700200 std::string version = metrics::kDefaultVersion;
201 // The version might not be set for development devices. In this case, use the
202 // zero version.
203 base::SysInfo::GetLsbReleaseValue("BRILLO_VERSION", &version);
204 cached_version_hash = base::Hash(version);
205 if (testing_) {
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800206 cached_version_hash = 42; // return any plausible value for the hash
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800207 }
208 return cached_version_hash;
209}
210
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700211void MetricsDaemon::Init(bool testing,
212 bool uploader_active,
213 MetricsLibraryInterface* metrics_lib,
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700214 const string& vmstats_path,
215 const string& scaling_max_freq_path,
Steve Fung67906c62014-10-06 15:15:30 -0700216 const string& cpuinfo_max_freq_path,
Bertrand SIMONNETcac74e12014-10-09 10:14:13 -0700217 const base::TimeDelta& upload_interval,
Steve Fung67906c62014-10-06 15:15:30 -0700218 const string& server,
Bertrand SIMONNET71a62ef2014-10-07 11:26:25 -0700219 const string& metrics_file,
220 const string& config_root) {
Darin Petkov65b01462010-04-14 13:32:20 -0700221 testing_ = testing;
Steve Funge86591e2014-12-01 13:38:21 -0800222 uploader_active_ = uploader_active;
Bertrand SIMONNET71a62ef2014-10-07 11:26:25 -0700223 config_root_ = config_root;
Alex Vakulenko14595032014-08-28 14:59:56 -0700224 DCHECK(metrics_lib != nullptr);
Darin Petkovfc91b422010-05-12 13:05:45 -0700225 metrics_lib_ = metrics_lib;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700226
Bertrand SIMONNETcac74e12014-10-09 10:14:13 -0700227 upload_interval_ = upload_interval;
Steve Fung67906c62014-10-06 15:15:30 -0700228 server_ = server;
229 metrics_file_ = metrics_file;
230
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700231 // Get ticks per second (HZ) on this system.
232 // Sysconf cannot fail, so no sanity checks are needed.
233 ticks_per_second_ = sysconf(_SC_CLK_TCK);
234
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700235 daily_active_use_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700236 new PersistentInteger("Platform.DailyUseTime"));
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700237 version_cumulative_active_use_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700238 new PersistentInteger("Platform.CumulativeDailyUseTime"));
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700239 version_cumulative_cpu_use_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700240 new PersistentInteger("Platform.CumulativeCpuTime"));
Darin Petkov38d5cb02010-06-24 12:10:26 -0700241
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800242 kernel_crash_interval_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700243 new PersistentInteger("Platform.KernelCrashInterval"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800244 unclean_shutdown_interval_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700245 new PersistentInteger("Platform.UncleanShutdownInterval"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800246 user_crash_interval_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700247 new PersistentInteger("Platform.UserCrashInterval"));
Darin Petkov2ccef012010-05-05 16:06:37 -0700248
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800249 any_crashes_daily_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700250 new PersistentInteger("Platform.AnyCrashesDaily"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800251 any_crashes_weekly_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700252 new PersistentInteger("Platform.AnyCrashesWeekly"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800253 user_crashes_daily_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700254 new PersistentInteger("Platform.UserCrashesDaily"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800255 user_crashes_weekly_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700256 new PersistentInteger("Platform.UserCrashesWeekly"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800257 kernel_crashes_daily_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700258 new PersistentInteger("Platform.KernelCrashesDaily"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800259 kernel_crashes_weekly_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700260 new PersistentInteger("Platform.KernelCrashesWeekly"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800261 kernel_crashes_version_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700262 new PersistentInteger("Platform.KernelCrashesSinceUpdate"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800263 unclean_shutdowns_daily_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700264 new PersistentInteger("Platform.UncleanShutdownsDaily"));
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800265 unclean_shutdowns_weekly_count_.reset(
Luigi Semenzatodc865892015-07-09 08:28:08 -0700266 new PersistentInteger("Platform.UncleanShutdownsWeekly"));
Darin Petkov38d5cb02010-06-24 12:10:26 -0700267
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800268 daily_cycle_.reset(new PersistentInteger("daily.cycle"));
269 weekly_cycle_.reset(new PersistentInteger("weekly.cycle"));
270 version_cycle_.reset(new PersistentInteger("version.cycle"));
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800271
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700272 vmstats_path_ = vmstats_path;
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700273 scaling_max_freq_path_ = scaling_max_freq_path;
274 cpuinfo_max_freq_path_ = cpuinfo_max_freq_path;
Steve Funge86591e2014-12-01 13:38:21 -0800275}
276
277int MetricsDaemon::OnInit() {
278 int return_code = chromeos::DBusDaemon::OnInit();
279 if (return_code != EX_OK)
280 return return_code;
281
Steve Funge86591e2014-12-01 13:38:21 -0800282 if (testing_)
283 return EX_OK;
Darin Petkov65b01462010-04-14 13:32:20 -0700284
Steve Funge86591e2014-12-01 13:38:21 -0800285 bus_->AssertOnDBusThread();
286 CHECK(bus_->SetUpAsyncOperations());
Darin Petkov65b01462010-04-14 13:32:20 -0700287
Steve Funge86591e2014-12-01 13:38:21 -0800288 if (bus_->is_connected()) {
289 const std::string match_rule =
290 base::StringPrintf(kCrashReporterMatchRule,
291 kCrashReporterInterface,
292 kCrashReporterUserCrashSignal);
Darin Petkov65b01462010-04-14 13:32:20 -0700293
Steve Funge86591e2014-12-01 13:38:21 -0800294 bus_->AddFilterFunction(&MetricsDaemon::MessageFilter, this);
Darin Petkov65b01462010-04-14 13:32:20 -0700295
Steve Funge86591e2014-12-01 13:38:21 -0800296 DBusError error;
297 dbus_error_init(&error);
298 bus_->AddMatch(match_rule, &error);
Darin Petkov65b01462010-04-14 13:32:20 -0700299
Steve Funge86591e2014-12-01 13:38:21 -0800300 if (dbus_error_is_set(&error)) {
301 LOG(ERROR) << "Failed to add match rule \"" << match_rule << "\". Got "
302 << error.name << ": " << error.message;
303 return EX_SOFTWARE;
304 }
305 } else {
306 LOG(ERROR) << "DBus isn't connected.";
307 return EX_UNAVAILABLE;
Darin Petkov703ec972010-04-27 11:02:18 -0700308 }
309
Steve Funge86591e2014-12-01 13:38:21 -0800310 if (uploader_active_) {
Bertrand SIMONNETbae5dcc2015-08-04 14:12:10 -0700311 upload_service_.reset(
312 new UploadService(new SystemProfileCache(), metrics_lib_, server_));
313 upload_service_->Init(upload_interval_, metrics_file_);
Bertrand SIMONNET46b49da2014-06-25 14:38:07 -0700314 }
Steve Funge86591e2014-12-01 13:38:21 -0800315
316 return EX_OK;
Darin Petkov65b01462010-04-14 13:32:20 -0700317}
318
Steve Funge86591e2014-12-01 13:38:21 -0800319void MetricsDaemon::OnShutdown(int* return_code) {
320 if (!testing_ && bus_->is_connected()) {
321 const std::string match_rule =
322 base::StringPrintf(kCrashReporterMatchRule,
323 kCrashReporterInterface,
324 kCrashReporterUserCrashSignal);
325
326 bus_->RemoveFilterFunction(&MetricsDaemon::MessageFilter, this);
327
328 DBusError error;
329 dbus_error_init(&error);
330 bus_->RemoveMatch(match_rule, &error);
331
332 if (dbus_error_is_set(&error)) {
333 LOG(ERROR) << "Failed to remove match rule \"" << match_rule << "\". Got "
334 << error.name << ": " << error.message;
335 }
336 }
337 chromeos::DBusDaemon::OnShutdown(return_code);
Darin Petkov65b01462010-04-14 13:32:20 -0700338}
339
Darin Petkov703ec972010-04-27 11:02:18 -0700340// static
341DBusHandlerResult MetricsDaemon::MessageFilter(DBusConnection* connection,
342 DBusMessage* message,
343 void* user_data) {
Darin Petkov703ec972010-04-27 11:02:18 -0700344 int message_type = dbus_message_get_type(message);
345 if (message_type != DBUS_MESSAGE_TYPE_SIGNAL) {
Darin Petkov41e06232010-05-03 16:45:37 -0700346 DLOG(WARNING) << "unexpected message type " << message_type;
Darin Petkov703ec972010-04-27 11:02:18 -0700347 return DBUS_HANDLER_RESULT_NOT_YET_HANDLED;
348 }
349
350 // Signal messages always have interfaces.
Daniel Eratc83975a2014-04-04 08:53:44 -0700351 const std::string interface(dbus_message_get_interface(message));
352 const std::string member(dbus_message_get_member(message));
353 DLOG(INFO) << "Got " << interface << "." << member << " D-Bus signal";
Darin Petkov703ec972010-04-27 11:02:18 -0700354
355 MetricsDaemon* daemon = static_cast<MetricsDaemon*>(user_data);
356
357 DBusMessageIter iter;
358 dbus_message_iter_init(message, &iter);
Daniel Eratc83975a2014-04-04 08:53:44 -0700359 if (interface == kCrashReporterInterface) {
360 CHECK_EQ(member, kCrashReporterUserCrashSignal);
Darin Petkov1bb904e2010-06-16 15:58:06 -0700361 daemon->ProcessUserCrash();
Darin Petkov703ec972010-04-27 11:02:18 -0700362 } else {
Daniel Eratc83975a2014-04-04 08:53:44 -0700363 // Ignore messages from the bus itself.
Darin Petkov703ec972010-04-27 11:02:18 -0700364 return DBUS_HANDLER_RESULT_NOT_YET_HANDLED;
365 }
366
367 return DBUS_HANDLER_RESULT_HANDLED;
Darin Petkov65b01462010-04-14 13:32:20 -0700368}
369
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700370// One might argue that parts of this should go into
371// chromium/src/base/sys_info_chromeos.c instead, but put it here for now.
372
373TimeDelta MetricsDaemon::GetIncrementalCpuUse() {
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700374 FilePath proc_stat_path = FilePath(kMetricsProcStatFileName);
375 std::string proc_stat_string;
376 if (!base::ReadFileToString(proc_stat_path, &proc_stat_string)) {
377 LOG(WARNING) << "cannot open " << kMetricsProcStatFileName;
378 return TimeDelta();
379 }
380
381 std::vector<std::string> proc_stat_lines;
382 base::SplitString(proc_stat_string, '\n', &proc_stat_lines);
383 if (proc_stat_lines.empty()) {
384 LOG(WARNING) << "cannot parse " << kMetricsProcStatFileName
385 << ": " << proc_stat_string;
386 return TimeDelta();
387 }
388 std::vector<std::string> proc_stat_totals;
389 base::SplitStringAlongWhitespace(proc_stat_lines[0], &proc_stat_totals);
390
Ben Chanf05ab402014-08-07 00:54:59 -0700391 uint64_t user_ticks, user_nice_ticks, system_ticks;
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700392 if (proc_stat_totals.size() != kMetricsProcStatFirstLineItemsCount ||
393 proc_stat_totals[0] != "cpu" ||
394 !base::StringToUint64(proc_stat_totals[1], &user_ticks) ||
395 !base::StringToUint64(proc_stat_totals[2], &user_nice_ticks) ||
396 !base::StringToUint64(proc_stat_totals[3], &system_ticks)) {
397 LOG(WARNING) << "cannot parse first line: " << proc_stat_lines[0];
398 return TimeDelta(base::TimeDelta::FromSeconds(0));
399 }
400
Ben Chanf05ab402014-08-07 00:54:59 -0700401 uint64_t total_cpu_use_ticks = user_ticks + user_nice_ticks + system_ticks;
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700402
403 // Sanity check.
404 if (total_cpu_use_ticks < latest_cpu_use_ticks_) {
405 LOG(WARNING) << "CPU time decreasing from " << latest_cpu_use_ticks_
406 << " to " << total_cpu_use_ticks;
407 return TimeDelta();
408 }
409
Ben Chanf05ab402014-08-07 00:54:59 -0700410 uint64_t diff = total_cpu_use_ticks - latest_cpu_use_ticks_;
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700411 latest_cpu_use_ticks_ = total_cpu_use_ticks;
412 // Use microseconds to avoid significant truncations.
413 return base::TimeDelta::FromMicroseconds(
414 diff * 1000 * 1000 / ticks_per_second_);
415}
416
Darin Petkov1bb904e2010-06-16 15:58:06 -0700417void MetricsDaemon::ProcessUserCrash() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700418 // Counts the active time up to now.
419 UpdateStats(TimeTicks::Now(), Time::Now());
Darin Petkov1bb904e2010-06-16 15:58:06 -0700420
421 // Reports the active use time since the last crash and resets it.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800422 SendCrashIntervalSample(user_crash_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700423
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800424 any_crashes_daily_count_->Add(1);
425 any_crashes_weekly_count_->Add(1);
426 user_crashes_daily_count_->Add(1);
427 user_crashes_weekly_count_->Add(1);
Darin Petkov1bb904e2010-06-16 15:58:06 -0700428}
429
Darin Petkov38d5cb02010-06-24 12:10:26 -0700430void MetricsDaemon::ProcessKernelCrash() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700431 // Counts the active time up to now.
432 UpdateStats(TimeTicks::Now(), Time::Now());
Darin Petkov38d5cb02010-06-24 12:10:26 -0700433
434 // Reports the active use time since the last crash and resets it.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800435 SendCrashIntervalSample(kernel_crash_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700436
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800437 any_crashes_daily_count_->Add(1);
438 any_crashes_weekly_count_->Add(1);
439 kernel_crashes_daily_count_->Add(1);
440 kernel_crashes_weekly_count_->Add(1);
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800441
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800442 kernel_crashes_version_count_->Add(1);
Darin Petkov38d5cb02010-06-24 12:10:26 -0700443}
444
Ken Mixterccd84c02010-08-16 19:57:13 -0700445void MetricsDaemon::ProcessUncleanShutdown() {
Daniel Eratc83975a2014-04-04 08:53:44 -0700446 // Counts the active time up to now.
447 UpdateStats(TimeTicks::Now(), Time::Now());
Ken Mixterccd84c02010-08-16 19:57:13 -0700448
449 // Reports the active use time since the last crash and resets it.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800450 SendCrashIntervalSample(unclean_shutdown_interval_);
Ken Mixterccd84c02010-08-16 19:57:13 -0700451
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800452 unclean_shutdowns_daily_count_->Add(1);
453 unclean_shutdowns_weekly_count_->Add(1);
454 any_crashes_daily_count_->Add(1);
455 any_crashes_weekly_count_->Add(1);
Ken Mixterccd84c02010-08-16 19:57:13 -0700456}
457
Luigi Semenzato8accd332011-05-17 16:37:18 -0700458bool MetricsDaemon::CheckSystemCrash(const string& crash_file) {
Darin Petkov38d5cb02010-06-24 12:10:26 -0700459 FilePath crash_detected(crash_file);
Ben Chan2e6543d2014-02-05 23:26:25 -0800460 if (!base::PathExists(crash_detected))
Ken Mixterccd84c02010-08-16 19:57:13 -0700461 return false;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700462
463 // Deletes the crash-detected file so that the daemon doesn't report
464 // another kernel crash in case it's restarted.
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800465 base::DeleteFile(crash_detected, false); // not recursive
Ken Mixterccd84c02010-08-16 19:57:13 -0700466 return true;
Darin Petkov38d5cb02010-06-24 12:10:26 -0700467}
468
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700469void MetricsDaemon::StatsReporterInit() {
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800470 DiskStatsReadStats(&read_sectors_, &write_sectors_);
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700471 VmStatsReadStats(&vmstats_);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800472 // The first time around just run the long stat, so we don't delay boot.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700473 stats_state_ = kStatsLong;
474 stats_initial_time_ = GetActiveTime();
475 if (stats_initial_time_ < 0) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700476 LOG(WARNING) << "not collecting disk stats";
477 } else {
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700478 ScheduleStatsCallback(kMetricStatsLongInterval);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700479 }
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800480}
481
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700482void MetricsDaemon::ScheduleStatsCallback(int wait) {
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800483 if (testing_) {
484 return;
485 }
Steve Funge86591e2014-12-01 13:38:21 -0800486 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
487 base::Bind(&MetricsDaemon::StatsCallback, base::Unretained(this)),
488 base::TimeDelta::FromSeconds(wait));
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800489}
490
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700491bool MetricsDaemon::VmStatsParseStats(const char* stats,
492 struct VmstatRecord* record) {
493 // a mapping of string name to field in VmstatRecord and whether we found it
494 struct mapping {
495 const string name;
496 uint64_t* value_p;
497 bool found;
498 } map[] =
499 { { .name = "pgmajfault",
500 .value_p = &record->page_faults_,
501 .found = false },
502 { .name = "pswpin",
503 .value_p = &record->swap_in_,
504 .found = false },
505 { .name = "pswpout",
506 .value_p = &record->swap_out_,
507 .found = false }, };
508
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700509 // Each line in the file has the form
510 // <ID> <VALUE>
511 // for instance:
512 // nr_free_pages 213427
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700513 vector<string> lines;
514 Tokenize(stats, "\n", &lines);
515 for (vector<string>::iterator it = lines.begin();
516 it != lines.end(); ++it) {
517 vector<string> tokens;
518 base::SplitString(*it, ' ', &tokens);
519 if (tokens.size() == 2) {
520 for (unsigned int i = 0; i < sizeof(map)/sizeof(struct mapping); i++) {
521 if (!tokens[0].compare(map[i].name)) {
522 if (!base::StringToUint64(tokens[1], map[i].value_p))
523 return false;
524 map[i].found = true;
525 }
526 }
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700527 } else {
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700528 LOG(WARNING) << "unexpected vmstat format";
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700529 }
530 }
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700531 // make sure we got all the stats
532 for (unsigned i = 0; i < sizeof(map)/sizeof(struct mapping); i++) {
533 if (map[i].found == false) {
534 LOG(WARNING) << "vmstat missing " << map[i].name;
535 return false;
536 }
537 }
538 return true;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700539}
540
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700541bool MetricsDaemon::VmStatsReadStats(struct VmstatRecord* stats) {
542 string value_string;
543 FilePath* path = new FilePath(vmstats_path_);
Ben Chan2e6543d2014-02-05 23:26:25 -0800544 if (!base::ReadFileToString(*path, &value_string)) {
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700545 delete path;
546 LOG(WARNING) << "cannot read " << vmstats_path_;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700547 return false;
548 }
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700549 delete path;
550 return VmStatsParseStats(value_string.c_str(), stats);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800551}
552
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700553bool MetricsDaemon::ReadFreqToInt(const string& sysfs_file_name, int* value) {
Luigi Semenzatod92d18c2013-06-04 13:24:21 -0700554 const FilePath sysfs_path(sysfs_file_name);
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700555 string value_string;
Ben Chan2e6543d2014-02-05 23:26:25 -0800556 if (!base::ReadFileToString(sysfs_path, &value_string)) {
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700557 LOG(WARNING) << "cannot read " << sysfs_path.value().c_str();
558 return false;
559 }
Ben Chan2e6543d2014-02-05 23:26:25 -0800560 if (!base::RemoveChars(value_string, "\n", &value_string)) {
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700561 LOG(WARNING) << "no newline in " << value_string;
562 // Continue even though the lack of newline is suspicious.
563 }
564 if (!base::StringToInt(value_string, value)) {
565 LOG(WARNING) << "cannot convert " << value_string << " to int";
566 return false;
567 }
568 return true;
569}
570
571void MetricsDaemon::SendCpuThrottleMetrics() {
572 // |max_freq| is 0 only the first time through.
573 static int max_freq = 0;
574 if (max_freq == -1)
575 // Give up, as sysfs did not report max_freq correctly.
576 return;
577 if (max_freq == 0 || testing_) {
578 // One-time initialization of max_freq. (Every time when testing.)
579 if (!ReadFreqToInt(cpuinfo_max_freq_path_, &max_freq)) {
580 max_freq = -1;
581 return;
582 }
583 if (max_freq == 0) {
584 LOG(WARNING) << "sysfs reports 0 max CPU frequency\n";
585 max_freq = -1;
586 return;
587 }
588 if (max_freq % 10000 == 1000) {
589 // Special case: system has turbo mode, and max non-turbo frequency is
590 // max_freq - 1000. This relies on "normal" (non-turbo) frequencies
591 // being multiples of (at least) 10 MHz. Although there is no guarantee
592 // of this, it seems a fairly reasonable assumption. Otherwise we should
593 // read scaling_available_frequencies, sort the frequencies, compare the
594 // two highest ones, and check if they differ by 1000 (kHz) (and that's a
595 // hack too, no telling when it will change).
596 max_freq -= 1000;
597 }
598 }
599 int scaled_freq = 0;
600 if (!ReadFreqToInt(scaling_max_freq_path_, &scaled_freq))
601 return;
602 // Frequencies are in kHz. If scaled_freq > max_freq, turbo is on, but
603 // scaled_freq is not the actual turbo frequency. We indicate this situation
604 // with a 101% value.
605 int percent = scaled_freq > max_freq ? 101 : scaled_freq / (max_freq / 100);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800606 SendLinearSample(kMetricScaledCpuFrequencyName, percent, 101, 102);
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700607}
608
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700609// Collects disk and vm stats alternating over a short and a long interval.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700610
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700611void MetricsDaemon::StatsCallback() {
Ben Chanf05ab402014-08-07 00:54:59 -0700612 uint64_t read_sectors_now, write_sectors_now;
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700613 struct VmstatRecord vmstats_now;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700614 double time_now = GetActiveTime();
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700615 double delta_time = time_now - stats_initial_time_;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700616 if (testing_) {
617 // Fake the time when testing.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700618 delta_time = stats_state_ == kStatsShort ?
619 kMetricStatsShortInterval : kMetricStatsLongInterval;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700620 }
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700621 bool diskstats_success = DiskStatsReadStats(&read_sectors_now,
622 &write_sectors_now);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700623 int delta_read = read_sectors_now - read_sectors_;
624 int delta_write = write_sectors_now - write_sectors_;
625 int read_sectors_per_second = delta_read / delta_time;
626 int write_sectors_per_second = delta_write / delta_time;
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700627 bool vmstats_success = VmStatsReadStats(&vmstats_now);
628 uint64_t delta_faults = vmstats_now.page_faults_ - vmstats_.page_faults_;
629 uint64_t delta_swap_in = vmstats_now.swap_in_ - vmstats_.swap_in_;
630 uint64_t delta_swap_out = vmstats_now.swap_out_ - vmstats_.swap_out_;
631 uint64_t page_faults_per_second = delta_faults / delta_time;
632 uint64_t swap_in_per_second = delta_swap_in / delta_time;
633 uint64_t swap_out_per_second = delta_swap_out / delta_time;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800634
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700635 switch (stats_state_) {
636 case kStatsShort:
637 if (diskstats_success) {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800638 SendSample(kMetricReadSectorsShortName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700639 read_sectors_per_second,
640 1,
641 kMetricSectorsIOMax,
642 kMetricSectorsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800643 SendSample(kMetricWriteSectorsShortName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700644 write_sectors_per_second,
645 1,
646 kMetricSectorsIOMax,
647 kMetricSectorsBuckets);
648 }
649 if (vmstats_success) {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800650 SendSample(kMetricPageFaultsShortName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700651 page_faults_per_second,
652 1,
653 kMetricPageFaultsMax,
654 kMetricPageFaultsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800655 SendSample(kMetricSwapInShortName,
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700656 swap_in_per_second,
657 1,
658 kMetricPageFaultsMax,
659 kMetricPageFaultsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800660 SendSample(kMetricSwapOutShortName,
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700661 swap_out_per_second,
662 1,
663 kMetricPageFaultsMax,
664 kMetricPageFaultsBuckets);
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700665 }
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800666 // Schedule long callback.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700667 stats_state_ = kStatsLong;
668 ScheduleStatsCallback(kMetricStatsLongInterval -
669 kMetricStatsShortInterval);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800670 break;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700671 case kStatsLong:
672 if (diskstats_success) {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800673 SendSample(kMetricReadSectorsLongName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700674 read_sectors_per_second,
675 1,
676 kMetricSectorsIOMax,
677 kMetricSectorsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800678 SendSample(kMetricWriteSectorsLongName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700679 write_sectors_per_second,
680 1,
681 kMetricSectorsIOMax,
682 kMetricSectorsBuckets);
683 // Reset sector counters.
684 read_sectors_ = read_sectors_now;
685 write_sectors_ = write_sectors_now;
686 }
687 if (vmstats_success) {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800688 SendSample(kMetricPageFaultsLongName,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700689 page_faults_per_second,
690 1,
691 kMetricPageFaultsMax,
692 kMetricPageFaultsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800693 SendSample(kMetricSwapInLongName,
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700694 swap_in_per_second,
695 1,
696 kMetricPageFaultsMax,
697 kMetricPageFaultsBuckets);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800698 SendSample(kMetricSwapOutLongName,
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700699 swap_out_per_second,
700 1,
701 kMetricPageFaultsMax,
702 kMetricPageFaultsBuckets);
703
704 vmstats_ = vmstats_now;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700705 }
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700706 SendCpuThrottleMetrics();
Luigi Semenzato8accd332011-05-17 16:37:18 -0700707 // Set start time for new cycle.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700708 stats_initial_time_ = time_now;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800709 // Schedule short callback.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700710 stats_state_ = kStatsShort;
711 ScheduleStatsCallback(kMetricStatsShortInterval);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800712 break;
713 default:
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700714 LOG(FATAL) << "Invalid stats state";
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800715 }
716}
717
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700718void MetricsDaemon::ScheduleMeminfoCallback(int wait) {
719 if (testing_) {
720 return;
721 }
Steve Funge86591e2014-12-01 13:38:21 -0800722 base::TimeDelta waitDelta = base::TimeDelta::FromSeconds(wait);
723 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
724 base::Bind(&MetricsDaemon::MeminfoCallback, base::Unretained(this),
Steve Fung8ab89c52015-01-05 13:48:30 -0800725 waitDelta),
Steve Funge86591e2014-12-01 13:38:21 -0800726 waitDelta);
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700727}
728
Steve Funge86591e2014-12-01 13:38:21 -0800729void MetricsDaemon::MeminfoCallback(base::TimeDelta wait) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700730 string meminfo_raw;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700731 const FilePath meminfo_path("/proc/meminfo");
Ben Chan2e6543d2014-02-05 23:26:25 -0800732 if (!base::ReadFileToString(meminfo_path, &meminfo_raw)) {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700733 LOG(WARNING) << "cannot read " << meminfo_path.value().c_str();
Steve Funge86591e2014-12-01 13:38:21 -0800734 return;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700735 }
Luigi Semenzato96360192014-06-04 10:53:35 -0700736 // Make both calls even if the first one fails.
737 bool success = ProcessMeminfo(meminfo_raw);
Steve Funge86591e2014-12-01 13:38:21 -0800738 bool reschedule =
739 ReportZram(base::FilePath(FILE_PATH_LITERAL("/sys/block/zram0"))) &&
Luigi Semenzato96360192014-06-04 10:53:35 -0700740 success;
Steve Funge86591e2014-12-01 13:38:21 -0800741 if (reschedule) {
742 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
743 base::Bind(&MetricsDaemon::MeminfoCallback, base::Unretained(this),
Steve Fung8ab89c52015-01-05 13:48:30 -0800744 wait),
Steve Funge86591e2014-12-01 13:38:21 -0800745 wait);
746 }
Luigi Semenzato96360192014-06-04 10:53:35 -0700747}
748
749// static
750bool MetricsDaemon::ReadFileToUint64(const base::FilePath& path,
Ben Chanf05ab402014-08-07 00:54:59 -0700751 uint64_t* value) {
Luigi Semenzato96360192014-06-04 10:53:35 -0700752 std::string content;
753 if (!base::ReadFileToString(path, &content)) {
754 PLOG(WARNING) << "cannot read " << path.MaybeAsASCII();
755 return false;
756 }
Luigi Semenzato4a6c9422014-06-30 18:12:28 -0700757 // Remove final newline.
758 base::TrimWhitespaceASCII(content, base::TRIM_TRAILING, &content);
Luigi Semenzato96360192014-06-04 10:53:35 -0700759 if (!base::StringToUint64(content, value)) {
760 LOG(WARNING) << "invalid integer: " << content;
761 return false;
762 }
763 return true;
764}
765
766bool MetricsDaemon::ReportZram(const base::FilePath& zram_dir) {
767 // Data sizes are in bytes. |zero_pages| is in number of pages.
Ben Chanf05ab402014-08-07 00:54:59 -0700768 uint64_t compr_data_size, orig_data_size, zero_pages;
Luigi Semenzato96360192014-06-04 10:53:35 -0700769 const size_t page_size = 4096;
770
771 if (!ReadFileToUint64(zram_dir.Append(kComprDataSizeName),
772 &compr_data_size) ||
773 !ReadFileToUint64(zram_dir.Append(kOrigDataSizeName), &orig_data_size) ||
774 !ReadFileToUint64(zram_dir.Append(kZeroPagesName), &zero_pages)) {
775 return false;
776 }
777
778 // |orig_data_size| does not include zero-filled pages.
779 orig_data_size += zero_pages * page_size;
780
781 const int compr_data_size_mb = compr_data_size >> 20;
782 const int savings_mb = (orig_data_size - compr_data_size) >> 20;
783 const int zero_ratio_percent = zero_pages * page_size * 100 / orig_data_size;
784
785 // Report compressed size in megabytes. 100 MB or less has little impact.
786 SendSample("Platform.ZramCompressedSize", compr_data_size_mb, 100, 4000, 50);
787 SendSample("Platform.ZramSavings", savings_mb, 100, 4000, 50);
788 // The compression ratio is multiplied by 100 for better resolution. The
789 // ratios of interest are between 1 and 6 (100% and 600% as reported). We
790 // don't want samples when very little memory is being compressed.
791 if (compr_data_size_mb >= 1) {
792 SendSample("Platform.ZramCompressionRatioPercent",
793 orig_data_size * 100 / compr_data_size, 100, 600, 50);
794 }
795 // The values of interest for zero_pages are between 1MB and 1GB. The units
796 // are number of pages.
797 SendSample("Platform.ZramZeroPages", zero_pages, 256, 256 * 1024, 50);
798 SendSample("Platform.ZramZeroRatioPercent", zero_ratio_percent, 1, 50, 50);
799
800 return true;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700801}
802
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700803bool MetricsDaemon::ProcessMeminfo(const string& meminfo_raw) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700804 static const MeminfoRecord fields_array[] = {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700805 { "MemTotal", "MemTotal" }, // SPECIAL CASE: total system memory
806 { "MemFree", "MemFree" },
807 { "Buffers", "Buffers" },
808 { "Cached", "Cached" },
809 // { "SwapCached", "SwapCached" },
810 { "Active", "Active" },
811 { "Inactive", "Inactive" },
812 { "ActiveAnon", "Active(anon)" },
813 { "InactiveAnon", "Inactive(anon)" },
814 { "ActiveFile" , "Active(file)" },
815 { "InactiveFile", "Inactive(file)" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800816 { "Unevictable", "Unevictable", kMeminfoOp_HistLog },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700817 // { "Mlocked", "Mlocked" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800818 { "SwapTotal", "SwapTotal", kMeminfoOp_SwapTotal },
819 { "SwapFree", "SwapFree", kMeminfoOp_SwapFree },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700820 // { "Dirty", "Dirty" },
821 // { "Writeback", "Writeback" },
822 { "AnonPages", "AnonPages" },
823 { "Mapped", "Mapped" },
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800824 { "Shmem", "Shmem", kMeminfoOp_HistLog },
825 { "Slab", "Slab", kMeminfoOp_HistLog },
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700826 // { "SReclaimable", "SReclaimable" },
827 // { "SUnreclaim", "SUnreclaim" },
828 };
Luigi Semenzato8accd332011-05-17 16:37:18 -0700829 vector<MeminfoRecord> fields(fields_array,
830 fields_array + arraysize(fields_array));
831 if (!FillMeminfo(meminfo_raw, &fields)) {
832 return false;
833 }
834 int total_memory = fields[0].value;
835 if (total_memory == 0) {
836 // this "cannot happen"
837 LOG(WARNING) << "borked meminfo parser";
838 return false;
839 }
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800840 int swap_total = 0;
841 int swap_free = 0;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700842 // Send all fields retrieved, except total memory.
843 for (unsigned int i = 1; i < fields.size(); i++) {
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800844 string metrics_name = base::StringPrintf("Platform.Meminfo%s",
845 fields[i].name);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800846 int percent;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800847 switch (fields[i].op) {
848 case kMeminfoOp_HistPercent:
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800849 // report value as percent of total memory
850 percent = fields[i].value * 100 / total_memory;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800851 SendLinearSample(metrics_name, percent, 100, 101);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800852 break;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800853 case kMeminfoOp_HistLog:
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800854 // report value in kbytes, log scale, 4Gb max
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800855 SendSample(metrics_name, fields[i].value, 1, 4 * 1000 * 1000, 100);
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800856 break;
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800857 case kMeminfoOp_SwapTotal:
858 swap_total = fields[i].value;
859 case kMeminfoOp_SwapFree:
860 swap_free = fields[i].value;
Luigi Semenzato3ccca062013-02-04 19:50:45 -0800861 break;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700862 }
863 }
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800864 if (swap_total > 0) {
865 int swap_used = swap_total - swap_free;
866 int swap_used_percent = swap_used * 100 / swap_total;
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800867 SendSample("Platform.MeminfoSwapUsed", swap_used, 1, 8 * 1000 * 1000, 100);
868 SendLinearSample("Platform.MeminfoSwapUsedPercent", swap_used_percent,
Luigi Semenzato942cbab2013-02-12 13:17:07 -0800869 100, 101);
870 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700871 return true;
872}
873
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700874bool MetricsDaemon::FillMeminfo(const string& meminfo_raw,
875 vector<MeminfoRecord>* fields) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700876 vector<string> lines;
877 unsigned int nlines = Tokenize(meminfo_raw, "\n", &lines);
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700878
879 // Scan meminfo output and collect field values. Each field name has to
880 // match a meminfo entry (case insensitive) after removing non-alpha
881 // characters from the entry.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700882 unsigned int ifield = 0;
883 for (unsigned int iline = 0;
884 iline < nlines && ifield < fields->size();
885 iline++) {
886 vector<string> tokens;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700887 Tokenize(lines[iline], ": ", &tokens);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700888 if (strcmp((*fields)[ifield].match, tokens[0].c_str()) == 0) {
889 // Name matches. Parse value and save.
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700890 char* rest;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700891 (*fields)[ifield].value =
892 static_cast<int>(strtol(tokens[1].c_str(), &rest, 10));
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700893 if (*rest != '\0') {
894 LOG(WARNING) << "missing meminfo value";
895 return false;
896 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700897 ifield++;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700898 }
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700899 }
Luigi Semenzato8accd332011-05-17 16:37:18 -0700900 if (ifield < fields->size()) {
901 // End of input reached while scanning.
902 LOG(WARNING) << "cannot find field " << (*fields)[ifield].match
903 << " and following";
904 return false;
905 }
906 return true;
907}
908
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800909void MetricsDaemon::ScheduleMemuseCallback(double interval) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700910 if (testing_) {
911 return;
912 }
Steve Funge86591e2014-12-01 13:38:21 -0800913 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
914 base::Bind(&MetricsDaemon::MemuseCallback, base::Unretained(this)),
915 base::TimeDelta::FromSeconds(interval));
Luigi Semenzato8accd332011-05-17 16:37:18 -0700916}
917
918void MetricsDaemon::MemuseCallback() {
919 // Since we only care about active time (i.e. uptime minus sleep time) but
920 // the callbacks are driven by real time (uptime), we check if we should
921 // reschedule this callback due to intervening sleep periods.
922 double now = GetActiveTime();
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800923 // Avoid intervals of less than one second.
924 double remaining_time = ceil(memuse_final_time_ - now);
925 if (remaining_time > 0) {
926 ScheduleMemuseCallback(remaining_time);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700927 } else {
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800928 // Report stats and advance the measurement interval unless there are
929 // errors or we've completed the last interval.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700930 if (MemuseCallbackWork() &&
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800931 memuse_interval_index_ < arraysize(kMemuseIntervals)) {
932 double interval = kMemuseIntervals[memuse_interval_index_++];
933 memuse_final_time_ = now + interval;
934 ScheduleMemuseCallback(interval);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700935 }
936 }
937}
938
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700939bool MetricsDaemon::MemuseCallbackWork() {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700940 string meminfo_raw;
941 const FilePath meminfo_path("/proc/meminfo");
Ben Chan2e6543d2014-02-05 23:26:25 -0800942 if (!base::ReadFileToString(meminfo_path, &meminfo_raw)) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700943 LOG(WARNING) << "cannot read " << meminfo_path.value().c_str();
944 return false;
945 }
946 return ProcessMemuse(meminfo_raw);
947}
948
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700949bool MetricsDaemon::ProcessMemuse(const string& meminfo_raw) {
Luigi Semenzato8accd332011-05-17 16:37:18 -0700950 static const MeminfoRecord fields_array[] = {
951 { "MemTotal", "MemTotal" }, // SPECIAL CASE: total system memory
952 { "ActiveAnon", "Active(anon)" },
953 { "InactiveAnon", "Inactive(anon)" },
954 };
955 vector<MeminfoRecord> fields(fields_array,
956 fields_array + arraysize(fields_array));
957 if (!FillMeminfo(meminfo_raw, &fields)) {
958 return false;
959 }
960 int total = fields[0].value;
961 int active_anon = fields[1].value;
962 int inactive_anon = fields[2].value;
963 if (total == 0) {
964 // this "cannot happen"
965 LOG(WARNING) << "borked meminfo parser";
966 return false;
967 }
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800968 string metrics_name = base::StringPrintf("Platform.MemuseAnon%d",
969 memuse_interval_index_);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800970 SendLinearSample(metrics_name, (active_anon + inactive_anon) * 100 / total,
Luigi Semenzato8accd332011-05-17 16:37:18 -0700971 100, 101);
972 return true;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700973}
974
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800975void MetricsDaemon::SendSample(const string& name, int sample,
Darin Petkov11b8eb32010-05-18 11:00:59 -0700976 int min, int max, int nbuckets) {
Darin Petkovfc91b422010-05-12 13:05:45 -0700977 metrics_lib_->SendToUMA(name, sample, min, max, nbuckets);
Darin Petkov65b01462010-04-14 13:32:20 -0700978}
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700979
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -0700980void MetricsDaemon::SendKernelCrashesCumulativeCountStats() {
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800981 // Report the number of crashes for this OS version, but don't clear the
982 // counter. It is cleared elsewhere on version change.
Ben Chanf05ab402014-08-07 00:54:59 -0700983 int64_t crashes_count = kernel_crashes_version_count_->Get();
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800984 SendSample(kernel_crashes_version_count_->Name(),
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700985 crashes_count,
986 1, // value of first bucket
987 500, // value of last bucket
988 100); // number of buckets
989
990
Ben Chanf05ab402014-08-07 00:54:59 -0700991 int64_t cpu_use_ms = version_cumulative_cpu_use_->Get();
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700992 SendSample(version_cumulative_cpu_use_->Name(),
993 cpu_use_ms / 1000, // stat is in seconds
994 1, // device may be used very little...
995 8 * 1000 * 1000, // ... or a lot (a little over 90 days)
996 100);
997
998 // On the first run after an autoupdate, cpu_use_ms and active_use_seconds
999 // can be zero. Avoid division by zero.
1000 if (cpu_use_ms > 0) {
1001 // Send the crash frequency since update in number of crashes per CPU year.
1002 SendSample("Logging.KernelCrashesPerCpuYear",
1003 crashes_count * kSecondsPerDay * 365 * 1000 / cpu_use_ms,
1004 1,
1005 1000 * 1000, // about one crash every 30s of CPU time
1006 100);
1007 }
1008
Ben Chanf05ab402014-08-07 00:54:59 -07001009 int64_t active_use_seconds = version_cumulative_active_use_->Get();
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -07001010 if (active_use_seconds > 0) {
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001011 SendSample(version_cumulative_active_use_->Name(),
1012 active_use_seconds / 1000, // stat is in seconds
1013 1, // device may be used very little...
1014 8 * 1000 * 1000, // ... or a lot (about 90 days)
1015 100);
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -07001016 // Same as above, but per year of active time.
1017 SendSample("Logging.KernelCrashesPerActiveYear",
1018 crashes_count * kSecondsPerDay * 365 / active_use_seconds,
1019 1,
1020 1000 * 1000, // about one crash every 30s of active time
1021 100);
1022 }
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -08001023}
1024
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001025void MetricsDaemon::SendDailyUseSample(
1026 const scoped_ptr<PersistentInteger>& use) {
1027 SendSample(use->Name(),
1028 use->GetAndClear(),
1029 1, // value of first bucket
1030 kSecondsPerDay, // value of last bucket
1031 50); // number of buckets
1032}
1033
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -08001034void MetricsDaemon::SendCrashIntervalSample(
1035 const scoped_ptr<PersistentInteger>& interval) {
1036 SendSample(interval->Name(),
1037 interval->GetAndClear(),
1038 1, // value of first bucket
1039 4 * kSecondsPerWeek, // value of last bucket
1040 50); // number of buckets
1041}
1042
1043void MetricsDaemon::SendCrashFrequencySample(
1044 const scoped_ptr<PersistentInteger>& frequency) {
1045 SendSample(frequency->Name(),
1046 frequency->GetAndClear(),
1047 1, // value of first bucket
1048 100, // value of last bucket
1049 50); // number of buckets
1050}
1051
1052void MetricsDaemon::SendLinearSample(const string& name, int sample,
Luigi Semenzato29c7ef92011-04-12 14:12:35 -07001053 int max, int nbuckets) {
Luigi Semenzato29c7ef92011-04-12 14:12:35 -07001054 // TODO(semenzato): add a proper linear histogram to the Chrome external
1055 // metrics API.
1056 LOG_IF(FATAL, nbuckets != max + 1) << "unsupported histogram scale";
1057 metrics_lib_->SendEnumToUMA(name, sample, max);
1058}
Daniel Eratc83975a2014-04-04 08:53:44 -07001059
1060void MetricsDaemon::UpdateStats(TimeTicks now_ticks,
1061 Time now_wall_time) {
1062 const int elapsed_seconds = (now_ticks - last_update_stats_time_).InSeconds();
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001063 daily_active_use_->Add(elapsed_seconds);
1064 version_cumulative_active_use_->Add(elapsed_seconds);
Daniel Eratc83975a2014-04-04 08:53:44 -07001065 user_crash_interval_->Add(elapsed_seconds);
1066 kernel_crash_interval_->Add(elapsed_seconds);
1067 version_cumulative_cpu_use_->Add(GetIncrementalCpuUse().InMilliseconds());
1068 last_update_stats_time_ = now_ticks;
1069
1070 const TimeDelta since_epoch = now_wall_time - Time::UnixEpoch();
1071 const int day = since_epoch.InDays();
1072 const int week = day / 7;
1073
1074 if (daily_cycle_->Get() != day) {
1075 daily_cycle_->Set(day);
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001076 SendDailyUseSample(daily_active_use_);
1077 SendDailyUseSample(version_cumulative_active_use_);
Daniel Eratc83975a2014-04-04 08:53:44 -07001078 SendCrashFrequencySample(any_crashes_daily_count_);
1079 SendCrashFrequencySample(user_crashes_daily_count_);
1080 SendCrashFrequencySample(kernel_crashes_daily_count_);
1081 SendCrashFrequencySample(unclean_shutdowns_daily_count_);
Luigi Semenzatoe5883fa2014-04-18 17:00:35 -07001082 SendKernelCrashesCumulativeCountStats();
Daniel Eratc83975a2014-04-04 08:53:44 -07001083 }
1084
1085 if (weekly_cycle_->Get() != week) {
1086 weekly_cycle_->Set(week);
1087 SendCrashFrequencySample(any_crashes_weekly_count_);
1088 SendCrashFrequencySample(user_crashes_weekly_count_);
1089 SendCrashFrequencySample(kernel_crashes_weekly_count_);
1090 SendCrashFrequencySample(unclean_shutdowns_weekly_count_);
1091 }
1092}
1093
Steve Funge86591e2014-12-01 13:38:21 -08001094void MetricsDaemon::HandleUpdateStatsTimeout() {
1095 UpdateStats(TimeTicks::Now(), Time::Now());
1096 base::MessageLoop::current()->PostDelayedTask(FROM_HERE,
1097 base::Bind(&MetricsDaemon::HandleUpdateStatsTimeout,
1098 base::Unretained(this)),
1099 base::TimeDelta::FromMilliseconds(kUpdateStatsIntervalMs));
Daniel Eratc83975a2014-04-04 08:53:44 -07001100}