// Copyright (c) 2010 The Chromium OS Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#ifndef METRICS_DAEMON_H_
#define METRICS_DAEMON_H_

#include <stdint.h>

#include <dbus/dbus.h>
#include <glib.h>

#include <map>
#include <string>
#include <vector>

#include <base/files/file_path.h>
#include <base/memory/scoped_ptr.h>
#include <base/time/time.h>
#include <gtest/gtest_prod.h>  // for FRIEND_TEST

#include "metrics_library.h"
#include "persistent_integer.h"

using chromeos_metrics::PersistentInteger;

Darin Petkov65b01462010-04-14 13:32:20 -070022class MetricsDaemon {
23
24 public:
Darin Petkovf1e85e42010-06-10 15:59:53 -070025 MetricsDaemon();
26 ~MetricsDaemon();
Darin Petkov65b01462010-04-14 13:32:20 -070027
Darin Petkov11b8eb32010-05-18 11:00:59 -070028 // Initializes.
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080029 void Init(bool testing, MetricsLibraryInterface* metrics_lib,
Luigi Semenzato5bd764f2011-10-14 12:03:35 -070030 const std::string& diskstats_path,
Luigi Semenzatofb3a8212013-05-07 16:55:00 -070031 const std::string& vmstats_path,
32 const std::string& cpuinfo_max_freq_path,
33 const std::string& scaling_max_freq_path);
Darin Petkov11b8eb32010-05-18 11:00:59 -070034
Darin Petkov703ec972010-04-27 11:02:18 -070035 // Does all the work. If |run_as_daemon| is true, daemonizes by
Darin Petkov2ccef012010-05-05 16:06:37 -070036 // forking.
37 void Run(bool run_as_daemon);
Darin Petkov65b01462010-04-14 13:32:20 -070038
39 private:
Darin Petkov2ccef012010-05-05 16:06:37 -070040 friend class MetricsDaemonTest;
Ken Mixterccd84c02010-08-16 19:57:13 -070041 FRIEND_TEST(MetricsDaemonTest, CheckSystemCrash);
Ken Mixter4c5daa42010-08-26 18:35:06 -070042 FRIEND_TEST(MetricsDaemonTest, ComputeEpochNoCurrent);
43 FRIEND_TEST(MetricsDaemonTest, ComputeEpochNoLast);
44 FRIEND_TEST(MetricsDaemonTest, GetHistogramPath);
45 FRIEND_TEST(MetricsDaemonTest, IsNewEpoch);
Darin Petkove579d662010-05-05 16:19:39 -070046 FRIEND_TEST(MetricsDaemonTest, MessageFilter);
Luigi Semenzato5bd764f2011-10-14 12:03:35 -070047 FRIEND_TEST(MetricsDaemonTest, ParseVmStats);
Darin Petkov38d5cb02010-06-24 12:10:26 -070048 FRIEND_TEST(MetricsDaemonTest, ProcessKernelCrash);
Luigi Semenzato29c7ef92011-04-12 14:12:35 -070049 FRIEND_TEST(MetricsDaemonTest, ProcessMeminfo);
50 FRIEND_TEST(MetricsDaemonTest, ProcessMeminfo2);
Ken Mixterccd84c02010-08-16 19:57:13 -070051 FRIEND_TEST(MetricsDaemonTest, ProcessUncleanShutdown);
Darin Petkov1bb904e2010-06-16 15:58:06 -070052 FRIEND_TEST(MetricsDaemonTest, ProcessUserCrash);
Ken Mixterccd84c02010-08-16 19:57:13 -070053 FRIEND_TEST(MetricsDaemonTest, ReportCrashesDailyFrequency);
Luigi Semenzatofb3a8212013-05-07 16:55:00 -070054 FRIEND_TEST(MetricsDaemonTest, ReadFreqToInt);
Ken Mixterccd84c02010-08-16 19:57:13 -070055 FRIEND_TEST(MetricsDaemonTest, ReportDailyUse);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080056 FRIEND_TEST(MetricsDaemonTest, ReportDiskStats);
Ken Mixterccd84c02010-08-16 19:57:13 -070057 FRIEND_TEST(MetricsDaemonTest, ReportKernelCrashInterval);
58 FRIEND_TEST(MetricsDaemonTest, ReportUncleanShutdownInterval);
59 FRIEND_TEST(MetricsDaemonTest, ReportUserCrashInterval);
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -080060 FRIEND_TEST(MetricsDaemonTest, SendSample);
Luigi Semenzatofb3a8212013-05-07 16:55:00 -070061 FRIEND_TEST(MetricsDaemonTest, SendCpuThrottleMetrics);
Darin Petkov41e06232010-05-03 16:45:37 -070062
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080063 // State for disk stats collector callback.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -070064 enum StatsState {
65 kStatsShort, // short wait before short interval collection
66 kStatsLong, // final wait before new collection
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -080067 };
68
Darin Petkov41e06232010-05-03 16:45:37 -070069 // Data record for aggregating daily usage.
70 class UseRecord {
71 public:
72 UseRecord() : day_(0), seconds_(0) {}
73 int day_;
74 int seconds_;
75 };
76
Luigi Semenzato3ccca062013-02-04 19:50:45 -080077 // Type of scale to use for meminfo histograms. For most of them we use
78 // percent of total RAM, but for some we use absolute numbers, usually in
79 // megabytes, on a log scale from 0 to 4000, and 0 to 8000 for compressed
80 // swap (since it can be larger than total RAM).
Luigi Semenzato942cbab2013-02-12 13:17:07 -080081 enum MeminfoOp {
82 kMeminfoOp_HistPercent = 0,
83 kMeminfoOp_HistLog,
84 kMeminfoOp_SwapTotal,
85 kMeminfoOp_SwapFree,
Luigi Semenzato3ccca062013-02-04 19:50:45 -080086 };
87
Luigi Semenzato8accd332011-05-17 16:37:18 -070088 // Record for retrieving and reporting values from /proc/meminfo.
89 struct MeminfoRecord {
Luigi Semenzato3ccca062013-02-04 19:50:45 -080090 const char* name; // print name
91 const char* match; // string to match in output of /proc/meminfo
Luigi Semenzato942cbab2013-02-12 13:17:07 -080092 MeminfoOp op; // histogram scale selector, or other operator
Luigi Semenzato3ccca062013-02-04 19:50:45 -080093 int value; // value from /proc/meminfo
Luigi Semenzato8accd332011-05-17 16:37:18 -070094 };
95
Sonny Rao4b8aebb2013-07-31 23:18:31 -070096 // Record for retrieving and reporting values from /proc/vmstat
97 struct VmstatRecord {
98 uint64_t page_faults_; // major faults
99 uint64_t swap_in_; // pages swapped in
100 uint64_t swap_out_; // pages swapped out
101 };
102
Darin Petkov2ccef012010-05-05 16:06:37 -0700103 // Metric parameters.
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800104 static const char kMetricReadSectorsLongName[];
105 static const char kMetricReadSectorsShortName[];
106 static const char kMetricWriteSectorsLongName[];
107 static const char kMetricWriteSectorsShortName[];
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700108 static const char kMetricPageFaultsShortName[];
109 static const char kMetricPageFaultsLongName[];
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700110 static const char kMetricSwapInLongName[];
111 static const char kMetricSwapInShortName[];
112 static const char kMetricSwapOutLongName[];
113 static const char kMetricSwapOutShortName[];
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700114 static const char kMetricScaledCpuFrequencyName[];
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700115 static const int kMetricStatsShortInterval;
116 static const int kMetricStatsLongInterval;
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700117 static const int kMetricMeminfoInterval;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800118 static const int kMetricSectorsIOMax;
119 static const int kMetricSectorsBuckets;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700120 static const int kMetricPageFaultsMax;
121 static const int kMetricPageFaultsBuckets;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800122 static const char kMetricsDiskStatsPath[];
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700123 static const char kMetricsVmStatsPath[];
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700124 static const char kMetricsProcStatFileName[];
125 static const int kMetricsProcStatFirstLineItemsCount;
Darin Petkov2ccef012010-05-05 16:06:37 -0700126
Luigi Semenzato8accd332011-05-17 16:37:18 -0700127 // Returns the active time since boot (uptime minus sleep time) in seconds.
128 double GetActiveTime();
129
Darin Petkov65b01462010-04-14 13:32:20 -0700130 // Creates the event loop and enters it.
131 void Loop();
132
Darin Petkov703ec972010-04-27 11:02:18 -0700133 // D-Bus filter callback.
134 static DBusHandlerResult MessageFilter(DBusConnection* connection,
135 DBusMessage* message,
136 void* user_data);
Darin Petkov65b01462010-04-14 13:32:20 -0700137
Darin Petkov41e06232010-05-03 16:45:37 -0700138 // Updates the daily usage file, if necessary, by adding |seconds|
139 // of active use to the |day| since Epoch. If there's usage data for
140 // day in the past in the usage file, that data is sent to UMA and
141 // removed from the file. If there's already usage data for |day| in
142 // the usage file, the |seconds| are accumulated.
143 void LogDailyUseRecord(int day, int seconds);
144
Darin Petkov1bb904e2010-06-16 15:58:06 -0700145 // Updates the active use time and logs time between user-space
146 // process crashes.
147 void ProcessUserCrash();
148
Darin Petkov38d5cb02010-06-24 12:10:26 -0700149 // Updates the active use time and logs time between kernel crashes.
150 void ProcessKernelCrash();
151
Ken Mixterccd84c02010-08-16 19:57:13 -0700152 // Updates the active use time and logs time between unclean shutdowns.
153 void ProcessUncleanShutdown();
154
155 // Checks if a kernel crash has been detected and returns true if
156 // so. The method assumes that a kernel crash has happened if
157 // |crash_file| exists. It removes the file immediately if it
158 // exists, so it must not be called more than once.
159 bool CheckSystemCrash(const std::string& crash_file);
Darin Petkov38d5cb02010-06-24 12:10:26 -0700160
Ken Mixter4c5daa42010-08-26 18:35:06 -0700161 // Report daily use through UMA.
Luigi Semenzato5ef2e392014-04-15 15:15:02 -0700162 void ReportDailyUse(int use_seconds);
Ken Mixter4c5daa42010-08-26 18:35:06 -0700163
Darin Petkov11b8eb32010-05-18 11:00:59 -0700164 // Sends a regular (exponential) histogram sample to Chrome for
165 // transport to UMA. See MetricsLibrary::SendToUMA in
166 // metrics_library.h for a description of the arguments.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800167 void SendSample(const std::string& name, int sample,
Darin Petkov11b8eb32010-05-18 11:00:59 -0700168 int min, int max, int nbuckets);
Darin Petkov65b01462010-04-14 13:32:20 -0700169
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700170 // Sends a linear histogram sample to Chrome for transport to UMA. See
171 // MetricsLibrary::SendToUMA in metrics_library.h for a description of the
172 // arguments.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800173 void SendLinearSample(const std::string& name, int sample,
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700174 int max, int nbuckets);
175
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700176 // Sends various cumulative kernel crash-related stats, for instance the
177 // total number of kernel crashes since the last version update.
178 void SendKernelCrashesCumulativeCountStats(int64 active_time_seconds);
179
180 // Returns the total (system-wide) CPU usage between the time of the most
181 // recent call to this function and now.
182 base::TimeDelta GetIncrementalCpuUse();
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800183
184 // Sends a sample representing a time interval between two crashes of the
185 // same type.
186 void SendCrashIntervalSample(const scoped_ptr<PersistentInteger>& interval);
187
188 // Sends a sample representing a frequency of crashes of some type.
189 void SendCrashFrequencySample(const scoped_ptr<PersistentInteger>& frequency);
190
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700191 // Initializes vm and disk stats reporting.
192 void StatsReporterInit();
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800193
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700194 // Schedules a callback for the next vm and disk stats collection.
195 void ScheduleStatsCallback(int wait);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800196
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700197 // Reads cumulative disk statistics from sysfs. Returns true for success.
198 bool DiskStatsReadStats(long int* read_sectors, long int* write_sectors);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800199
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700200 // Reads cumulative vm statistics from procfs. Returns true for success.
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700201 bool VmStatsReadStats(struct VmstatRecord* stats);
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800202
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700203 // Parse cumulative vm statistics from a C string. Returns true for success.
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700204 bool VmStatsParseStats(const char* stats, struct VmstatRecord* record);
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700205
206 // Reports disk and vm statistics (static version for glib). Arguments are a
207 // glib artifact.
208 static gboolean StatsCallbackStatic(void* handle);
209
210 // Reports disk and vm statistics.
211 void StatsCallback();
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800212
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700213 // Schedules meminfo collection callback.
214 void ScheduleMeminfoCallback(int wait);
215
216 // Reports memory statistics (static version for glib). Argument is a glib
217 // artifact.
218 static gboolean MeminfoCallbackStatic(void* handle);
219
220 // Reports memory statistics. Returns false on failure.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700221 bool MeminfoCallback();
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700222
223 // Parses content of /proc/meminfo and sends fields of interest to UMA.
Luigi Semenzato8accd332011-05-17 16:37:18 -0700224 // Returns false on errors. |meminfo_raw| contains the content of
225 // /proc/meminfo.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700226 bool ProcessMeminfo(const std::string& meminfo_raw);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700227
228 // Parses meminfo data from |meminfo_raw|. |fields| is a vector containing
229 // the fields of interest. The order of the fields must be the same in which
230 // /proc/meminfo prints them. The result of parsing fields[i] is placed in
231 // fields[i].value.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700232 bool FillMeminfo(const std::string& meminfo_raw,
233 std::vector<MeminfoRecord>* fields);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700234
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800235 // Schedule a memory use callback in |interval| seconds.
236 void ScheduleMemuseCallback(double interval);
Luigi Semenzato8accd332011-05-17 16:37:18 -0700237
238 // Static wrapper for MemuseCallback. Always returns false.
239 static gboolean MemuseCallbackStatic(void* handle);
240
241 // Calls MemuseCallbackWork, and possibly schedules next callback, if enough
242 // active time has passed. Otherwise reschedules itself to simulate active
243 // time callbacks (i.e. wall clock time minus sleep time).
244 void MemuseCallback();
245
246 // Reads /proc/meminfo and sends total anonymous memory usage to UMA.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700247 bool MemuseCallbackWork();
Luigi Semenzato8accd332011-05-17 16:37:18 -0700248
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700249 // Parses meminfo data and sends it to UMA.
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700250 bool ProcessMemuse(const std::string& meminfo_raw);
Luigi Semenzato29c7ef92011-04-12 14:12:35 -0700251
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700252 // Sends stats for thermal CPU throttling.
253 void SendCpuThrottleMetrics();
254
255 // Reads an integer CPU frequency value from sysfs.
256 bool ReadFreqToInt(const std::string& sysfs_file_name, int* value);
257
Luigi Semenzato859b3f02014-02-05 15:33:19 -0800258 // Reads the current OS version from /etc/lsb-release and hashes it
259 // to a unsigned 32-bit int.
260 uint32 GetOsVersionHash();
261
Daniel Eratc83975a2014-04-04 08:53:44 -0700262 // Updates stats, additionally sending them to UMA if enough time has elapsed
263 // since the last report.
264 void UpdateStats(base::TimeTicks now_ticks, base::Time now_wall_time);
265
266 // Invoked periodically by |update_stats_timeout_id_| to call UpdateStats().
267 static gboolean HandleUpdateStatsTimeout(gpointer data);
268
Darin Petkov2ccef012010-05-05 16:06:37 -0700269 // Test mode.
Darin Petkov41e06232010-05-03 16:45:37 -0700270 bool testing_;
Darin Petkov65b01462010-04-14 13:32:20 -0700271
Darin Petkovfc91b422010-05-12 13:05:45 -0700272 // The metrics library handle.
273 MetricsLibraryInterface* metrics_lib_;
274
Darin Petkovf27f0362010-06-04 13:14:19 -0700275 // Timestamps last network state update. This timestamp is used to
276 // sample the time from the network going online to going offline so
277 // TimeTicks ensures a monotonically increasing TimeDelta.
278 base::TimeTicks network_state_last_;
Darin Petkov65b01462010-04-14 13:32:20 -0700279
Daniel Eratc83975a2014-04-04 08:53:44 -0700280 // The last time that UpdateStats() was called.
281 base::TimeTicks last_update_stats_time_;
Darin Petkov41e06232010-05-03 16:45:37 -0700282
Daniel Eratc83975a2014-04-04 08:53:44 -0700283 // ID of a GLib timeout that repeatedly runs UpdateStats().
284 gint update_stats_timeout_id_;
Darin Petkov41e06232010-05-03 16:45:37 -0700285
Darin Petkov41e06232010-05-03 16:45:37 -0700286 // Sleep period until the next daily usage aggregation performed by
287 // the daily use monitor (see ScheduleUseMonitor).
288 int usemon_interval_;
289
290 // Scheduled daily use monitor source (see ScheduleUseMonitor).
291 GSource* usemon_source_;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800292
Luigi Semenzato0d9a9c92013-12-05 15:55:12 -0800293 // End time of current memuse stat collection interval.
294 double memuse_final_time_;
Luigi Semenzato8accd332011-05-17 16:37:18 -0700295
296 // Selects the wait time for the next memory use callback.
297 unsigned int memuse_interval_index_;
298
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700299 // Contain the most recent disk and vm cumulative stats.
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800300 long int read_sectors_;
301 long int write_sectors_;
Sonny Rao4b8aebb2013-07-31 23:18:31 -0700302 struct VmstatRecord vmstats_;
Luigi Semenzatoc88e42d2011-02-17 10:21:16 -0800303
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700304 StatsState stats_state_;
305 double stats_initial_time_;
306
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700307 // The system "HZ", or frequency of ticks. Some system data uses ticks as a
308 // unit, and this is used to convert to standard time units.
309 uint32 ticks_per_second_;
310 // Used internally by GetIncrementalCpuUse() to return the CPU utilization
311 // between calls.
312 uint64 latest_cpu_use_ticks_;
313
314 // Persistent values and accumulators for crash statistics.
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800315 scoped_ptr<PersistentInteger> daily_cycle_;
316 scoped_ptr<PersistentInteger> weekly_cycle_;
317 scoped_ptr<PersistentInteger> version_cycle_;
318
319 scoped_ptr<PersistentInteger> daily_use_;
320
Luigi Semenzatoba0c65d2014-03-17 12:28:38 -0700321 // The CPU time accumulator. This contains the CPU time, in milliseconds,
322 // used by the system since the most recent OS version update.
323 scoped_ptr<PersistentInteger> version_cumulative_cpu_use_;
324
Luigi Semenzato2fd51cc2014-02-26 11:53:16 -0800325 scoped_ptr<PersistentInteger> user_crash_interval_;
326 scoped_ptr<PersistentInteger> kernel_crash_interval_;
327 scoped_ptr<PersistentInteger> unclean_shutdown_interval_;
328
329 scoped_ptr<PersistentInteger> any_crashes_daily_count_;
330 scoped_ptr<PersistentInteger> any_crashes_weekly_count_;
331 scoped_ptr<PersistentInteger> user_crashes_daily_count_;
332 scoped_ptr<PersistentInteger> user_crashes_weekly_count_;
333 scoped_ptr<PersistentInteger> kernel_crashes_daily_count_;
334 scoped_ptr<PersistentInteger> kernel_crashes_weekly_count_;
335 scoped_ptr<PersistentInteger> kernel_crashes_version_count_;
336 scoped_ptr<PersistentInteger> unclean_shutdowns_daily_count_;
337 scoped_ptr<PersistentInteger> unclean_shutdowns_weekly_count_;
338
Luigi Semenzato0f132bb2011-02-28 11:17:43 -0800339 std::string diskstats_path_;
Luigi Semenzato5bd764f2011-10-14 12:03:35 -0700340 std::string vmstats_path_;
Luigi Semenzatofb3a8212013-05-07 16:55:00 -0700341 std::string scaling_max_freq_path_;
342 std::string cpuinfo_max_freq_path_;
Darin Petkov65b01462010-04-14 13:32:20 -0700343};

#endif  // METRICS_DAEMON_H_