blob: 8db9121c8210107e01313c1d676af59a902cdcaf [file] [log] [blame]
James Hawkinsabd73e62016-01-19 15:10:38 -08001/*
2 * Copyright (C) 2016 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17// The bootstat command provides options to persist boot events with the current
18// timestamp, dump the persisted events, and log all events to EventLog to be
19// uploaded to Android log storage via Tron.
20
James Hawkinsa4a1a4a2016-02-09 15:32:38 -080021#include <getopt.h>
Mark Salyzynb304f6d2017-08-04 13:35:51 -070022#include <sys/klog.h>
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -070023#include <unistd.h>
Mark Salyzynff2dcd92016-09-28 15:54:45 -070024
James Hawkinse78ea772017-03-24 11:43:02 -070025#include <chrono>
James Hawkins0660b302016-03-08 16:18:15 -080026#include <cmath>
James Hawkinsabd73e62016-01-19 15:10:38 -080027#include <cstddef>
28#include <cstdio>
James Hawkins500d7152016-02-16 15:05:54 -080029#include <ctime>
James Hawkinsa4a1a4a2016-02-09 15:32:38 -080030#include <map>
James Hawkinsabd73e62016-01-19 15:10:38 -080031#include <memory>
32#include <string>
James Hawkinsbe46fd12017-02-02 16:21:25 -080033#include <vector>
Mark Salyzynff2dcd92016-09-28 15:54:45 -070034
James Hawkinse78ea772017-03-24 11:43:02 -070035#include <android-base/chrono_utils.h>
Mark Salyzynb304f6d2017-08-04 13:35:51 -070036#include <android-base/file.h>
James Hawkinseabe08b2016-01-19 16:54:35 -080037#include <android-base/logging.h>
James Hawkins4dded612016-07-28 11:50:23 -070038#include <android-base/parseint.h>
James Hawkinsbe46fd12017-02-02 16:21:25 -080039#include <android-base/strings.h>
James Hawkinse78ea772017-03-24 11:43:02 -070040#include <android/log.h>
Mark Salyzynb304f6d2017-08-04 13:35:51 -070041#include <cutils/android_reboot.h>
James Hawkinsa4a1a4a2016-02-09 15:32:38 -080042#include <cutils/properties.h>
Mark Salyzynb304f6d2017-08-04 13:35:51 -070043#include <log/logcat.h>
James Hawkins9aec9262017-01-31 11:42:24 -080044#include <metricslogger/metrics_logger.h>
Mark Salyzynff2dcd92016-09-28 15:54:45 -070045
James Hawkinsabd73e62016-01-19 15:10:38 -080046#include "boot_event_record_store.h"
James Hawkinsabd73e62016-01-19 15:10:38 -080047
48namespace {
49
James Hawkinsabd73e62016-01-19 15:10:38 -080050// Scans the boot event record store for record files and logs each boot event
51// via EventLog.
52void LogBootEvents() {
53 BootEventRecordStore boot_event_store;
54
55 auto events = boot_event_store.GetAllBootEvents();
56 for (auto i = events.cbegin(); i != events.cend(); ++i) {
James Hawkins9aec9262017-01-31 11:42:24 -080057 android::metricslogger::LogHistogram(i->first, i->second);
James Hawkinsabd73e62016-01-19 15:10:38 -080058 }
59}
60
James Hawkinsc6275582016-03-22 10:47:44 -070061// Records the named boot |event| to the record store. If |value| is non-empty
62// and is a proper string representation of an integer value, the converted
63// integer value is associated with the boot event.
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -070064void RecordBootEventFromCommandLine(const std::string& event, const std::string& value_str) {
James Hawkinsc6275582016-03-22 10:47:44 -070065 BootEventRecordStore boot_event_store;
66 if (!value_str.empty()) {
67 int32_t value = 0;
Elliott Hughesda46b392016-10-11 17:09:00 -070068 if (android::base::ParseInt(value_str, &value)) {
James Hawkins4dded612016-07-28 11:50:23 -070069 boot_event_store.AddBootEventWithValue(event, value);
70 }
James Hawkinsc6275582016-03-22 10:47:44 -070071 } else {
72 boot_event_store.AddBootEvent(event);
73 }
74}
75
James Hawkinsabd73e62016-01-19 15:10:38 -080076void PrintBootEvents() {
77 printf("Boot events:\n");
78 printf("------------\n");
79
80 BootEventRecordStore boot_event_store;
81 auto events = boot_event_store.GetAllBootEvents();
82 for (auto i = events.cbegin(); i != events.cend(); ++i) {
83 printf("%s\t%d\n", i->first.c_str(), i->second);
84 }
85}
86
// Writes the usage banner for the program invoked as |cmd|, followed by the
// list of supported options, to stderr.
void ShowHelp(const char* cmd) {
    // Contains no conversion specifiers, so it can be emitted verbatim.
    static const char kOptionsHelp[] =
        "options include:\n"
        " -h, --help Show this help\n"
        " -l, --log Log all metrics to logstorage\n"
        " -p, --print Dump the boot event records to the console\n"
        " -r, --record Record the timestamp of a named boot event\n"
        " --value Optional value to associate with the boot event\n"
        " --record_boot_complete Record metrics related to the time for the device boot\n"
        " --record_boot_reason Record the reason why the device booted\n"
        " --record_time_since_factory_reset Record the time since the device was reset\n";

    fprintf(stderr, "Usage: %s [options]\n", cmd);
    fputs(kOptionsHelp, stderr);
}
100
// Constructs a readable, printable string from the given command line
// arguments: the first |argc| entries of |argv| are appended in order and each
// one, including the last, is followed by a single space.
std::string GetCommandLine(int argc, char** argv) {
    std::string line;
    int index = 0;
    while (index < argc) {
        line.append(argv[index++]);
        line.push_back(' ');
    }
    return line;
}
112
James Hawkinsa4a1a4a2016-02-09 15:32:38 -0800113// Convenience wrapper over the property API that returns an
114// std::string.
115std::string GetProperty(const char* key) {
116 std::vector<char> temp(PROPERTY_VALUE_MAX);
117 const int len = property_get(key, &temp[0], nullptr);
118 if (len < 0) {
119 return "";
120 }
121 return std::string(&temp[0], len);
122}
123
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700124void SetProperty(const char* key, const std::string& val) {
125 property_set(key, val.c_str());
126}
127
128void SetProperty(const char* key, const char* val) {
129 property_set(key, val);
130}
131
// ID reported when the boot reason string is empty.
constexpr int32_t kEmptyBootReason = 0;
// ID reported when the boot reason string is not present in kBootReasonMap.
constexpr int32_t kUnknownBootReason = 1;

// A mapping from boot reason string, as read from the ro.boot.bootreason
// system property, to a unique integer ID. Viewers of log data dashboards for
// the boot_reason metric may refer to this mapping to discern the histogram
// values.
//
// Keys must be unique: when an initializer list repeats a key, std::map keeps
// only the first entry, so the ID on a repeated key can never be reported.
// IDs 59 and 90 used to sit on second copies of "recovery" and "usb"; those
// dead entries are removed and the two IDs are left unassigned.
const std::map<std::string, int32_t> kBootReasonMap = {
    {"empty", kEmptyBootReason},
    {"unknown", kUnknownBootReason},
    {"normal", 2},
    {"recovery", 3},
    {"reboot", 4},
    {"PowerKey", 5},
    {"hard_reset", 6},
    {"kernel_panic", 7},
    {"rpm_err", 8},
    {"hw_reset", 9},
    {"tz_err", 10},
    {"adsp_err", 11},
    {"modem_err", 12},
    {"mba_err", 13},
    {"Watchdog", 14},
    {"Panic", 15},
    {"power_key", 16},
    {"power_on", 17},
    {"Reboot", 18},
    {"rtc", 19},
    {"edl", 20},
    {"oem_pon1", 21},
    {"oem_powerkey", 22},
    {"oem_unknown_reset", 23},
    {"srto: HWWDT reset SC", 24},
    {"srto: HWWDT reset platform", 25},
    {"srto: bootloader", 26},
    {"srto: kernel panic", 27},
    {"srto: kernel watchdog reset", 28},
    {"srto: normal", 29},
    {"srto: reboot", 30},
    {"srto: reboot-bootloader", 31},
    {"srto: security watchdog reset", 32},
    {"srto: wakesrc", 33},
    {"srto: watchdog", 34},
    {"srto:1-1", 35},
    {"srto:omap_hsmm", 36},
    {"srto:phy0", 37},
    {"srto:rtc0", 38},
    {"srto:touchpad", 39},
    {"watchdog", 40},
    {"watchdogr", 41},
    {"wdog_bark", 42},
    {"wdog_bite", 43},
    {"wdog_reset", 44},
    {"shutdown,", 45},  // Trailing comma is intentional.
    {"shutdown,userrequested", 46},
    {"reboot,bootloader", 47},
    {"reboot,cold", 48},
    {"reboot,recovery", 49},
    {"thermal_shutdown", 50},
    {"s3_wakeup", 51},
    {"kernel_panic,sysrq", 52},
    {"kernel_panic,NULL", 53},
    {"kernel_panic,BUG", 54},
    {"bootloader", 55},
    {"cold", 56},
    {"hard", 57},
    {"warm", 58},
    // 59 is unassigned (was a duplicate "recovery" key; "recovery" maps to 3).
    {"thermal-shutdown", 60},
    {"shutdown,thermal", 61},
    {"shutdown,battery", 62},
    {"reboot,ota", 63},
    {"reboot,factory_reset", 64},
    {"reboot,", 65},
    {"reboot,shell", 66},
    {"reboot,adb", 67},
    {"reboot,userrequested", 68},
    {"shutdown,container", 69},  // Host OS asking Android Container to shutdown
    {"cold,powerkey", 70},
    {"warm,s3_wakeup", 71},
    {"hard,hw_reset", 72},
    {"shutdown,suspend", 73},    // Suspend to RAM
    {"shutdown,hibernate", 74},  // Suspend to DISK
    {"power_on_key", 75},
    {"reboot_by_key", 76},
    {"wdt_by_pass_pwk", 77},
    {"reboot_longkey", 78},
    {"powerkey", 79},
    {"usb", 80},
    {"wdt", 81},
    {"tool_by_pass_pwk", 82},
    {"2sec_reboot", 83},
    {"reboot,by_key", 84},
    {"reboot,longkey", 85},
    {"reboot,2sec", 86},
    {"shutdown,thermal,battery", 87},
    {"reboot,its_just_so_hard", 88},  // produced by boot_reason_test
    {"reboot,Its Just So Hard", 89},  // produced by boot_reason_test
    // 90 is unassigned (was a duplicate "usb" key; "usb" maps to 80).
    {"charge", 91},
    {"oem_tz_crash", 92},
    {"uvlo", 93},
    {"oem_ps_hold", 94},
    {"abnormal_reset", 95},
    {"oemerr_unknown", 96},
    {"reboot_fastboot_mode", 97},
    {"watchdog_apps_bite", 98},
    {"xpu_err", 99},
    {"power_on_usb", 100},
    {"watchdog_rpm", 101},
    {"watchdog_nonsec", 102},
    {"watchdog_apps_bark", 103},
    {"reboot_dmverity_corrupted", 104},
    {"reboot_smpl", 105},
    {"watchdog_sdi_apps_reset", 106},
    {"smpl", 107},
    {"oem_modem_failed_to_powerup", 108},
};
250
251// Converts a string value representing the reason the system booted to an
252// integer representation. This is necessary for logging the boot_reason metric
253// via Tron, which does not accept non-integer buckets in histograms.
254int32_t BootReasonStrToEnum(const std::string& boot_reason) {
James Hawkinsa4a1a4a2016-02-09 15:32:38 -0800255 auto mapping = kBootReasonMap.find(boot_reason);
256 if (mapping != kBootReasonMap.end()) {
257 return mapping->second;
258 }
259
James Hawkins25f71222017-10-10 16:37:05 -0700260 if (boot_reason.empty()) {
261 return kEmptyBootReason;
262 }
263
James Hawkinsa4a1a4a2016-02-09 15:32:38 -0800264 LOG(INFO) << "Unknown boot reason: " << boot_reason;
265 return kUnknownBootReason;
266}
267
// Canonical list of supported primary reboot reasons.
//
// The order is load-bearing: isKernelRebootReason() stops scanning at
// "recovery" and isStrongRebootReason() stops at "cold", so entries must stay
// grouped as kernel, strong, blunt, super blunt.
//
// The element type is deliberately a plain std::string. A const element type
// is not a valid value_type for the standard allocator, and the const on the
// vector itself already makes every element read-only.
const std::vector<std::string> knownReasons = {
    // clang-format off
    // kernel
    "watchdog",
    "kernel_panic",
    // strong
    "recovery",    // Should not happen from ro.boot.bootreason
    "bootloader",  // Should not happen from ro.boot.bootreason
    // blunt
    "cold",
    "hard",
    "warm",
    // super blunt
    "shutdown",    // Can not happen from ro.boot.bootreason
    "reboot",      // Default catch-all for anything unknown
    // clang-format on
};
286
287// Returns true if the supplied reason prefix is considered detailed enough.
288bool isStrongRebootReason(const std::string& r) {
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700289 for (auto& s : knownReasons) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700290 if (s == "cold") break;
291 // Prefix defined as terminated by a nul or comma (,).
292 if (android::base::StartsWith(r, s.c_str()) &&
293 ((r.length() == s.length()) || (r[s.length()] == ','))) {
294 return true;
295 }
296 }
297 return false;
298}
299
300// Returns true if the supplied reason prefix is associated with the kernel.
301bool isKernelRebootReason(const std::string& r) {
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700302 for (auto& s : knownReasons) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700303 if (s == "recovery") break;
304 // Prefix defined as terminated by a nul or comma (,).
305 if (android::base::StartsWith(r, s.c_str()) &&
306 ((r.length() == s.length()) || (r[s.length()] == ','))) {
307 return true;
308 }
309 }
310 return false;
311}
312
313// Returns true if the supplied reason prefix is considered known.
314bool isKnownRebootReason(const std::string& r) {
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700315 for (auto& s : knownReasons) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700316 // Prefix defined as terminated by a nul or comma (,).
317 if (android::base::StartsWith(r, s.c_str()) &&
318 ((r.length() == s.length()) || (r[s.length()] == ','))) {
319 return true;
320 }
321 }
322 return false;
323}
324
325// If the reboot reason should be improved, report true if is too blunt.
326bool isBluntRebootReason(const std::string& r) {
327 if (isStrongRebootReason(r)) return false;
328
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700329 if (!isKnownRebootReason(r)) return true; // Can not support unknown as detail
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700330
331 size_t pos = 0;
332 while ((pos = r.find(',', pos)) != std::string::npos) {
333 ++pos;
334 std::string next(r.substr(pos));
335 if (next.length() == 0) break;
336 if (next[0] == ',') continue;
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700337 if (!isKnownRebootReason(next)) return false; // Unknown subreason is good.
338 if (isStrongRebootReason(next)) return false; // eg: reboot,reboot
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700339 }
340 return true;
341}
342
Mark Salyzyn64610892017-09-18 10:41:14 -0700343bool readPstoreConsole(std::string& console) {
344 if (android::base::ReadFileToString("/sys/fs/pstore/console-ramoops-0", &console)) {
345 return true;
346 }
347 return android::base::ReadFileToString("/sys/fs/pstore/console-ramoops", &console);
348}
349
// Implement a variant of std::string::find and std::string::rfind that is
// resilient to bit errors in the data stream being inspected.
//
// The object only borrows the string it searches; the referenced std::string
// must outlive the pstoreConsole, which is why construction from temporaries
// is deleted.
class pstoreConsole {
  private:
    static constexpr size_t kBitErrorRate = 8;  // number of bits per error
    const std::string& console;

    // Number of bits that differ between the two arguments l and r.
    // Returns zero if the values for l and r are identical.
    static size_t numError(uint8_t l, uint8_t r) { return std::bitset<8>(l ^ r).count(); }

    // A string comparison function, reports the number of bit errors found
    // when matching _r against the console at offset pos, or npos once the
    // match is too poor (more than roughly one bit in kBitErrorRate wrong,
    // either within a single character or accumulated over the match).
    //
    // Since called in rfind which works backwards, expect cache locality will
    // help if we check in reverse here as well for performance.
    //
    // An empty _r trivially matches with zero errors; without that guard the
    // reverse walk below would start by reading in front of both buffers. A
    // window that does not fit inside the console is reported as npos rather
    // than being read.
    size_t numError(size_t pos, const std::string& _r) const {
        size_t n = _r.length();
        if (n == 0) return 0;
        if ((pos > console.length()) || (n > (console.length() - pos))) return std::string::npos;

        const uint8_t* const l = reinterpret_cast<const uint8_t*>(console.c_str()) + pos;
        const uint8_t* le = l + n;
        const uint8_t* re = reinterpret_cast<const uint8_t*>(_r.c_str()) + n;
        size_t count = 0;
        n = 0;  // from here on: number of characters compared so far
        do {
            // individual character bit error rate > threshold + slop
            const size_t num = numError(*--le, *--re);
            if (num > ((8 + kBitErrorRate) / kBitErrorRate)) return std::string::npos;
            // total bit error rate > threshold + slop
            count += num;
            ++n;
            if (count > ((n * 8 + kBitErrorRate - (n > 2)) / kBitErrorRate)) {
                return std::string::npos;
            }
        } while (le != l);
        return count;
    }

  public:
    explicit pstoreConsole(const std::string& console) : console(console) {}
    // scope of argument must be equal to or greater than scope of pstoreConsole
    explicit pstoreConsole(const std::string&& console) = delete;
    explicit pstoreConsole(std::string&& console) = delete;

    // Our implementation of rfind, use exact match first, then resort to fuzzy.
    // Returns the offset of the match, or std::string::npos if there is none.
    size_t rfind(const std::string& needle) const {
        size_t pos = console.rfind(needle);  // exact match?
        if (pos != std::string::npos) return pos;

        // Check to make sure needle fits in console string.
        pos = console.length();
        if (needle.length() > pos) return std::string::npos;
        pos -= needle.length();
        // fuzzy match to maximum kBitErrorRate
        for (;;) {
            if (numError(pos, needle) != std::string::npos) return pos;
            if (pos == 0) break;
            --pos;
        }
        return std::string::npos;
    }

    // Our implementation of find, use only fuzzy match. Scans forward from
    // |start| and returns the offset of the first acceptable match, or
    // std::string::npos if there is none.
    size_t find(const std::string& needle, size_t start = 0) const {
        // Check to make sure needle fits in console string.
        if (needle.length() > console.length()) return std::string::npos;
        const size_t last_pos = console.length() - needle.length();
        // fuzzy match to maximum kBitErrorRate
        for (size_t pos = start; pos <= last_pos; ++pos) {
            if (numError(pos, needle) != std::string::npos) return pos;
        }
        return std::string::npos;
    }
};
429
430// If bit error match to needle, correct it.
431// Return true if any corrections were discovered and applied.
432bool correctForBer(std::string& reason, const std::string& needle) {
433 bool corrected = false;
434 if (reason.length() < needle.length()) return corrected;
435 const pstoreConsole console(reason);
436 const size_t last_pos = reason.length() - needle.length();
437 for (size_t pos = 0; pos <= last_pos; pos += needle.length()) {
438 pos = console.find(needle, pos);
439 if (pos == std::string::npos) break;
440
441 // exact match has no malice
442 if (needle == reason.substr(pos, needle.length())) continue;
443
444 corrected = true;
445 reason = reason.substr(0, pos) + needle + reason.substr(pos + needle.length());
446 }
447 return corrected;
448}
449
450bool addKernelPanicSubReason(const pstoreConsole& console, std::string& ret) {
Mark Salyzyn64610892017-09-18 10:41:14 -0700451 // Check for kernel panic types to refine information
452 if (console.rfind("SysRq : Trigger a crash") != std::string::npos) {
453 // Can not happen, except on userdebug, during testing/debugging.
454 ret = "kernel_panic,sysrq";
455 return true;
456 }
457 if (console.rfind("Unable to handle kernel NULL pointer dereference at virtual address") !=
458 std::string::npos) {
459 ret = "kernel_panic,NULL";
460 return true;
461 }
462 if (console.rfind("Kernel BUG at ") != std::string::npos) {
463 ret = "kernel_panic,BUG";
464 return true;
465 }
466 return false;
467}
468
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700469bool addKernelPanicSubReason(const std::string& content, std::string& ret) {
470 return addKernelPanicSubReason(pstoreConsole(content), ret);
471}
472
// std::transform Helper callback functions:
// Converts a string value representing the reason the system booted to a
// string complying with Android system standard reason.
//
// The <cctype> classification and conversion functions have undefined
// behavior when handed a negative value other than EOF, which is what a plain
// char with the high bit set turns into on platforms where char is signed.
// Every character is therefore passed through unsigned char first.

// Maps a blank character (as classified by isblank) to an underscore; any
// other character is returned unchanged.
char tounderline(char c) {
    return ::isblank(static_cast<unsigned char>(c)) ? '_' : c;
}

// Maps a character that is not printable (as classified by isprint) to a
// question mark; printable characters are returned unchanged.
char toprintable(char c) {
    return ::isprint(static_cast<unsigned char>(c)) ? c : '?';
}

// Cleanup boot_reason regarding acceptable character set: each character of
// |reason| is, in this order, lower-cased, turned into '_' if blank and turned
// into '?' if not printable. The string is modified in place.
void transformReason(std::string& reason) {
    std::transform(reason.begin(), reason.end(), reason.begin(), [](char c) {
        const char lowered = static_cast<char>(::tolower(static_cast<unsigned char>(c)));
        return toprintable(tounderline(lowered));
    });
}
490
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700491const char system_reboot_reason_property[] = "sys.boot.reason";
492const char last_reboot_reason_property[] = LAST_REBOOT_REASON_PROPERTY;
493const char bootloader_reboot_reason_property[] = "ro.boot.bootreason";
494
495// Scrub, Sanitize, Standardize and Enhance the boot reason string supplied.
496std::string BootReasonStrToReason(const std::string& boot_reason) {
Mark Salyzyna16e4372017-09-20 08:36:12 -0700497 static const size_t max_reason_length = 256;
498
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700499 std::string ret(GetProperty(system_reboot_reason_property));
500 std::string reason(boot_reason);
501 // If sys.boot.reason == ro.boot.bootreason, let's re-evaluate
502 if (reason == ret) ret = "";
503
Mark Salyzyn88d692c2017-09-20 08:37:46 -0700504 transformReason(reason);
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700505
506 // Is the current system boot reason sys.boot.reason valid?
507 if (!isKnownRebootReason(ret)) ret = "";
508
509 if (ret == "") {
510 // Is the bootloader boot reason ro.boot.bootreason known?
511 std::vector<std::string> words(android::base::Split(reason, ",_-"));
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700512 for (auto& s : knownReasons) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700513 std::string blunt;
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700514 for (auto& r : words) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700515 if (r == s) {
516 if (isBluntRebootReason(s)) {
517 blunt = s;
518 } else {
519 ret = s;
520 break;
521 }
522 }
523 }
524 if (ret == "") ret = blunt;
525 if (ret != "") break;
526 }
527 }
528
529 if (ret == "") {
530 // A series of checks to take some officially unsupported reasons
531 // reported by the bootloader and find some logical and canonical
532 // sense. In an ideal world, we would require those bootloaders
533 // to behave and follow our standards.
534 static const std::vector<std::pair<const std::string, const std::string>> aliasReasons = {
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700535 {"watchdog", "wdog"},
536 {"cold,powerkey", "powerkey"},
537 {"kernel_panic", "panic"},
538 {"shutdown,thermal", "thermal"},
539 {"warm,s3_wakeup", "s3_wakeup"},
540 {"hard,hw_reset", "hw_reset"},
Mark Salyzyncabbe4f2017-10-23 13:52:39 -0700541 {"reboot,2sec", "2sec_reboot"},
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700542 {"bootloader", ""},
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700543 };
544
545 // Either the primary or alias is found _somewhere_ in the reason string.
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700546 for (auto& s : aliasReasons) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700547 if (reason.find(s.first) != std::string::npos) {
548 ret = s.first;
549 break;
550 }
551 if (s.second.size() && (reason.find(s.second) != std::string::npos)) {
552 ret = s.first;
553 break;
554 }
555 }
556 }
557
558 // If watchdog is the reason, see if there is a security angle?
559 if (ret == "watchdog") {
560 if (reason.find("sec") != std::string::npos) {
561 ret += ",security";
562 }
563 }
564
Mark Salyzyn64610892017-09-18 10:41:14 -0700565 if (ret == "kernel_panic") {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700566 // Check to see if last klog has some refinement hints.
567 std::string content;
Mark Salyzyn64610892017-09-18 10:41:14 -0700568 if (readPstoreConsole(content)) {
569 addKernelPanicSubReason(content, ret);
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700570 }
Mark Salyzyn64610892017-09-18 10:41:14 -0700571 } else if (isBluntRebootReason(ret)) {
572 // Check the other available reason resources if the reason is still blunt.
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700573
Mark Salyzyn64610892017-09-18 10:41:14 -0700574 // Check to see if last klog has some refinement hints.
575 std::string content;
576 if (readPstoreConsole(content)) {
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700577 const pstoreConsole console(content);
Mark Salyzyn64610892017-09-18 10:41:14 -0700578 // The toybox reboot command used directly (unlikely)? But also
579 // catches init's response to Android's more controlled reboot command.
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700580 if (console.rfind("reboot: Power down") != std::string::npos) {
Mark Salyzyn64610892017-09-18 10:41:14 -0700581 ret = "shutdown"; // Still too blunt, but more accurate.
582 // ToDo: init should record the shutdown reason to kernel messages ala:
583 // init: shutdown system with command 'last_reboot_reason'
584 // so that if pstore has persistence we can get some details
585 // that could be missing in last_reboot_reason_property.
586 }
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700587
Mark Salyzyn64610892017-09-18 10:41:14 -0700588 static const char cmd[] = "reboot: Restarting system with command '";
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700589 size_t pos = console.rfind(cmd);
Mark Salyzyn64610892017-09-18 10:41:14 -0700590 if (pos != std::string::npos) {
591 pos += strlen(cmd);
Mark Salyzyna16e4372017-09-20 08:36:12 -0700592 std::string subReason(content.substr(pos, max_reason_length));
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700593 // Correct against any known strings that Bit Error Match
594 for (const auto& s : knownReasons) {
595 correctForBer(subReason, s);
596 }
597 for (const auto& m : kBootReasonMap) {
598 if (m.first.length() <= strlen("cold")) continue; // too short?
599 if (correctForBer(subReason, m.first + "'")) continue;
600 if (m.first.length() <= strlen("reboot,cold")) continue; // short?
601 if (!android::base::StartsWith(m.first, "reboot,")) continue;
602 correctForBer(subReason, m.first.substr(strlen("reboot,")) + "'");
603 }
Mark Salyzyna16e4372017-09-20 08:36:12 -0700604 for (pos = 0; pos < subReason.length(); ++pos) {
Mark Salyzyn88d692c2017-09-20 08:37:46 -0700605 char c = subReason[pos];
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700606 // #, &, %, / are common single bit error for ' that we can block
607 if (!::isprint(c) || (c == '\'') || (c == '#') || (c == '&') || (c == '%') || (c == '/')) {
Mark Salyzyna16e4372017-09-20 08:36:12 -0700608 subReason.erase(pos);
609 break;
610 }
Mark Salyzyna16e4372017-09-20 08:36:12 -0700611 }
Mark Salyzyn88d692c2017-09-20 08:37:46 -0700612 transformReason(subReason);
Mark Salyzyn64610892017-09-18 10:41:14 -0700613 if (subReason != "") { // Will not land "reboot" as that is too blunt.
614 if (isKernelRebootReason(subReason)) {
615 ret = "reboot," + subReason; // User space can't talk kernel reasons.
Mark Salyzyndafced92017-09-20 08:37:46 -0700616 } else if (isKnownRebootReason(subReason)) {
Mark Salyzyn64610892017-09-18 10:41:14 -0700617 ret = subReason;
Mark Salyzyndafced92017-09-20 08:37:46 -0700618 } else {
619 ret = "reboot," + subReason; // legitimize unknown reasons
Mark Salyzyn64610892017-09-18 10:41:14 -0700620 }
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700621 }
622 }
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700623
Mark Salyzyn64610892017-09-18 10:41:14 -0700624 // Check for kernel panics, allowed to override reboot command.
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700625 if (!addKernelPanicSubReason(console, ret) &&
Mark Salyzyn64610892017-09-18 10:41:14 -0700626 // check for long-press power down
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700627 ((console.rfind("Power held for ") != std::string::npos) ||
628 (console.rfind("charger: [") != std::string::npos))) {
Mark Salyzyn64610892017-09-18 10:41:14 -0700629 ret = "cold";
630 }
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700631 }
632
633 // The following battery test should migrate to a default system health HAL
634
635 // Let us not worry if the reboot command was issued, for the cases of
636 // reboot -p, reboot <no reason>, reboot cold, reboot warm and reboot hard.
637 // Same for bootloader and ro.boot.bootreasons of this set, but a dead
638 // battery could conceivably lead to these, so worthy of override.
639 if (isBluntRebootReason(ret)) {
640 // Heuristic to determine if shutdown possibly because of a dead battery?
641 // Really a hail-mary pass to find it in last klog content ...
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700642 static const int battery_dead_threshold = 2; // percent
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700643 static const char battery[] = "healthd: battery l=";
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700644 const pstoreConsole console(content);
645 size_t pos = console.rfind(battery); // last one
Mark Salyzyna16e4372017-09-20 08:36:12 -0700646 std::string digits;
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700647 if (pos != std::string::npos) {
Mark Salyzyn747c0e62017-09-20 08:37:46 -0700648 digits = content.substr(pos + strlen(battery), strlen("100 "));
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700649 // correct common errors
650 correctForBer(digits, "100 ");
651 if (digits[0] == '!') digits[0] = '1';
652 if (digits[1] == '!') digits[1] = '1';
Mark Salyzyna16e4372017-09-20 08:36:12 -0700653 }
Mark Salyzyn747c0e62017-09-20 08:37:46 -0700654 const char* endptr = digits.c_str();
655 unsigned level = 0;
656 while (::isdigit(*endptr)) {
657 level *= 10;
658 level += *endptr++ - '0';
659 // make sure no leading zeros, except zero itself, and range check.
660 if ((level == 0) || (level > 100)) break;
661 }
Mark Salyzyn293cb3b2017-09-20 08:37:46 -0700662 // example bit error rate issues for 10%
663 // 'l=10 ' no bits in error
664 // 'l=00 ' single bit error (fails above)
665 // 'l=1 ' single bit error
666 // 'l=0 ' double bit error
667 // There are others, not typically critical because of 2%
668 // battery_dead_threshold. KISS check, make sure second
669 // character after digit sequence is not a space.
670 if ((level <= 100) && (endptr != digits.c_str()) && (endptr[0] == ' ') && (endptr[1] != ' ')) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700671 LOG(INFO) << "Battery level at shutdown " << level << "%";
672 if (level <= battery_dead_threshold) {
673 ret = "shutdown,battery";
674 }
Mark Salyzyna16e4372017-09-20 08:36:12 -0700675 } else { // Most likely
676 digits = ""; // reset digits
677
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700678 // Content buffer no longer will have console data. Beware if more
679 // checks added below, that depend on parsing console content.
680 content = "";
681
682 LOG(DEBUG) << "Can not find last low battery in last console messages";
683 android_logcat_context ctx = create_android_logcat();
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700684 FILE* fp = android_logcat_popen(&ctx, "logcat -b kernel -v brief -d");
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700685 if (fp != nullptr) {
686 android::base::ReadFdToString(fileno(fp), &content);
687 }
688 android_logcat_pclose(&ctx, fp);
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700689 static const char logcat_battery[] = "W/healthd ( 0): battery l=";
690 const char* match = logcat_battery;
691
692 if (content == "") {
693 // Service logd.klog not running, go to smaller buffer in the kernel.
694 int rc = klogctl(KLOG_SIZE_BUFFER, nullptr, 0);
695 if (rc > 0) {
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700696 ssize_t len = rc + 1024; // 1K Margin should it grow between calls.
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700697 std::unique_ptr<char[]> buf(new char[len]);
698 rc = klogctl(KLOG_READ_ALL, buf.get(), len);
699 if (rc < len) {
700 len = rc + 1;
701 }
702 buf[--len] = '\0';
703 content = buf.get();
704 }
705 match = battery;
706 }
707
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700708 pos = content.find(match); // The first one it finds.
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700709 if (pos != std::string::npos) {
Mark Salyzyn747c0e62017-09-20 08:37:46 -0700710 digits = content.substr(pos + strlen(match), strlen("100 "));
Mark Salyzyna16e4372017-09-20 08:36:12 -0700711 }
Mark Salyzyn747c0e62017-09-20 08:37:46 -0700712 endptr = digits.c_str();
713 level = 0;
714 while (::isdigit(*endptr)) {
715 level *= 10;
716 level += *endptr++ - '0';
717 // make sure no leading zeros, except zero itself, and range check.
718 if ((level == 0) || (level > 100)) break;
719 }
Mark Salyzyna16e4372017-09-20 08:36:12 -0700720 if ((level <= 100) && (endptr != digits.c_str()) && (*endptr == ' ')) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700721 LOG(INFO) << "Battery level at startup " << level << "%";
722 if (level <= battery_dead_threshold) {
723 ret = "shutdown,battery";
724 }
725 } else {
726 LOG(DEBUG) << "Can not find first battery level in dmesg or logcat";
727 }
728 }
729 }
730
731 // Is there a controlled shutdown hint in last_reboot_reason_property?
732 if (isBluntRebootReason(ret)) {
733 // Content buffer no longer will have console data. Beware if more
734 // checks added below, that depend on parsing console content.
735 content = GetProperty(last_reboot_reason_property);
Mark Salyzyn88d692c2017-09-20 08:37:46 -0700736 transformReason(content);
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700737
Mark Salyzyn62909822017-10-09 09:27:16 -0700738 // Anything in last is better than 'super-blunt' reboot or shutdown.
739 if ((ret == "") || (ret == "reboot") || (ret == "shutdown") || !isBluntRebootReason(content)) {
740 ret = content;
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700741 }
742 }
743
744 // Other System Health HAL reasons?
745
746 // ToDo: /proc/sys/kernel/boot_reason needs a HAL interface to
747 // possibly offer hardware-specific clues from the PMIC.
748 }
749
750 // If unknown left over from above, make it "reboot,<boot_reason>"
751 if (ret == "") {
752 ret = "reboot";
753 if (android::base::StartsWith(reason, "reboot")) {
754 reason = reason.substr(strlen("reboot"));
Mark Salyzyn0af71a52017-10-05 13:58:04 -0700755 while ((reason[0] == ',') || (reason[0] == '_')) {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700756 reason = reason.substr(1);
757 }
758 }
759 if (reason != "") {
760 ret += ",";
761 ret += reason;
762 }
763 }
764
765 LOG(INFO) << "Canonical boot reason: " << ret;
766 if (isKernelRebootReason(ret) && (GetProperty(last_reboot_reason_property) != "")) {
767 // Rewrite as it must be old news, kernel reasons trump user space.
768 SetProperty(last_reboot_reason_property, ret);
769 }
770 return ret;
771}
772
James Hawkinsb9cf7712016-04-08 15:32:19 -0700773// Returns the appropriate metric key prefix for the boot_complete metric such
774// that boot metrics after a system update are labeled as ota_boot_complete;
775// otherwise, they are labeled as boot_complete. This method encapsulates the
776// bookkeeping required to track when a system update has occurred by storing
777// the UTC timestamp of the system build date and comparing against the current
778// system build date.
779std::string CalculateBootCompletePrefix() {
780 static const std::string kBuildDateKey = "build_date";
781 std::string boot_complete_prefix = "boot_complete";
782
783 std::string build_date_str = GetProperty("ro.build.date.utc");
James Hawkins4dded612016-07-28 11:50:23 -0700784 int32_t build_date;
Elliott Hughesda46b392016-10-11 17:09:00 -0700785 if (!android::base::ParseInt(build_date_str, &build_date)) {
James Hawkins4dded612016-07-28 11:50:23 -0700786 return std::string();
787 }
James Hawkinsb9cf7712016-04-08 15:32:19 -0700788
789 BootEventRecordStore boot_event_store;
790 BootEventRecordStore::BootEventRecord record;
James Hawkins0bc4ad42017-05-30 15:03:15 -0700791 if (!boot_event_store.GetBootEvent(kBuildDateKey, &record)) {
792 boot_complete_prefix = "factory_reset_" + boot_complete_prefix;
793 boot_event_store.AddBootEventWithValue(kBuildDateKey, build_date);
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700794 LOG(INFO) << "Canonical boot reason: reboot,factory_reset";
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700795 SetProperty(system_reboot_reason_property, "reboot,factory_reset");
James Hawkins0bc4ad42017-05-30 15:03:15 -0700796 } else if (build_date != record.second) {
James Hawkinsb9cf7712016-04-08 15:32:19 -0700797 boot_complete_prefix = "ota_" + boot_complete_prefix;
798 boot_event_store.AddBootEventWithValue(kBuildDateKey, build_date);
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700799 LOG(INFO) << "Canonical boot reason: reboot,ota";
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700800 SetProperty(system_reboot_reason_property, "reboot,ota");
James Hawkinsb9cf7712016-04-08 15:32:19 -0700801 }
802
803 return boot_complete_prefix;
804}
805
James Hawkinsef0a0902017-01-06 14:38:23 -0800806// Records the value of a given ro.boottime.init property in milliseconds.
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700807void RecordInitBootTimeProp(BootEventRecordStore* boot_event_store, const char* property) {
James Hawkinsef0a0902017-01-06 14:38:23 -0800808 std::string value = GetProperty(property);
809
James Hawkins27c05222017-01-26 11:55:44 -0800810 int32_t time_in_ms;
811 if (android::base::ParseInt(value, &time_in_ms)) {
James Hawkinsef0a0902017-01-06 14:38:23 -0800812 boot_event_store->AddBootEventWithValue(property, time_in_ms);
813 }
814}
815
James Hawkins1bfcaec2017-05-19 14:27:27 -0700816// A map from bootloader timing stage to the time that stage took during boot.
817typedef std::map<std::string, int32_t> BootloaderTimingMap;
818
819// Returns a mapping from bootloader stage names to the time those stages
820// took to boot.
821const BootloaderTimingMap GetBootLoaderTimings() {
822 BootloaderTimingMap timings;
823
824 // |ro.boot.boottime| is of the form 'stage1:time1,...,stageN:timeN',
825 // where timeN is in milliseconds.
James Hawkinsbe46fd12017-02-02 16:21:25 -0800826 std::string value = GetProperty("ro.boot.boottime");
James Hawkins6b5c5aa2017-02-16 11:53:03 -0800827 if (value.empty()) {
828 // ro.boot.boottime is not reported on all devices.
James Hawkins1bfcaec2017-05-19 14:27:27 -0700829 return BootloaderTimingMap();
James Hawkins6b5c5aa2017-02-16 11:53:03 -0800830 }
James Hawkinsbe46fd12017-02-02 16:21:25 -0800831
832 auto stages = android::base::Split(value, ",");
James Hawkins1bfcaec2017-05-19 14:27:27 -0700833 for (const auto& stageTiming : stages) {
James Hawkinsbe46fd12017-02-02 16:21:25 -0800834 // |stageTiming| is of the form 'stage:time'.
835 auto stageTimingValues = android::base::Split(stageTiming, ":");
James Hawkins0bc4ad42017-05-30 15:03:15 -0700836 DCHECK_EQ(2U, stageTimingValues.size());
James Hawkinsbe46fd12017-02-02 16:21:25 -0800837
838 std::string stageName = stageTimingValues[0];
839 int32_t time_ms;
840 if (android::base::ParseInt(stageTimingValues[1], &time_ms)) {
James Hawkins1bfcaec2017-05-19 14:27:27 -0700841 timings[stageName] = time_ms;
James Hawkinsbe46fd12017-02-02 16:21:25 -0800842 }
843 }
James Hawkins6b5c5aa2017-02-16 11:53:03 -0800844
James Hawkins1bfcaec2017-05-19 14:27:27 -0700845 return timings;
846}
847
848// Parses and records the set of bootloader stages and associated boot times
849// from the ro.boot.boottime system property.
850void RecordBootloaderTimings(BootEventRecordStore* boot_event_store,
851 const BootloaderTimingMap& bootloader_timings) {
852 int32_t total_time = 0;
853 for (const auto& timing : bootloader_timings) {
854 total_time += timing.second;
855 boot_event_store->AddBootEventWithValue("boottime.bootloader." + timing.first, timing.second);
856 }
857
James Hawkins6b5c5aa2017-02-16 11:53:03 -0800858 boot_event_store->AddBootEventWithValue("boottime.bootloader.total", total_time);
James Hawkinsbe46fd12017-02-02 16:21:25 -0800859}
860
James Hawkins1bfcaec2017-05-19 14:27:27 -0700861// Records the closest estimation to the absolute device boot time, i.e.,
862// from power on to boot_complete, including bootloader times.
863void RecordAbsoluteBootTime(BootEventRecordStore* boot_event_store,
864 const BootloaderTimingMap& bootloader_timings,
865 std::chrono::milliseconds uptime) {
866 int32_t bootloader_time_ms = 0;
867
868 for (const auto& timing : bootloader_timings) {
869 if (timing.first.compare("SW") != 0) {
870 bootloader_time_ms += timing.second;
871 }
872 }
873
874 auto bootloader_duration = std::chrono::milliseconds(bootloader_time_ms);
875 auto absolute_total =
876 std::chrono::duration_cast<std::chrono::seconds>(bootloader_duration + uptime);
877 boot_event_store->AddBootEventWithValue("absolute_boot_time", absolute_total.count());
878}
879
James Hawkinsc08e9962016-03-11 14:59:50 -0800880// Records several metrics related to the time it takes to boot the device,
881// including disambiguating boot time on encrypted or non-encrypted devices.
882void RecordBootComplete() {
883 BootEventRecordStore boot_event_store;
James Hawkinsb9cf7712016-04-08 15:32:19 -0700884 BootEventRecordStore::BootEventRecord record;
James Hawkins2d8b3e62016-04-14 14:13:20 -0700885
James Hawkins1bfcaec2017-05-19 14:27:27 -0700886 auto time_since_epoch = android::base::boot_clock::now().time_since_epoch();
887 auto uptime = std::chrono::duration_cast<std::chrono::seconds>(time_since_epoch);
James Hawkins2d8b3e62016-04-14 14:13:20 -0700888 time_t current_time_utc = time(nullptr);
889
890 if (boot_event_store.GetBootEvent("last_boot_time_utc", &record)) {
891 time_t last_boot_time_utc = record.second;
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700892 time_t time_since_last_boot = difftime(current_time_utc, last_boot_time_utc);
893 boot_event_store.AddBootEventWithValue("time_since_last_boot", time_since_last_boot);
James Hawkins2d8b3e62016-04-14 14:13:20 -0700894 }
895
896 boot_event_store.AddBootEventWithValue("last_boot_time_utc", current_time_utc);
James Hawkinsc08e9962016-03-11 14:59:50 -0800897
James Hawkinsb9cf7712016-04-08 15:32:19 -0700898 // The boot_complete metric has two variants: boot_complete and
899 // ota_boot_complete. The latter signifies that the device is booting after
900 // a system update.
901 std::string boot_complete_prefix = CalculateBootCompletePrefix();
James Hawkins4dded612016-07-28 11:50:23 -0700902 if (boot_complete_prefix.empty()) {
903 // The system is hosed because the build date property could not be read.
904 return;
905 }
James Hawkinsc08e9962016-03-11 14:59:50 -0800906
907 // post_decrypt_time_elapsed is only logged on encrypted devices.
908 if (boot_event_store.GetBootEvent("post_decrypt_time_elapsed", &record)) {
909 // Log the amount of time elapsed until the device is decrypted, which
910 // includes the variable amount of time the user takes to enter the
911 // decryption password.
James Hawkinse78ea772017-03-24 11:43:02 -0700912 boot_event_store.AddBootEventWithValue("boot_decryption_complete", uptime.count());
James Hawkinsc08e9962016-03-11 14:59:50 -0800913
914 // Subtract the decryption time to normalize the boot cycle timing.
James Hawkinse78ea772017-03-24 11:43:02 -0700915 std::chrono::seconds boot_complete = std::chrono::seconds(uptime.count() - record.second);
James Hawkinsb9cf7712016-04-08 15:32:19 -0700916 boot_event_store.AddBootEventWithValue(boot_complete_prefix + "_post_decrypt",
James Hawkinse78ea772017-03-24 11:43:02 -0700917 boot_complete.count());
James Hawkinsc08e9962016-03-11 14:59:50 -0800918 } else {
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700919 boot_event_store.AddBootEventWithValue(boot_complete_prefix + "_no_encryption", uptime.count());
James Hawkinsc08e9962016-03-11 14:59:50 -0800920 }
921
922 // Record the total time from device startup to boot complete, regardless of
923 // encryption state.
James Hawkinse78ea772017-03-24 11:43:02 -0700924 boot_event_store.AddBootEventWithValue(boot_complete_prefix, uptime.count());
James Hawkinsef0a0902017-01-06 14:38:23 -0800925
926 RecordInitBootTimeProp(&boot_event_store, "ro.boottime.init");
927 RecordInitBootTimeProp(&boot_event_store, "ro.boottime.init.selinux");
928 RecordInitBootTimeProp(&boot_event_store, "ro.boottime.init.cold_boot_wait");
James Hawkinsbe46fd12017-02-02 16:21:25 -0800929
James Hawkins1bfcaec2017-05-19 14:27:27 -0700930 const BootloaderTimingMap bootloader_timings = GetBootLoaderTimings();
931 RecordBootloaderTimings(&boot_event_store, bootloader_timings);
932
933 auto uptime_ms = std::chrono::duration_cast<std::chrono::milliseconds>(time_since_epoch);
934 RecordAbsoluteBootTime(&boot_event_store, bootloader_timings, uptime_ms);
James Hawkinsc08e9962016-03-11 14:59:50 -0800935}
936
James Hawkinsa4a1a4a2016-02-09 15:32:38 -0800937// Records the boot_reason metric by querying the ro.boot.bootreason system
938// property.
939void RecordBootReason() {
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700940 const std::string reason(GetProperty(bootloader_reboot_reason_property));
James Hawkins25f71222017-10-10 16:37:05 -0700941
942 if (reason.empty()) {
943 // Log an empty boot reason value as '<EMPTY>' to ensure the value is intentional
944 // (and not corruption anywhere else in the reporting pipeline).
945 android::metricslogger::LogMultiAction(android::metricslogger::ACTION_BOOT,
946 android::metricslogger::FIELD_PLATFORM_REASON, "<EMPTY>");
947 } else {
948 android::metricslogger::LogMultiAction(android::metricslogger::ACTION_BOOT,
949 android::metricslogger::FIELD_PLATFORM_REASON, reason);
950 }
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700951
952 // Log the raw bootloader_boot_reason property value.
953 int32_t boot_reason = BootReasonStrToEnum(reason);
James Hawkinsa4a1a4a2016-02-09 15:32:38 -0800954 BootEventRecordStore boot_event_store;
955 boot_event_store.AddBootEventWithValue("boot_reason", boot_reason);
Mark Salyzynb304f6d2017-08-04 13:35:51 -0700956
957 // Log the scrubbed system_boot_reason.
958 const std::string system_reason(BootReasonStrToReason(reason));
959 int32_t system_boot_reason = BootReasonStrToEnum(system_reason);
960 boot_event_store.AddBootEventWithValue("system_boot_reason", system_boot_reason);
961
962 // Record the scrubbed system_boot_reason to the property
963 SetProperty(system_reboot_reason_property, system_reason);
964 if (reason == "") {
965 SetProperty(bootloader_reboot_reason_property, system_reason);
966 }
James Hawkinsa4a1a4a2016-02-09 15:32:38 -0800967}
968
James Hawkins500d7152016-02-16 15:05:54 -0800969// Records two metrics related to the user resetting a device: the time at
970// which the device is reset, and the time since the user last reset the
971// device. The former is only set once per-factory reset.
972void RecordFactoryReset() {
973 BootEventRecordStore boot_event_store;
974 BootEventRecordStore::BootEventRecord record;
975
976 time_t current_time_utc = time(nullptr);
977
James Hawkins0660b302016-03-08 16:18:15 -0800978 if (current_time_utc < 0) {
979 // UMA does not display negative values in buckets, so convert to positive.
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700980 android::metricslogger::LogHistogram("factory_reset_current_time_failure",
981 std::abs(current_time_utc));
James Hawkinsfff95ba2016-03-29 16:13:49 -0700982
James Hawkins9aec9262017-01-31 11:42:24 -0800983 // Logging via BootEventRecordStore to see if using android::metricslogger::LogHistogram
James Hawkinsfff95ba2016-03-29 16:13:49 -0700984 // is losing records somehow.
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700985 boot_event_store.AddBootEventWithValue("factory_reset_current_time_failure",
986 std::abs(current_time_utc));
James Hawkins0660b302016-03-08 16:18:15 -0800987 return;
988 } else {
James Hawkins9aec9262017-01-31 11:42:24 -0800989 android::metricslogger::LogHistogram("factory_reset_current_time", current_time_utc);
James Hawkinsfff95ba2016-03-29 16:13:49 -0700990
James Hawkins9aec9262017-01-31 11:42:24 -0800991 // Logging via BootEventRecordStore to see if using android::metricslogger::LogHistogram
James Hawkinsfff95ba2016-03-29 16:13:49 -0700992 // is losing records somehow.
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -0700993 boot_event_store.AddBootEventWithValue("factory_reset_current_time", current_time_utc);
James Hawkins0660b302016-03-08 16:18:15 -0800994 }
995
James Hawkins500d7152016-02-16 15:05:54 -0800996 // The factory_reset boot event does not exist after the device is reset, so
997 // use this signal to mark the time of the factory reset.
998 if (!boot_event_store.GetBootEvent("factory_reset", &record)) {
999 boot_event_store.AddBootEventWithValue("factory_reset", current_time_utc);
James Hawkins3bf9b142016-03-03 14:50:24 -08001000
1001 // Don't log the time_since_factory_reset until some time has elapsed.
1002 // The data is not meaningful yet and skews the histogram buckets.
James Hawkins500d7152016-02-16 15:05:54 -08001003 return;
1004 }
1005
1006 // Calculate and record the difference in time between now and the
1007 // factory_reset time.
1008 time_t factory_reset_utc = record.second;
James Hawkins9aec9262017-01-31 11:42:24 -08001009 android::metricslogger::LogHistogram("factory_reset_record_value", factory_reset_utc);
James Hawkinsfff95ba2016-03-29 16:13:49 -07001010
James Hawkins9aec9262017-01-31 11:42:24 -08001011 // Logging via BootEventRecordStore to see if using android::metricslogger::LogHistogram
James Hawkinsfff95ba2016-03-29 16:13:49 -07001012 // is losing records somehow.
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -07001013 boot_event_store.AddBootEventWithValue("factory_reset_record_value", factory_reset_utc);
James Hawkinsfff95ba2016-03-29 16:13:49 -07001014
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -07001015 time_t time_since_factory_reset = difftime(current_time_utc, factory_reset_utc);
1016 boot_event_store.AddBootEventWithValue("time_since_factory_reset", time_since_factory_reset);
James Hawkins500d7152016-02-16 15:05:54 -08001017}
1018
James Hawkinsabd73e62016-01-19 15:10:38 -08001019} // namespace
1020
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -07001021int main(int argc, char** argv) {
James Hawkinsabd73e62016-01-19 15:10:38 -08001022 android::base::InitLogging(argv);
1023
1024 const std::string cmd_line = GetCommandLine(argc, argv);
1025 LOG(INFO) << "Service started: " << cmd_line;
1026
James Hawkinsa4a1a4a2016-02-09 15:32:38 -08001027 int option_index = 0;
James Hawkinsc6275582016-03-22 10:47:44 -07001028 static const char value_str[] = "value";
James Hawkinsc08e9962016-03-11 14:59:50 -08001029 static const char boot_complete_str[] = "record_boot_complete";
James Hawkinsa4a1a4a2016-02-09 15:32:38 -08001030 static const char boot_reason_str[] = "record_boot_reason";
James Hawkins53684ea2016-02-23 16:18:19 -08001031 static const char factory_reset_str[] = "record_time_since_factory_reset";
James Hawkinsa4a1a4a2016-02-09 15:32:38 -08001032 static const struct option long_options[] = {
Mark Salyzyn14b1e6d2017-09-18 10:41:14 -07001033 // clang-format off
1034 { "help", no_argument, NULL, 'h' },
1035 { "log", no_argument, NULL, 'l' },
1036 { "print", no_argument, NULL, 'p' },
1037 { "record", required_argument, NULL, 'r' },
1038 { value_str, required_argument, NULL, 0 },
1039 { boot_complete_str, no_argument, NULL, 0 },
1040 { boot_reason_str, no_argument, NULL, 0 },
1041 { factory_reset_str, no_argument, NULL, 0 },
1042 { NULL, 0, NULL, 0 }
1043 // clang-format on
James Hawkinsa4a1a4a2016-02-09 15:32:38 -08001044 };
1045
James Hawkinsc6275582016-03-22 10:47:44 -07001046 std::string boot_event;
1047 std::string value;
James Hawkinsabd73e62016-01-19 15:10:38 -08001048 int opt = 0;
James Hawkinsa4a1a4a2016-02-09 15:32:38 -08001049 while ((opt = getopt_long(argc, argv, "hlpr:", long_options, &option_index)) != -1) {
James Hawkinsabd73e62016-01-19 15:10:38 -08001050 switch (opt) {
James Hawkinsa4a1a4a2016-02-09 15:32:38 -08001051 // This case handles long options which have no single-character mapping.
1052 case 0: {
1053 const std::string option_name = long_options[option_index].name;
James Hawkinsc6275582016-03-22 10:47:44 -07001054 if (option_name == value_str) {
1055 // |optarg| is an external variable set by getopt representing
1056 // the option argument.
1057 value = optarg;
1058 } else if (option_name == boot_complete_str) {
James Hawkinsc08e9962016-03-11 14:59:50 -08001059 RecordBootComplete();
1060 } else if (option_name == boot_reason_str) {
James Hawkinsa4a1a4a2016-02-09 15:32:38 -08001061 RecordBootReason();
James Hawkins500d7152016-02-16 15:05:54 -08001062 } else if (option_name == factory_reset_str) {
1063 RecordFactoryReset();
James Hawkinsa4a1a4a2016-02-09 15:32:38 -08001064 } else {
1065 LOG(ERROR) << "Invalid option: " << option_name;
1066 }
1067 break;
1068 }
1069
James Hawkinsabd73e62016-01-19 15:10:38 -08001070 case 'h': {
1071 ShowHelp(argv[0]);
1072 break;
1073 }
1074
1075 case 'l': {
1076 LogBootEvents();
1077 break;
1078 }
1079
1080 case 'p': {
1081 PrintBootEvents();
1082 break;
1083 }
1084
1085 case 'r': {
1086 // |optarg| is an external variable set by getopt representing
1087 // the option argument.
James Hawkinsc6275582016-03-22 10:47:44 -07001088 boot_event = optarg;
James Hawkinsabd73e62016-01-19 15:10:38 -08001089 break;
1090 }
1091
1092 default: {
1093 DCHECK_EQ(opt, '?');
1094
1095 // |optopt| is an external variable set by getopt representing
1096 // the value of the invalid option.
1097 LOG(ERROR) << "Invalid option: " << optopt;
1098 ShowHelp(argv[0]);
1099 return EXIT_FAILURE;
1100 }
1101 }
1102 }
1103
James Hawkinsc6275582016-03-22 10:47:44 -07001104 if (!boot_event.empty()) {
1105 RecordBootEventFromCommandLine(boot_event, value);
1106 }
1107
James Hawkinsabd73e62016-01-19 15:10:38 -08001108 return 0;
1109}