metrics/metrics_daemon.cc - platform/system/core - Git at Google

 // Copyright (c) 2011 The Chromium OS Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "metrics_daemon.h"

 #include <fcntl.h>
 #include <math.h>
 #include <string.h>
 #include <time.h>

 #include <base/file_util.h>
 #include <base/logging.h>
 #include <base/string_util.h>
 #include <base/stringprintf.h>
 #include <dbus/dbus-glib-lowlevel.h>

 #include "counter.h"

 using base::Time;
 using base::TimeDelta;
 using base::TimeTicks;
 using std::map;
 using std::string;
 using std::vector;


 #define SAFE_MESSAGE(e) (e.message ? e.message : "unknown error")
 #define DBUS_IFACE_CRASH_REPORTER "org.chromium.CrashReporter"
 #define DBUS_IFACE_POWER_MANAGER "org.chromium.PowerManager"
 #define DBUS_IFACE_SESSION_MANAGER "org.chromium.SessionManagerInterface"

 static const int kSecondsPerMinute = 60;
 static const int kMinutesPerHour = 60;
 static const int kHoursPerDay = 24;
 static const int kMinutesPerDay = kHoursPerDay * kMinutesPerHour;
 static const int kSecondsPerDay = kSecondsPerMinute * kMinutesPerDay;
 static const int kDaysPerWeek = 7;
 static const int kSecondsPerWeek = kSecondsPerDay * kDaysPerWeek;

 // The daily use monitor is scheduled to a 1-minute interval after
 // initial user activity and then it's exponentially backed off to
 // 10-minute intervals. Although not required, the back off is
 // implemented because the histogram buckets are spaced exponentially
 // anyway and to avoid too frequent metrics daemon process wake-ups
 // and file I/O.
 static const int kUseMonitorIntervalInit = 1 * kSecondsPerMinute;
 static const int kUseMonitorIntervalMax = 10 * kSecondsPerMinute;

 const char kKernelCrashDetectedFile[] = "/tmp/kernel-crash-detected";
 static const char kUncleanShutdownDetectedFile[] =
       "/tmp/unclean-shutdown-detected";

 // static metrics parameters
 const char MetricsDaemon::kMetricDailyUseTimeName[] =
     "Logging.DailyUseTime";
 const int MetricsDaemon::kMetricDailyUseTimeMin = 1;
 const int MetricsDaemon::kMetricDailyUseTimeMax = kMinutesPerDay;
 const int MetricsDaemon::kMetricDailyUseTimeBuckets = 50;

 // crash interval metrics
 const char MetricsDaemon::kMetricKernelCrashIntervalName[] =
     "Logging.KernelCrashInterval";
 const char MetricsDaemon::kMetricUncleanShutdownIntervalName[] =
     "Logging.UncleanShutdownInterval";
 const char MetricsDaemon::kMetricUserCrashIntervalName[] =
     "Logging.UserCrashInterval";

 const int MetricsDaemon::kMetricCrashIntervalMin = 1;
 const int MetricsDaemon::kMetricCrashIntervalMax =
     4 * kSecondsPerWeek;
 const int MetricsDaemon::kMetricCrashIntervalBuckets = 50;

 // crash frequency metrics
 const char MetricsDaemon::kMetricAnyCrashesDailyName[] =
     "Logging.AnyCrashesDaily";
 const char MetricsDaemon::kMetricAnyCrashesWeeklyName[] =
     "Logging.AnyCrashesWeekly";
 const char MetricsDaemon::kMetricKernelCrashesDailyName[] =
     "Logging.KernelCrashesDaily";
 const char MetricsDaemon::kMetricKernelCrashesWeeklyName[] =
     "Logging.KernelCrashesWeekly";
 const char MetricsDaemon::kMetricUncleanShutdownsDailyName[] =
     "Logging.UncleanShutdownsDaily";
 const char MetricsDaemon::kMetricUncleanShutdownsWeeklyName[] =
     "Logging.UncleanShutdownsWeekly";
 const char MetricsDaemon::kMetricUserCrashesDailyName[] =
     "Logging.UserCrashesDaily";
 const char MetricsDaemon::kMetricUserCrashesWeeklyName[] =
     "Logging.UserCrashesWeekly";
 const char MetricsDaemon::kMetricCrashFrequencyMin = 1;
 const char MetricsDaemon::kMetricCrashFrequencyMax = 100;
 const char MetricsDaemon::kMetricCrashFrequencyBuckets = 50;

 // disk stats metrics

 // The {Read,Write}Sectors numbers are in sectors/second.
 // A sector is usually 512 bytes.

 const char MetricsDaemon::kMetricReadSectorsLongName[] =
     "Platform.ReadSectorsLong";
 const char MetricsDaemon::kMetricWriteSectorsLongName[] =
     "Platform.WriteSectorsLong";
 const char MetricsDaemon::kMetricReadSectorsShortName[] =
     "Platform.ReadSectorsShort";
 const char MetricsDaemon::kMetricWriteSectorsShortName[] =
     "Platform.WriteSectorsShort";

 const int MetricsDaemon::kMetricStatsShortInterval = 1;  // seconds
 const int MetricsDaemon::kMetricStatsLongInterval = 30;  // seconds

 const int MetricsDaemon::kMetricMeminfoInterval = 30;        // seconds

 // Assume a max rate of 250Mb/s for reads (worse for writes) and 512 byte
 // sectors.
 const int MetricsDaemon::kMetricSectorsIOMax = 500000;  // sectors/second
 const int MetricsDaemon::kMetricSectorsBuckets = 50;    // buckets
 // Page size is 4k, sector size is 0.5k.  We're not interested in page fault
 // rates that the disk cannot sustain.
 const int MetricsDaemon::kMetricPageFaultsMax = kMetricSectorsIOMax / 8;
 const int MetricsDaemon::kMetricPageFaultsBuckets = 50;

 // Major page faults, i.e. the ones that require data to be read from disk.

 const char MetricsDaemon::kMetricPageFaultsLongName[] =
     "Platform.PageFaultsLong";
 const char MetricsDaemon::kMetricPageFaultsShortName[] =
     "Platform.PageFaultsShort";

 // persistent metrics path
 const char MetricsDaemon::kMetricsPath[] = "/var/log/metrics";


 // static
 const char* MetricsDaemon::kDBusMatches_[] = {
   "type='signal',"
   "interface='" DBUS_IFACE_CRASH_REPORTER "',"
   "path='/',"
   "member='UserCrash'",

   "type='signal',"
   "interface='" DBUS_IFACE_POWER_MANAGER "',"
   "path='/'",

   "type='signal',"
   "sender='org.chromium.SessionManager',"
   "interface='" DBUS_IFACE_SESSION_MANAGER "',"
   "path='/org/chromium/SessionManager',"
   "member='SessionStateChanged'",
 };

 // static
 const char* MetricsDaemon::kPowerStates_[] = {
 #define STATE(name, capname) #name,
 #include "power_states.h"
 };

 // static
 const char* MetricsDaemon::kSessionStates_[] = {
 #define STATE(name, capname) #name,
 #include "session_states.h"
 };

 // Memory use stats collection intervals.  We collect some memory use interval
 // at these intervals after boot, and we stop collecting after the last one,
 // with the assumption that in most cases the memory use won't change much
 // after that.
 static const int kMemuseIntervals[] = {
   1 * kSecondsPerMinute,    // 1 minute mark
   4 * kSecondsPerMinute,    // 5 minute mark
   25 * kSecondsPerMinute,   // 0.5 hour mark
   120 * kSecondsPerMinute,  // 2.5 hour mark
   600 * kSecondsPerMinute,  // 12.5 hour mark
 };

 MetricsDaemon::MetricsDaemon()
     : power_state_(kUnknownPowerState),
       session_state_(kUnknownSessionState),
       user_active_(false),
       usemon_interval_(0),
       usemon_source_(NULL),
       memuse_initial_time_(0),
       memuse_interval_index_(0),
       read_sectors_(0),
       write_sectors_(0),
       page_faults_(0),
       stats_state_(kStatsShort),
       stats_initial_time_(0) {}

 MetricsDaemon::~MetricsDaemon() {
   DeleteFrequencyCounters();
 }

 double MetricsDaemon::GetActiveTime() {
   struct timespec ts;
   int r = clock_gettime(CLOCK_MONOTONIC, &ts);
   if (r < 0) {
     PLOG(WARNING) << "clock_gettime(CLOCK_MONOTONIC) failed";
     return 0;
   } else {
     return ts.tv_sec + ((double) ts.tv_nsec) / (1000 * 1000 * 1000);
   }
 }

 void MetricsDaemon::DeleteFrequencyCounters() {
   for (FrequencyCounters::iterator i = frequency_counters_.begin();
        i != frequency_counters_.end(); ++i) {
     delete i->second;
     i->second = NULL;
   }
 }

 void MetricsDaemon::Run(bool run_as_daemon) {
   if (run_as_daemon && daemon(0, 0) != 0)
     return;

   if (CheckSystemCrash(kKernelCrashDetectedFile)) {
     ProcessKernelCrash();
   }

   if (CheckSystemCrash(kUncleanShutdownDetectedFile)) {
     ProcessUncleanShutdown();
   }

   Loop();
 }

 FilePath MetricsDaemon::GetHistogramPath(const char* histogram_name) {
   return FilePath(kMetricsPath).Append(histogram_name);
 }

 void MetricsDaemon::ConfigureCrashIntervalReporter(
     const char* histogram_name,
     scoped_ptr<chromeos_metrics::TaggedCounterReporter>* reporter) {
   reporter->reset(new chromeos_metrics::TaggedCounterReporter());
   FilePath file_path = GetHistogramPath(histogram_name);
   (*reporter)->Init(file_path.value().c_str(),
                     histogram_name,
                     kMetricCrashIntervalMin,
                     kMetricCrashIntervalMax,
                     kMetricCrashIntervalBuckets);
 }

 void MetricsDaemon::ConfigureCrashFrequencyReporter(
     const char* histogram_name) {
   scoped_ptr<chromeos_metrics::TaggedCounterReporter> reporter(
       new chromeos_metrics::TaggedCounterReporter());
   FilePath file_path = GetHistogramPath(histogram_name);
   reporter->Init(file_path.value().c_str(),
                  histogram_name,
                  kMetricCrashFrequencyMin,
                  kMetricCrashFrequencyMax,
                  kMetricCrashFrequencyBuckets);
   scoped_ptr<chromeos_metrics::FrequencyCounter> new_counter(
       new chromeos_metrics::FrequencyCounter());
   time_t cycle_duration = strstr(histogram_name, "Weekly") != NULL ?
       chromeos_metrics::kSecondsPerWeek :
       chromeos_metrics::kSecondsPerDay;
   new_counter->Init(
       static_cast<chromeos_metrics::TaggedCounterInterface*>(
           reporter.release()),
       cycle_duration);
   frequency_counters_[histogram_name] = new_counter.release();
 }

 void MetricsDaemon::Init(bool testing, MetricsLibraryInterface* metrics_lib,
                          const string& diskstats_path,
                          const string& vmstats_path) {
   testing_ = testing;
   DCHECK(metrics_lib != NULL);
   metrics_lib_ = metrics_lib;
   chromeos_metrics::TaggedCounterReporter::
       SetMetricsLibraryInterface(metrics_lib);

   static const char kDailyUseRecordFile[] = "/var/log/metrics/daily-usage";
   daily_use_.reset(new chromeos_metrics::TaggedCounter());
   daily_use_->Init(kDailyUseRecordFile, &ReportDailyUse, this);

   ConfigureCrashIntervalReporter(kMetricKernelCrashIntervalName,
                                  &kernel_crash_interval_);
   ConfigureCrashIntervalReporter(kMetricUncleanShutdownIntervalName,
                                  &unclean_shutdown_interval_);
   ConfigureCrashIntervalReporter(kMetricUserCrashIntervalName,
                                  &user_crash_interval_);

   DeleteFrequencyCounters();
   ConfigureCrashFrequencyReporter(kMetricAnyCrashesDailyName);
   ConfigureCrashFrequencyReporter(kMetricAnyCrashesWeeklyName);
   ConfigureCrashFrequencyReporter(kMetricKernelCrashesDailyName);
   ConfigureCrashFrequencyReporter(kMetricKernelCrashesWeeklyName);
   ConfigureCrashFrequencyReporter(kMetricUncleanShutdownsDailyName);
   ConfigureCrashFrequencyReporter(kMetricUncleanShutdownsWeeklyName);
   ConfigureCrashFrequencyReporter(kMetricUserCrashesDailyName);
   ConfigureCrashFrequencyReporter(kMetricUserCrashesWeeklyName);

   diskstats_path_ = diskstats_path;
   vmstats_path_ = vmstats_path;
   StatsReporterInit();

   // Start collecting meminfo stats.
   ScheduleMeminfoCallback(kMetricMeminfoInterval);
   ScheduleMemuseCallback(true, 0);

   // Don't setup D-Bus and GLib in test mode.
   if (testing)
     return;

   g_thread_init(NULL);
   g_type_init();
   dbus_g_thread_init();

   DBusError error;
   dbus_error_init(&error);

   DBusConnection* connection = dbus_bus_get(DBUS_BUS_SYSTEM, &error);
   LOG_IF(FATAL, dbus_error_is_set(&error)) <<
       "No D-Bus connection: " << SAFE_MESSAGE(error);

   dbus_connection_setup_with_g_main(connection, NULL);

   // Registers D-Bus matches for the signals we would like to catch.
   for (unsigned int m = 0; m < arraysize(kDBusMatches_); m++) {
     const char* match = kDBusMatches_[m];
     DLOG(INFO) << "adding dbus match: " << match;
     dbus_bus_add_match(connection, match, &error);
     LOG_IF(FATAL, dbus_error_is_set(&error)) <<
         "unable to add a match: " << SAFE_MESSAGE(error);
   }

   // Adds the D-Bus filter routine to be called back whenever one of
   // the registered D-Bus matches is successful. The daemon is not
   // activated for D-Bus messages that don't match.
   CHECK(dbus_connection_add_filter(connection, MessageFilter, this, NULL));
 }

 void MetricsDaemon::Loop() {
   GMainLoop* loop = g_main_loop_new(NULL, false);
   g_main_loop_run(loop);
 }

 // static
 DBusHandlerResult MetricsDaemon::MessageFilter(DBusConnection* connection,
                                                DBusMessage* message,
                                                void* user_data) {
   Time now = Time::Now();
   DLOG(INFO) << "message intercepted @ " << now.ToInternalValue();

   int message_type = dbus_message_get_type(message);
   if (message_type != DBUS_MESSAGE_TYPE_SIGNAL) {
     DLOG(WARNING) << "unexpected message type " << message_type;
     return DBUS_HANDLER_RESULT_NOT_YET_HANDLED;
   }

   // Signal messages always have interfaces.
   const char* interface = dbus_message_get_interface(message);
   CHECK(interface != NULL);

   MetricsDaemon* daemon = static_cast<MetricsDaemon*>(user_data);

   DBusMessageIter iter;
   dbus_message_iter_init(message, &iter);
   if (strcmp(interface, DBUS_IFACE_CRASH_REPORTER) == 0) {
     CHECK(strcmp(dbus_message_get_member(message),
                  "UserCrash") == 0);
     daemon->ProcessUserCrash();
   } else if (strcmp(interface, DBUS_IFACE_POWER_MANAGER) == 0) {
     const char* member = dbus_message_get_member(message);
     if (strcmp(member, "ScreenIsLocked") == 0) {
       daemon->SetUserActiveState(false, now);
     } else if (strcmp(member, "ScreenIsUnlocked") == 0) {
       daemon->SetUserActiveState(true, now);
     } else if (strcmp(member, "PowerStateChanged") == 0) {
       char* state_name;
       dbus_message_iter_get_basic(&iter, &state_name);
       daemon->PowerStateChanged(state_name, now);
     }
   } else if (strcmp(interface, DBUS_IFACE_SESSION_MANAGER) == 0) {
     CHECK(strcmp(dbus_message_get_member(message),
                  "SessionStateChanged") == 0);

     char* state_name;
     dbus_message_iter_get_basic(&iter, &state_name);
     daemon->SessionStateChanged(state_name, now);
   } else {
     DLOG(WARNING) << "unexpected interface: " << interface;
     return DBUS_HANDLER_RESULT_NOT_YET_HANDLED;
   }

   return DBUS_HANDLER_RESULT_HANDLED;
 }

 void MetricsDaemon::PowerStateChanged(const char* state_name, Time now) {
   DLOG(INFO) << "power state: " << state_name;
   power_state_ = LookupPowerState(state_name);

   if (power_state_ != kPowerStateOn)
     SetUserActiveState(false, now);
 }

 MetricsDaemon::PowerState
 MetricsDaemon::LookupPowerState(const char* state_name) {
   for (int i = 0; i < kNumberPowerStates; i++) {
     if (strcmp(state_name, kPowerStates_[i]) == 0) {
       return static_cast<PowerState>(i);
     }
   }
   DLOG(WARNING) << "unknown power state: " << state_name;
   return kUnknownPowerState;
 }

 void MetricsDaemon::SessionStateChanged(const char* state_name, Time now) {
   DLOG(INFO) << "user session state: " << state_name;
   session_state_ = LookupSessionState(state_name);
   SetUserActiveState(session_state_ == kSessionStateStarted, now);
 }

 MetricsDaemon::SessionState
 MetricsDaemon::LookupSessionState(const char* state_name) {
   for (int i = 0; i < kNumberSessionStates; i++) {
     if (strcmp(state_name, kSessionStates_[i]) == 0) {
       return static_cast<SessionState>(i);
     }
   }
   DLOG(WARNING) << "unknown user session state: " << state_name;
   return kUnknownSessionState;
 }

 void MetricsDaemon::SetUserActiveState(bool active, Time now) {
   DLOG(INFO) << "user: " << (active ? "active" : "inactive");

   // Calculates the seconds of active use since the last update and
   // the day since Epoch, and logs the usage data.  Guards against the
   // time jumping back and forth due to the user changing it by
   // discarding the new use time.
   int seconds = 0;
   if (user_active_ && now > user_active_last_) {
     TimeDelta since_active = now - user_active_last_;
     if (since_active < TimeDelta::FromSeconds(
             kUseMonitorIntervalMax + kSecondsPerMinute)) {
       seconds = static_cast<int>(since_active.InSeconds());
     }
   }
   TimeDelta since_epoch = now - Time();
   int day = since_epoch.InDays();
   daily_use_->Update(day, seconds);
   user_crash_interval_->Update(0, seconds);
   kernel_crash_interval_->Update(0, seconds);

   // Flush finished cycles of all frequency counters.
   for (FrequencyCounters::iterator i = frequency_counters_.begin();
        i != frequency_counters_.end(); ++i) {
     i->second->FlushFinishedCycles();
   }

   // Schedules a use monitor on inactive->active transitions and
   // unschedules it on active->inactive transitions.
   if (!user_active_ && active)
     ScheduleUseMonitor(kUseMonitorIntervalInit, /* backoff */ false);
   else if (user_active_ && !active)
     UnscheduleUseMonitor();

   // Remembers the current active state and the time of the last
   // activity update.
   user_active_ = active;
   user_active_last_ = now;
 }

 void MetricsDaemon::ProcessUserCrash() {
   // Counts the active use time up to now.
   SetUserActiveState(user_active_, Time::Now());

   // Reports the active use time since the last crash and resets it.
   user_crash_interval_->Flush();

   frequency_counters_[kMetricUserCrashesDailyName]->Update(1);
   frequency_counters_[kMetricUserCrashesWeeklyName]->Update(1);
   frequency_counters_[kMetricAnyCrashesDailyName]->Update(1);
   frequency_counters_[kMetricAnyCrashesWeeklyName]->Update(1);
 }

 void MetricsDaemon::ProcessKernelCrash() {
   // Counts the active use time up to now.
   SetUserActiveState(user_active_, Time::Now());

   // Reports the active use time since the last crash and resets it.
   kernel_crash_interval_->Flush();

   frequency_counters_[kMetricKernelCrashesDailyName]->Update(1);
   frequency_counters_[kMetricKernelCrashesWeeklyName]->Update(1);
   frequency_counters_[kMetricAnyCrashesDailyName]->Update(1);
   frequency_counters_[kMetricAnyCrashesWeeklyName]->Update(1);
 }

 void MetricsDaemon::ProcessUncleanShutdown() {
   // Counts the active use time up to now.
   SetUserActiveState(user_active_, Time::Now());

   // Reports the active use time since the last crash and resets it.
   unclean_shutdown_interval_->Flush();

   frequency_counters_[kMetricUncleanShutdownsDailyName]->Update(1);
   frequency_counters_[kMetricUncleanShutdownsWeeklyName]->Update(1);
   frequency_counters_[kMetricAnyCrashesDailyName]->Update(1);
   frequency_counters_[kMetricAnyCrashesWeeklyName]->Update(1);
 }

 bool MetricsDaemon::CheckSystemCrash(const string& crash_file) {
   FilePath crash_detected(crash_file);
   if (!file_util::PathExists(crash_detected))
     return false;

   // Deletes the crash-detected file so that the daemon doesn't report
   // another kernel crash in case it's restarted.
   file_util::Delete(crash_detected,
                     false);  // recursive
   return true;
 }

 // static
 gboolean MetricsDaemon::UseMonitorStatic(gpointer data) {
   return static_cast<MetricsDaemon*>(data)->UseMonitor() ? TRUE : FALSE;
 }

 bool MetricsDaemon::UseMonitor() {
   SetUserActiveState(user_active_, Time::Now());

   // If a new monitor source/instance is scheduled, returns false to
   // tell GLib to destroy this monitor source/instance. Returns true
   // otherwise to keep calling back this monitor.
   return !ScheduleUseMonitor(usemon_interval_ * 2, /* backoff */ true);
 }

 bool MetricsDaemon::ScheduleUseMonitor(int interval, bool backoff)
 {
   if (testing_)
     return false;

   // Caps the interval -- the bigger the interval, the more active use
   // time will be potentially dropped on system shutdown.
   if (interval > kUseMonitorIntervalMax)
     interval = kUseMonitorIntervalMax;

   if (backoff) {
     // Back-off mode is used by the use monitor to reschedule itself
     // with exponential back-off in time. This mode doesn't create a
     // new timeout source if the new interval is the same as the old
     // one. Also, if a new timeout source is created, the old one is
     // not destroyed explicitly here -- it will be destroyed by GLib
     // when the monitor returns FALSE (see UseMonitor and
     // UseMonitorStatic).
     if (interval == usemon_interval_)
       return false;
   } else {
     UnscheduleUseMonitor();
   }

   // Schedules a new use monitor for |interval| seconds from now.
   DLOG(INFO) << "scheduling use monitor in " << interval << " seconds";
   usemon_source_ = g_timeout_source_new_seconds(interval);
   g_source_set_callback(usemon_source_, UseMonitorStatic, this,
                         NULL); // No destroy notification.
   g_source_attach(usemon_source_,
                   NULL); // Default context.
   usemon_interval_ = interval;
   return true;
 }

 void MetricsDaemon::UnscheduleUseMonitor() {
   // If there's a use monitor scheduled already, destroys it.
   if (usemon_source_ == NULL)
     return;

   DLOG(INFO) << "destroying use monitor";
   g_source_destroy(usemon_source_);
   usemon_source_ = NULL;
   usemon_interval_ = 0;
 }

 void MetricsDaemon::StatsReporterInit() {
   DiskStatsReadStats(&read_sectors_, &write_sectors_);
   VmStatsReadStats(&page_faults_);
   // The first time around just run the long stat, so we don't delay boot.
   stats_state_ = kStatsLong;
   stats_initial_time_ = GetActiveTime();
   if (stats_initial_time_ < 0) {
     LOG(WARNING) << "not collecting disk stats";
   } else {
     ScheduleStatsCallback(kMetricStatsLongInterval);
   }
 }

 void MetricsDaemon::ScheduleStatsCallback(int wait) {
   if (testing_) {
     return;
   }
   g_timeout_add_seconds(wait, StatsCallbackStatic, this);
 }

 bool MetricsDaemon::DiskStatsReadStats(long int* read_sectors,
                                        long int* write_sectors) {
   int nchars;
   int nitems;
   bool success = false;
   char line[200];
   if (diskstats_path_.empty()) {
     return false;
   }
   int file = HANDLE_EINTR(open(diskstats_path_.c_str(), O_RDONLY));
   if (file < 0) {
     PLOG(WARNING) << "cannot open " << diskstats_path_;
     return false;
   }
   nchars = HANDLE_EINTR(read(file, line, sizeof(line)));
   if (nchars < 0) {
     PLOG(WARNING) << "cannot read from " << diskstats_path_;
     return false;
   } else {
     LOG_IF(WARNING, nchars == sizeof(line))
         << "line too long in " << diskstats_path_;
     line[nchars] = '\0';
     nitems = sscanf(line, "%*d %*d %ld %*d %*d %*d %ld",
                     read_sectors, write_sectors);
     if (nitems == 2) {
       success = true;
     } else {
       LOG(WARNING) << "found " << nitems << " items in "
                    << diskstats_path_ << ", expected 2";
     }
   }
   HANDLE_EINTR(close(file));
   return success;
 }

 bool MetricsDaemon::VmStatsParseStats(char* stats, long int* page_faults) {
   static const char kPageFaultSearchString[] = "\npgmajfault ";
   bool success = false;
   /* Each line in the file has the form
    * <ID> <VALUE>
    * for instance:
    * nr_free_pages 213427
    */
   char* s = strstr(stats, kPageFaultSearchString);
   if (s == NULL) {
     LOG(WARNING) << "cannot find page fault entry in vmstats";
   } else {
     char* endp;
     /* Skip <ID> and space.  Don't count the terminating null. */
     s += sizeof(kPageFaultSearchString) - 1;
     *page_faults = strtol(s, &endp, 10);
     if (*endp == '\n') {
       success = true;
     } else {
       LOG(WARNING) << "error parsing vmstats";
     }
   }
   return success;
 }

 bool MetricsDaemon::VmStatsReadStats(long int* page_faults) {
   char buffer[4000];
   int nchars;
   int success = false;
   if (testing_) {
     return false;
   }
   int file = HANDLE_EINTR(open(vmstats_path_.c_str(), O_RDONLY));
   if (file < 0) {
     PLOG(WARNING) << "cannot open " << vmstats_path_;
     return false;
   }
   nchars = HANDLE_EINTR(read(file, buffer, sizeof(buffer) - 1));
   LOG_IF(WARNING, nchars == sizeof(buffer) - 1)
       << "file too large in " << vmstats_path_;
   if (nchars < 0) {
     PLOG(WARNING) << "cannot read from " << vmstats_path_;
   } else if (nchars == 0) {
     LOG(WARNING) << vmstats_path_ << " is empty";
   } else {
     buffer[nchars] = '\0';
     success = VmStatsParseStats(buffer, page_faults);
   }
   HANDLE_EINTR(close(file));
   return success;
 }

 // static
 gboolean MetricsDaemon::StatsCallbackStatic(void* handle) {
   (static_cast<MetricsDaemon*>(handle))->StatsCallback();
   return false;  // one-time callback
 }

 // Collects disk and vm stats alternating over a short and a long interval.

 void MetricsDaemon::StatsCallback() {
   long int read_sectors_now, write_sectors_now, page_faults_now;
   double time_now = GetActiveTime();
   double delta_time = time_now - stats_initial_time_;
   if (testing_) {
     // Fake the time when testing.
     delta_time = stats_state_ == kStatsShort ?
         kMetricStatsShortInterval : kMetricStatsLongInterval;
   }
   bool diskstats_success = DiskStatsReadStats(&read_sectors_now,
                                               &write_sectors_now);
   int delta_read = read_sectors_now - read_sectors_;
   int delta_write = write_sectors_now - write_sectors_;
   int read_sectors_per_second = delta_read / delta_time;
   int write_sectors_per_second = delta_write / delta_time;
   bool vmstats_success = VmStatsReadStats(&page_faults_now);
   int delta_faults = page_faults_now - page_faults_;
   int page_faults_per_second = delta_faults / delta_time;

   switch (stats_state_) {
     case kStatsShort:
       if (diskstats_success) {
         SendMetric(kMetricReadSectorsShortName,
                    read_sectors_per_second,
                    1,
                    kMetricSectorsIOMax,
                    kMetricSectorsBuckets);
         SendMetric(kMetricWriteSectorsShortName,
                    write_sectors_per_second,
                    1,
                    kMetricSectorsIOMax,
                    kMetricSectorsBuckets);
       }
       if (vmstats_success) {
         SendMetric(kMetricPageFaultsShortName,
                    page_faults_per_second,
                    1,
                    kMetricPageFaultsMax,
                    kMetricPageFaultsBuckets);
       }
       // Schedule long callback.
       stats_state_ = kStatsLong;
       ScheduleStatsCallback(kMetricStatsLongInterval -
                             kMetricStatsShortInterval);
       break;
     case kStatsLong:
       if (diskstats_success) {
         SendMetric(kMetricReadSectorsLongName,
                    read_sectors_per_second,
                    1,
                    kMetricSectorsIOMax,
                    kMetricSectorsBuckets);
         SendMetric(kMetricWriteSectorsLongName,
                    write_sectors_per_second,
                    1,
                    kMetricSectorsIOMax,
                    kMetricSectorsBuckets);
         // Reset sector counters.
         read_sectors_ = read_sectors_now;
         write_sectors_ = write_sectors_now;
       }
       if (vmstats_success) {
         SendMetric(kMetricPageFaultsLongName,
                    page_faults_per_second,
                    1,
                    kMetricPageFaultsMax,
                    kMetricPageFaultsBuckets);
         page_faults_ = page_faults_now;
       }
       // Set start time for new cycle.
       stats_initial_time_ = time_now;
       // Schedule short callback.
       stats_state_ = kStatsShort;
       ScheduleStatsCallback(kMetricStatsShortInterval);
       break;
     default:
       LOG(FATAL) << "Invalid stats state";
   }
 }

 void MetricsDaemon::ScheduleMeminfoCallback(int wait) {
   if (testing_) {
     return;
   }
   g_timeout_add_seconds(wait, MeminfoCallbackStatic, this);
 }

 // static
 gboolean MetricsDaemon::MeminfoCallbackStatic(void* handle) {
   return (static_cast<MetricsDaemon*>(handle))->MeminfoCallback();
 }

 bool MetricsDaemon::MeminfoCallback() {
   string meminfo_raw;
   const FilePath meminfo_path("/proc/meminfo");
   if (!file_util::ReadFileToString(meminfo_path, &meminfo_raw)) {
     LOG(WARNING) << "cannot read " << meminfo_path.value().c_str();
     return false;
   }
   return ProcessMeminfo(meminfo_raw);
 }

 bool MetricsDaemon::ProcessMeminfo(const string& meminfo_raw) {
   static const MeminfoRecord fields_array[] = {
     { "MemTotal", "MemTotal" },  // SPECIAL CASE: total system memory
     { "MemFree", "MemFree" },
     { "Buffers", "Buffers" },
     { "Cached", "Cached" },
     // { "SwapCached", "SwapCached" },
     { "Active", "Active" },
     { "Inactive", "Inactive" },
     { "ActiveAnon", "Active(anon)" },
     { "InactiveAnon", "Inactive(anon)" },
     { "ActiveFile" , "Active(file)" },
     { "InactiveFile", "Inactive(file)" },
     { "Unevictable", "Unevictable", kMeminfoOp_HistLog },
     // { "Mlocked", "Mlocked" },
     { "SwapTotal", "SwapTotal", kMeminfoOp_SwapTotal },
     { "SwapFree", "SwapFree", kMeminfoOp_SwapFree },
     // { "Dirty", "Dirty" },
     // { "Writeback", "Writeback" },
     { "AnonPages", "AnonPages" },
     { "Mapped", "Mapped" },
     { "Shmem", "Shmem", kMeminfoOp_HistLog },
     { "Slab", "Slab", kMeminfoOp_HistLog },
     // { "SReclaimable", "SReclaimable" },
     // { "SUnreclaim", "SUnreclaim" },
   };
   vector<MeminfoRecord> fields(fields_array,
                                fields_array + arraysize(fields_array));
   if (!FillMeminfo(meminfo_raw, &fields)) {
     return false;
   }
   int total_memory = fields[0].value;
   if (total_memory == 0) {
     // this "cannot happen"
     LOG(WARNING) << "borked meminfo parser";
     return false;
   }
   int swap_total = 0;
   int swap_free = 0;
   // Send all fields retrieved, except total memory.
   for (unsigned int i = 1; i < fields.size(); i++) {
     string metrics_name = StringPrintf("Platform.Meminfo%s", fields[i].name);
     int percent;
     switch (fields[i].op) {
       case kMeminfoOp_HistPercent:
         // report value as percent of total memory
         percent = fields[i].value * 100 / total_memory;
         SendLinearMetric(metrics_name, percent, 100, 101);
         break;
       case kMeminfoOp_HistLog:
         // report value in kbytes, log scale, 4Gb max
         SendMetric(metrics_name, fields[i].value, 1, 4 * 1000 * 1000, 100);
         break;
       case kMeminfoOp_SwapTotal:
         swap_total = fields[i].value;
       case kMeminfoOp_SwapFree:
         swap_free = fields[i].value;
         break;
     }
   }
   if (swap_total > 0) {
     int swap_used = swap_total - swap_free;
     int swap_used_percent = swap_used * 100 / swap_total;
     SendMetric("Platform.MeminfoSwapUsed", swap_used, 1, 8 * 1000 * 1000, 100);
     SendLinearMetric("Platform.MeminfoSwapUsedPercent", swap_used_percent,
                      100, 101);
   }
   return true;
 }

 bool MetricsDaemon::FillMeminfo(const string& meminfo_raw,
                                 vector<MeminfoRecord>* fields) {
   vector<string> lines;
   unsigned int nlines = Tokenize(meminfo_raw, "\n", &lines);

   // Scan meminfo output and collect field values.  Each field name has to
   // match a meminfo entry (case insensitive) after removing non-alpha
   // characters from the entry.
   unsigned int ifield = 0;
   for (unsigned int iline = 0;
        iline < nlines && ifield < fields->size();
        iline++) {
     vector<string> tokens;
     Tokenize(lines[iline], ": ", &tokens);
     if (strcmp((*fields)[ifield].match, tokens[0].c_str()) == 0) {
       // Name matches. Parse value and save.
       char* rest;
       (*fields)[ifield].value =
           static_cast<int>(strtol(tokens[1].c_str(), &rest, 10));
       if (*rest != '\0') {
         LOG(WARNING) << "missing meminfo value";
         return false;
       }
       ifield++;
     }
   }
   if (ifield < fields->size()) {
     // End of input reached while scanning.
     LOG(WARNING) << "cannot find field " << (*fields)[ifield].match
                  << " and following";
     return false;
   }
   return true;
 }

 void MetricsDaemon::ScheduleMemuseCallback(bool new_callback,
                                            double time_elapsed) {
   if (testing_) {
     return;
   }
   int interval = kMemuseIntervals[memuse_interval_index_];
   int wait;
   if (new_callback) {
     memuse_initial_time_ = GetActiveTime();
     wait = interval;
   } else {
     wait = ceil(interval - time_elapsed);  // round up
   }
   g_timeout_add_seconds(wait, MemuseCallbackStatic, this);
 }

 // static
 gboolean MetricsDaemon::MemuseCallbackStatic(void* handle) {
   MetricsDaemon* daemon = static_cast<MetricsDaemon*>(handle);
   daemon->MemuseCallback();
   return false;
 }

 void MetricsDaemon::MemuseCallback() {
   // Since we only care about active time (i.e. uptime minus sleep time) but
   // the callbacks are driven by real time (uptime), we check if we should
   // reschedule this callback due to intervening sleep periods.
   double now = GetActiveTime();
   double active_time = now - memuse_initial_time_;
   if (active_time < kMemuseIntervals[memuse_interval_index_]) {
     // Not enough active time has passed.  Reschedule the callback.
     ScheduleMemuseCallback(false, active_time);
   } else {
     // Enough active time has passed.  Do the work, and (if we succeed) see if
     // we need to do more.
     if (MemuseCallbackWork() &&
         memuse_interval_index_ < arraysize(kMemuseIntervals)) {
       memuse_interval_index_++;
       ScheduleMemuseCallback(true, 0);
     }
   }
 }

 bool MetricsDaemon::MemuseCallbackWork() {
   string meminfo_raw;
   const FilePath meminfo_path("/proc/meminfo");
   if (!file_util::ReadFileToString(meminfo_path, &meminfo_raw)) {
     LOG(WARNING) << "cannot read " << meminfo_path.value().c_str();
     return false;
   }
   return ProcessMemuse(meminfo_raw);
 }

 bool MetricsDaemon::ProcessMemuse(const string& meminfo_raw) {
   static const MeminfoRecord fields_array[] = {
     { "MemTotal", "MemTotal" },  // SPECIAL CASE: total system memory
     { "ActiveAnon", "Active(anon)" },
     { "InactiveAnon", "Inactive(anon)" },
   };
   vector<MeminfoRecord> fields(fields_array,
                                fields_array + arraysize(fields_array));
   if (!FillMeminfo(meminfo_raw, &fields)) {
     return false;
   }
   int total = fields[0].value;
   int active_anon = fields[1].value;
   int inactive_anon = fields[2].value;
   if (total == 0) {
     // this "cannot happen"
     LOG(WARNING) << "borked meminfo parser";
     return false;
   }
   string metrics_name = StringPrintf("Platform.MemuseAnon%d",
                                      memuse_interval_index_);
   SendLinearMetric(metrics_name, (active_anon + inactive_anon) * 100 / total,
                    100, 101);
   return true;
 }

 // static
 void MetricsDaemon::ReportDailyUse(void* handle, int tag, int count) {
   if (count <= 0)
     return;

   MetricsDaemon* daemon = static_cast<MetricsDaemon*>(handle);
   int minutes = (count + kSecondsPerMinute / 2) / kSecondsPerMinute;
   daemon->SendMetric(kMetricDailyUseTimeName, minutes,
                      kMetricDailyUseTimeMin,
                      kMetricDailyUseTimeMax,
                      kMetricDailyUseTimeBuckets);
 }

 void MetricsDaemon::SendMetric(const string& name, int sample,
                                int min, int max, int nbuckets) {
   DLOG(INFO) << "received metric: " << name << " " << sample << " "
              << min << " " << max << " " << nbuckets;
   metrics_lib_->SendToUMA(name, sample, min, max, nbuckets);
 }

 void MetricsDaemon::SendLinearMetric(const string& name, int sample,
                                      int max, int nbuckets) {
   DLOG(INFO) << "received linear metric: " << name << " " << sample << " "
              << max << " " << nbuckets;
   // TODO(semenzato): add a proper linear histogram to the Chrome external
   // metrics API.
   LOG_IF(FATAL, nbuckets != max + 1) << "unsupported histogram scale";
   metrics_lib_->SendEnumToUMA(name, sample, max);
 }