// Copyright 2014 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "components/metrics/metrics_state_manager.h" #include #include #include #include #include #include "base/guid.h" #include "base/metrics/histogram_functions.h" #include "base/metrics/histogram_macros.h" #include "base/numerics/safe_conversions.h" #include "base/rand_util.h" #include "base/strings/string_number_conversions.h" #include "base/threading/thread_restrictions.h" #include "base/time/time.h" #include "build/build_config.h" #include "components/metrics/cloned_install_detector.h" #include "components/metrics/enabled_state_provider.h" #include "components/metrics/entropy_state.h" #include "components/metrics/metrics_log.h" #include "components/metrics/metrics_pref_names.h" #include "components/metrics/metrics_provider.h" #include "components/metrics/metrics_switches.h" #include "components/prefs/pref_registry_simple.h" #include "components/prefs/pref_service.h" #include "components/variations/entropy_provider.h" #include "components/variations/pref_names.h" #include "third_party/metrics_proto/chrome_user_metrics_extension.pb.h" #include "third_party/metrics_proto/system_profile.pb.h" namespace metrics { namespace { // The argument used to generate a non-identifying entropy source. We want no // more than 13 bits of entropy, so use this max to return a number in the range // [0, 7999] as the entropy source (12.97 bits of entropy). const int kThisMaxLowEntropySize = 8000; int64_t ReadEnabledDate(PrefService* local_state) { return local_state->GetInt64(prefs::kMetricsReportingEnabledTimestamp); } int64_t ReadInstallDate(PrefService* local_state) { return local_state->GetInt64(prefs::kInstallDate); } std::string ReadClientId(PrefService* local_state) { return local_state->GetString(prefs::kMetricsClientID); } // Round a timestamp measured in seconds since epoch to one with a granularity // of an hour. This can be used before uploaded potentially sensitive // timestamps. int64_t RoundSecondsToHour(int64_t time_in_seconds) { return 3600 * (time_in_seconds / 3600); } // Records the cloned install histogram. void LogClonedInstall() { // Equivalent to UMA_HISTOGRAM_BOOLEAN with the stability flag set. UMA_STABILITY_HISTOGRAM_ENUMERATION("UMA.IsClonedInstall", 1, 2); } class MetricsStateMetricsProvider : public MetricsProvider { public: MetricsStateMetricsProvider( PrefService* local_state, bool metrics_ids_were_reset, std::string previous_client_id, std::string initial_client_id, ClonedInstallDetector const& cloned_install_detector) : local_state_(local_state), metrics_ids_were_reset_(metrics_ids_were_reset), previous_client_id_(std::move(previous_client_id)), initial_client_id_(std::move(initial_client_id)), cloned_install_detector_(cloned_install_detector) {} // MetricsProvider: void ProvideSystemProfileMetrics( SystemProfileProto* system_profile) override { system_profile->set_uma_enabled_date( RoundSecondsToHour(ReadEnabledDate(local_state_))); system_profile->set_install_date( RoundSecondsToHour(ReadInstallDate(local_state_))); // Client id in the log shouldn't be different than the |local_state_| one // except when the client disabled UMA before we populate this field to the // log. If that's the case, the client id in the |local_state_| should be // empty and we should set |client_id_was_used_for_trial_assignment| to // false. std::string client_id = ReadClientId(local_state_); system_profile->set_client_id_was_used_for_trial_assignment( !client_id.empty() && client_id == initial_client_id_); } void ProvidePreviousSessionData( ChromeUserMetricsExtension* uma_proto) override { if (metrics_ids_were_reset_) { LogClonedInstall(); if (!previous_client_id_.empty()) { // If we know the previous client id, overwrite the client id for the // previous session log so the log contains the client id at the time // of the previous session. This allows better attribution of crashes // to earlier behavior. If the previous client id is unknown, leave // the current client id. uma_proto->set_client_id(MetricsLog::Hash(previous_client_id_)); } } } void ProvideCurrentSessionData( ChromeUserMetricsExtension* uma_proto) override { if (cloned_install_detector_.ClonedInstallDetectedInCurrentSession()) LogClonedInstall(); } private: PrefService* const local_state_; const bool metrics_ids_were_reset_; // |previous_client_id_| is set only (if known) when |metrics_ids_were_reset_| const std::string previous_client_id_; // The client id that was used to randomize field trials. An empty string if // the low entropy source was used to do randomization. const std::string initial_client_id_; const ClonedInstallDetector& cloned_install_detector_; DISALLOW_COPY_AND_ASSIGN(MetricsStateMetricsProvider); }; } // namespace // static bool MetricsStateManager::instance_exists_ = false; MetricsStateManager::MetricsStateManager( PrefService* local_state, EnabledStateProvider* enabled_state_provider, const base::string16& backup_registry_key, StoreClientInfoCallback store_client_info, LoadClientInfoCallback retrieve_client_info) : local_state_(local_state), enabled_state_provider_(enabled_state_provider), store_client_info_(std::move(store_client_info)), load_client_info_(std::move(retrieve_client_info)), clean_exit_beacon_(backup_registry_key, local_state), entropy_state_(local_state), entropy_source_returned_(ENTROPY_SOURCE_NONE), metrics_ids_were_reset_(false) { ResetMetricsIDsIfNecessary(); bool is_first_run = false; int64_t install_date = local_state_->GetInt64(prefs::kInstallDate); // Set the install date if this is our first run. if (install_date == 0) { local_state_->SetInt64(prefs::kInstallDate, base::Time::Now().ToTimeT()); is_first_run = true; } if (enabled_state_provider_->IsConsentGiven()) ForceClientIdCreation(); #if !defined(OS_WIN) if (is_first_run) { // If this is a first run (no install date) and there's no client id, then // generate a provisional client id now. This id will be used for field // trial randomization on first run and will be promoted to become the // client id if UMA is enabled during this session, via the logic in // ForceClientIdCreation(). // // Note: We don't do this on Windows because on Windows, there's no UMA // checkbox on first run and instead it comes from the install page. So if // UMA is not enabled at this point, it's unlikely it will be enabled in // the same session since that requires the user to manually do that via // settings page after they unchecked it on the download page. // // Note: Windows first run is covered by browser tests // FirstRunMasterPrefsVariationsSeedTest.PRE_SecondRun and // FirstRunMasterPrefsVariationsSeedTest.SecondRun. If the platform ifdef // for this logic changes, the tests should be updated as well. if (client_id_.empty()) provisional_client_id_ = base::GenerateGUID(); } #endif // !defined(OS_WIN) // The |initial_client_id_| should only be set if UMA is enabled or there's a // provisional client id. initial_client_id_ = (client_id_.empty() ? provisional_client_id_ : client_id_); DCHECK(!instance_exists_); instance_exists_ = true; } MetricsStateManager::~MetricsStateManager() { DCHECK(instance_exists_); instance_exists_ = false; } std::unique_ptr MetricsStateManager::GetProvider() { return std::make_unique( local_state_, metrics_ids_were_reset_, previous_client_id_, initial_client_id_, cloned_install_detector_); } bool MetricsStateManager::IsMetricsReportingEnabled() { return enabled_state_provider_->IsReportingEnabled(); } int64_t MetricsStateManager::GetInstallDate() const { return ReadInstallDate(local_state_); } int MetricsStateManager::GetLowEntropySource() { return entropy_state_.GetLowEntropySource(); } void MetricsStateManager::ForceClientIdCreation() { // TODO(asvitkine): Ideally, all tests would actually set up consent properly, // so the command-line check wouldn't be needed here. // Currently, kForceEnableMetricsReporting is used by Java UkmTest and // kMetricsRecordingOnly is used by Chromedriver tests. DCHECK(enabled_state_provider_->IsConsentGiven() || base::CommandLine::ForCurrentProcess()->HasSwitch( switches::kForceEnableMetricsReporting) || base::CommandLine::ForCurrentProcess()->HasSwitch( switches::kMetricsRecordingOnly)); { std::string client_id_from_prefs = ReadClientId(local_state_); // If client id in prefs matches the cached copy, return early. if (!client_id_from_prefs.empty() && client_id_from_prefs == client_id_) return; client_id_.swap(client_id_from_prefs); } if (!client_id_.empty()) return; const std::unique_ptr client_info_backup = LoadClientInfo(); if (client_info_backup) { client_id_ = client_info_backup->client_id; const base::Time now = base::Time::Now(); // Save the recovered client id and also try to reinstantiate the backup // values for the dates corresponding with that client id in order to avoid // weird scenarios where we could report an old client id with a recent // install date. local_state_->SetString(prefs::kMetricsClientID, client_id_); local_state_->SetInt64(prefs::kInstallDate, client_info_backup->installation_date != 0 ? client_info_backup->installation_date : now.ToTimeT()); local_state_->SetInt64(prefs::kMetricsReportingEnabledTimestamp, client_info_backup->reporting_enabled_date != 0 ? client_info_backup->reporting_enabled_date : now.ToTimeT()); base::TimeDelta recovered_installation_age; if (client_info_backup->installation_date != 0) { recovered_installation_age = now - base::Time::FromTimeT(client_info_backup->installation_date); } UMA_HISTOGRAM_COUNTS_10000("UMA.ClientIdBackupRecoveredWithAge", recovered_installation_age.InHours()); // Flush the backup back to persistent storage in case we re-generated // missing data above. BackUpCurrentClientInfo(); return; } // If we're here, there was no client ID yet (either in prefs or backup), // so generate a new one. If there's a provisional client id (e.g. UMA // was enabled as part of first run), promote that to the client id, // otherwise (e.g. UMA enabled in a future session), generate a new one. if (provisional_client_id_.empty()) { client_id_ = base::GenerateGUID(); } else { client_id_ = provisional_client_id_; provisional_client_id_.clear(); } local_state_->SetString(prefs::kMetricsClientID, client_id_); // Record the timestamp of when the user opted in to UMA. local_state_->SetInt64(prefs::kMetricsReportingEnabledTimestamp, base::Time::Now().ToTimeT()); BackUpCurrentClientInfo(); } void MetricsStateManager::CheckForClonedInstall() { cloned_install_detector_.CheckForClonedInstall(local_state_); } bool MetricsStateManager::ShouldResetClientIdsOnClonedInstall() { return cloned_install_detector_.ShouldResetClientIds(local_state_); } std::unique_ptr MetricsStateManager::CreateDefaultEntropyProvider() { // Note: the |initial_client_id_| should not be empty iff we have client's // consent on enabling UMA on startup or we have the |provisional_client_id_| // for the first run. if (!initial_client_id_.empty()) { UpdateEntropySourceReturnedValue(ENTROPY_SOURCE_HIGH); return std::make_unique( GetHighEntropySource()); } UpdateEntropySourceReturnedValue(ENTROPY_SOURCE_LOW); return CreateLowEntropyProvider(); } std::unique_ptr MetricsStateManager::CreateLowEntropyProvider() { int source = GetLowEntropySource(); return std::make_unique( base::checked_cast(source), kThisMaxLowEntropySize); } // static std::unique_ptr MetricsStateManager::Create( PrefService* local_state, EnabledStateProvider* enabled_state_provider, const base::string16& backup_registry_key, StoreClientInfoCallback store_client_info, LoadClientInfoCallback retrieve_client_info) { std::unique_ptr result; // Note: |instance_exists_| is updated in the constructor and destructor. if (!instance_exists_) { result.reset(new MetricsStateManager( local_state, enabled_state_provider, backup_registry_key, std::move(store_client_info), std::move(retrieve_client_info))); } return result; } // static void MetricsStateManager::RegisterPrefs(PrefRegistrySimple* registry) { registry->RegisterStringPref(prefs::kMetricsClientID, std::string()); registry->RegisterInt64Pref(prefs::kMetricsReportingEnabledTimestamp, 0); registry->RegisterInt64Pref(prefs::kInstallDate, 0); EntropyState::RegisterPrefs(registry); ClonedInstallDetector::RegisterPrefs(registry); } void MetricsStateManager::BackUpCurrentClientInfo() { ClientInfo client_info; client_info.client_id = client_id_; client_info.installation_date = ReadInstallDate(local_state_); client_info.reporting_enabled_date = ReadEnabledDate(local_state_); store_client_info_.Run(client_info); } std::unique_ptr MetricsStateManager::LoadClientInfo() { std::unique_ptr client_info = load_client_info_.Run(); // The GUID retrieved should be valid unless retrieval failed. // If not, return nullptr. This will result in a new GUID being generated by // the calling function ForceClientIdCreation(). if (client_info && !base::IsValidGUID(client_info->client_id)) return nullptr; return client_info; } std::string MetricsStateManager::GetHighEntropySource() { // This should only be called if the |initial_client_id_| is not empty. The // user shouldn't be able to enable UMA between the constructor and calling // this, because field trial setup happens at Chrome initialization. DCHECK(!initial_client_id_.empty()); return entropy_state_.GetHighEntropySource(initial_client_id_); } int MetricsStateManager::GetOldLowEntropySource() { return entropy_state_.GetOldLowEntropySource(); } void MetricsStateManager::UpdateEntropySourceReturnedValue( EntropySourceType type) { if (entropy_source_returned_ != ENTROPY_SOURCE_NONE) return; entropy_source_returned_ = type; UMA_HISTOGRAM_ENUMERATION("UMA.EntropySourceType", type, ENTROPY_SOURCE_ENUM_SIZE); } void MetricsStateManager::ResetMetricsIDsIfNecessary() { if (!ShouldResetClientIdsOnClonedInstall()) return; metrics_ids_were_reset_ = true; previous_client_id_ = ReadClientId(local_state_); UMA_HISTOGRAM_BOOLEAN("UMA.MetricsIDsReset", true); DCHECK(client_id_.empty()); local_state_->ClearPref(prefs::kMetricsClientID); EntropyState::ClearPrefs(local_state_); // Also clear the backed up client info. store_client_info_.Run(ClientInfo()); } } // namespace metrics