// Copyright 2014 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "components/metrics/persisted_logs.h" #include #include #include #include "base/base64.h" #include "base/md5.h" #include "base/metrics/histogram_macros.h" #include "base/sha1.h" #include "base/strings/string_number_conversions.h" #include "base/timer/elapsed_timer.h" #include "components/metrics/persisted_logs_metrics.h" #include "components/prefs/pref_service.h" #include "components/prefs/scoped_user_pref_update.h" #include "third_party/zlib/google/compression_utils.h" namespace metrics { namespace { const char kLogHashKey[] = "hash"; const char kLogTimestampKey[] = "timestamp"; const char kLogDataKey[] = "data"; std::string EncodeToBase64(const std::string& to_convert) { // CHECK to diagnose crbug.com/695433 CHECK(to_convert.data()); std::string base64_result; base::Base64Encode(to_convert, &base64_result); return base64_result; } std::string DecodeFromBase64(const std::string& to_convert) { std::string result; base::Base64Decode(to_convert, &result); return result; } } // namespace void PersistedLogs::LogInfo::Init(PersistedLogsMetrics* metrics, const std::string& log_data, const std::string& log_timestamp) { DCHECK(!log_data.empty()); if (!compression::GzipCompress(log_data, &compressed_log_data)) { NOTREACHED(); return; } metrics->RecordCompressionRatio(compressed_log_data.size(), log_data.size()); hash = base::SHA1HashString(log_data); timestamp = log_timestamp; } PersistedLogs::PersistedLogs(std::unique_ptr metrics, PrefService* local_state, const char* pref_name, size_t min_log_count, size_t min_log_bytes, size_t max_log_size) : metrics_(std::move(metrics)), local_state_(local_state), pref_name_(pref_name), min_log_count_(min_log_count), min_log_bytes_(min_log_bytes), max_log_size_(max_log_size != 0 ? max_log_size : static_cast(-1)), staged_log_index_(-1) { DCHECK(local_state_); // One of the limit arguments must be non-zero. DCHECK(min_log_count_ > 0 || min_log_bytes_ > 0); } PersistedLogs::~PersistedLogs() {} bool PersistedLogs::has_unsent_logs() const { return !!size(); } // True if a log has been staged. bool PersistedLogs::has_staged_log() const { return staged_log_index_ != -1; } // Returns the element in the front of the list. const std::string& PersistedLogs::staged_log() const { DCHECK(has_staged_log()); return list_[staged_log_index_].compressed_log_data; } // Returns the element in the front of the list. const std::string& PersistedLogs::staged_log_hash() const { DCHECK(has_staged_log()); return list_[staged_log_index_].hash; } // Returns the timestamp of the element in the front of the list. const std::string& PersistedLogs::staged_log_timestamp() const { DCHECK(has_staged_log()); return list_[staged_log_index_].timestamp; } void PersistedLogs::StageNextLog() { // CHECK, rather than DCHECK, because swap()ing with an empty list causes // hard-to-identify crashes much later. CHECK(!list_.empty()); DCHECK(!has_staged_log()); staged_log_index_ = list_.size() - 1; DCHECK(has_staged_log()); } void PersistedLogs::DiscardStagedLog() { // CHECK, rather than DCHECK, to diagnose cause of crashes from the field, // for crbug.com/695433. CHECK(has_staged_log()); DCHECK_LT(static_cast(staged_log_index_), list_.size()); list_.erase(list_.begin() + staged_log_index_); staged_log_index_ = -1; } void PersistedLogs::PersistUnsentLogs() const { ListPrefUpdate update(local_state_, pref_name_); WriteLogsToPrefList(update.Get()); } void PersistedLogs::LoadPersistedUnsentLogs() { ReadLogsFromPrefList(*local_state_->GetList(pref_name_)); } void PersistedLogs::StoreLog(const std::string& log_data) { list_.push_back(LogInfo()); list_.back().Init(metrics_.get(), log_data, base::Int64ToString(base::Time::Now().ToTimeT())); } void PersistedLogs::Purge() { if (has_staged_log()) { DiscardStagedLog(); } list_.clear(); local_state_->ClearPref(pref_name_); } void PersistedLogs::ReadLogsFromPrefList(const base::ListValue& list_value) { if (list_value.empty()) { metrics_->RecordLogReadStatus(PersistedLogsMetrics::LIST_EMPTY); return; } const size_t log_count = list_value.GetSize(); DCHECK(list_.empty()); list_.resize(log_count); for (size_t i = 0; i < log_count; ++i) { const base::DictionaryValue* dict; if (!list_value.GetDictionary(i, &dict) || !dict->GetString(kLogDataKey, &list_[i].compressed_log_data) || !dict->GetString(kLogHashKey, &list_[i].hash)) { list_.clear(); metrics_->RecordLogReadStatus( PersistedLogsMetrics::LOG_STRING_CORRUPTION); return; } list_[i].compressed_log_data = DecodeFromBase64(list_[i].compressed_log_data); list_[i].hash = DecodeFromBase64(list_[i].hash); // Ignoring the success of this step as timestamp might not be there for // older logs. // NOTE: Should be added to the check with other fields once migration is // over. dict->GetString(kLogTimestampKey, &list_[i].timestamp); } metrics_->RecordLogReadStatus(PersistedLogsMetrics::RECALL_SUCCESS); } void PersistedLogs::WriteLogsToPrefList(base::ListValue* list_value) const { list_value->Clear(); // Keep the most recent logs which are smaller than |max_log_size_|. // We keep at least |min_log_bytes_| and |min_log_count_| of logs before // discarding older logs. size_t start = list_.size(); size_t saved_log_count = 0; size_t bytes_used = 0; for (; start > 0; --start) { size_t log_size = list_[start - 1].compressed_log_data.length(); if (bytes_used >= min_log_bytes_ && saved_log_count >= min_log_count_) { break; } // Oversized logs won't be persisted, so don't count them. if (log_size > max_log_size_) continue; bytes_used += log_size; ++saved_log_count; } int dropped_logs_num = start - 1; for (size_t i = start; i < list_.size(); ++i) { size_t log_size = list_[i].compressed_log_data.length(); if (log_size > max_log_size_) { metrics_->RecordDroppedLogSize(log_size); dropped_logs_num++; continue; } std::unique_ptr dict_value( new base::DictionaryValue); dict_value->SetString(kLogHashKey, EncodeToBase64(list_[i].hash)); dict_value->SetString(kLogDataKey, EncodeToBase64(list_[i].compressed_log_data)); dict_value->SetString(kLogTimestampKey, list_[i].timestamp); list_value->Append(std::move(dict_value)); } if (dropped_logs_num > 0) metrics_->RecordDroppedLogsNum(dropped_logs_num); } } // namespace metrics