// blob: 74d1ca71d4ccf95bdc7265235a4b28099f32dfb3 [file] [log] [blame]
// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "components/metrics/persisted_logs.h"
#include <memory>
#include <string>
#include <utility>
#include "base/base64.h"
#include "base/md5.h"
#include "base/metrics/histogram_macros.h"
#include "base/sha1.h"
#include "base/strings/string_number_conversions.h"
#include "base/timer/elapsed_timer.h"
#include "components/metrics/persisted_logs_metrics.h"
#include "components/prefs/pref_service.h"
#include "components/prefs/scoped_user_pref_update.h"
#include "third_party/zlib/google/compression_utils.h"
namespace metrics {
namespace {
// Dictionary keys under which the fields of each persisted log entry are
// stored in the pref list.
constexpr char kLogHashKey[] = "hash";
constexpr char kLogTimestampKey[] = "timestamp";
constexpr char kLogDataKey[] = "data";
// Returns the Base64 encoding of |to_convert|.
std::string EncodeToBase64(const std::string& to_convert) {
  // CHECK to diagnose crbug.com/695433
  CHECK(to_convert.data());

  std::string encoded;
  base::Base64Encode(to_convert, &encoded);
  return encoded;
}
// Returns the Base64 decoding of |to_convert|. The success status reported by
// base::Base64Decode() is deliberately not inspected; the caller receives
// whatever the decoder left in the output string.
std::string DecodeFromBase64(const std::string& to_convert) {
  std::string decoded;
  base::Base64Decode(to_convert, &decoded);
  return decoded;
}
} // namespace
// Populates this entry from an uncompressed log.
//   metrics:       receives the compression-ratio sample.
//   log_data:      uncompressed log contents; must not be empty.
//   log_timestamp: timestamp string stored verbatim alongside the log.
// On compression failure the entry's hash and timestamp are left untouched.
void PersistedLogs::LogInfo::Init(PersistedLogsMetrics* metrics,
                                  const std::string& log_data,
                                  const std::string& log_timestamp) {
  DCHECK(!log_data.empty());

  const bool compressed_ok =
      compression::GzipCompress(log_data, &compressed_log_data);
  if (!compressed_ok) {
    NOTREACHED();
    return;
  }

  metrics->RecordCompressionRatio(compressed_log_data.size(), log_data.size());

  // The hash is computed over the uncompressed data, not the gzip output.
  hash = base::SHA1HashString(log_data);
  timestamp = log_timestamp;
}
// Constructs a log store backed by the list pref |pref_name| in
// |local_state|.
//   metrics:       takes ownership of the metrics recorder.
//   min_log_count: minimum number of logs to keep when persisting.
//   min_log_bytes: minimum number of bytes of logs to keep when persisting.
//   max_log_size:  logs larger than this are not persisted; 0 means no limit
//                  (stored as the largest size_t value).
// At least one of |min_log_count| and |min_log_bytes| must be non-zero.
PersistedLogs::PersistedLogs(std::unique_ptr<PersistedLogsMetrics> metrics,
                             PrefService* local_state,
                             const char* pref_name,
                             size_t min_log_count,
                             size_t min_log_bytes,
                             size_t max_log_size)
    : metrics_(std::move(metrics)),
      local_state_(local_state),
      pref_name_(pref_name),
      min_log_count_(min_log_count),
      min_log_bytes_(min_log_bytes),
      max_log_size_(max_log_size == 0 ? static_cast<size_t>(-1)
                                      : max_log_size),
      staged_log_index_(-1) {
  DCHECK(local_state_);
  // Both limits being zero at once is not a valid configuration.
  DCHECK(!(min_log_count_ == 0 && min_log_bytes_ == 0));
}
// Nothing to release explicitly; members clean up after themselves.
PersistedLogs::~PersistedLogs() = default;
// True if size() reports at least one log.
bool PersistedLogs::has_unsent_logs() const {
  return size() != 0;
}
// True if a log is currently staged. An index of -1 is the "nothing staged"
// sentinel.
bool PersistedLogs::has_staged_log() const {
  const bool nothing_staged = (staged_log_index_ == -1);
  return !nothing_staged;
}
// Returns the compressed data of the currently staged log. A log must be
// staged before calling this.
const std::string& PersistedLogs::staged_log() const {
  DCHECK(has_staged_log());
  const auto& staged_entry = list_[staged_log_index_];
  return staged_entry.compressed_log_data;
}
// Returns the hash of the currently staged log. A log must be staged before
// calling this.
const std::string& PersistedLogs::staged_log_hash() const {
  DCHECK(has_staged_log());
  const auto& staged_entry = list_[staged_log_index_];
  return staged_entry.hash;
}
// Returns the timestamp string of the currently staged log. A log must be
// staged before calling this.
const std::string& PersistedLogs::staged_log_timestamp() const {
  DCHECK(has_staged_log());
  const auto& staged_entry = list_[staged_log_index_];
  return staged_entry.timestamp;
}
// Stages the last log in the list. There must be at least one log and no log
// may already be staged.
void PersistedLogs::StageNextLog() {
  // CHECK, rather than DCHECK, so that staging with no logs fails right here
  // instead of surfacing as a hard-to-identify crash much later.
  CHECK(!list_.empty());
  DCHECK(!has_staged_log());

  const size_t last_index = list_.size() - 1;
  staged_log_index_ = last_index;

  DCHECK(has_staged_log());
}
// Removes the currently staged log from the list and resets the staged index
// to the "nothing staged" sentinel (-1).
void PersistedLogs::DiscardStagedLog() {
  // CHECK, rather than DCHECK, to diagnose cause of crashes from the field,
  // for crbug.com/695433.
  CHECK(has_staged_log());
  DCHECK_LT(static_cast<size_t>(staged_log_index_), list_.size());

  const auto staged_position = list_.begin() + staged_log_index_;
  list_.erase(staged_position);
  staged_log_index_ = -1;
}
void PersistedLogs::PersistUnsentLogs() const {
ListPrefUpdate update(local_state_, pref_name_);
WriteLogsToPrefList(update.Get());
}
void PersistedLogs::LoadPersistedUnsentLogs() {
ReadLogsFromPrefList(*local_state_->GetList(pref_name_));
}
// Appends a new entry built from |log_data| to the end of the list, stamped
// with the current time (seconds as returned by ToTimeT(), formatted as a
// decimal string).
void PersistedLogs::StoreLog(const std::string& log_data) {
  list_.emplace_back();
  const std::string now_timestamp =
      base::Int64ToString(base::Time::Now().ToTimeT());
  list_.back().Init(metrics_.get(), log_data, now_timestamp);
}
// Drops every log held in memory (including a staged one, if any) and clears
// the backing pref.
void PersistedLogs::Purge() {
  // Discard through the regular path first so the staged index is reset.
  if (has_staged_log())
    DiscardStagedLog();

  list_.clear();
  local_state_->ClearPref(pref_name_);
}
// Fills |list_| from |list_value|, where each element is expected to be a
// dictionary holding Base64-encoded "data" and "hash" strings and, optionally,
// a "timestamp" string. Records the outcome through |metrics_|:
//   LIST_EMPTY            - |list_value| has no entries; |list_| is untouched.
//   LOG_STRING_CORRUPTION - an entry is not a dictionary or lacks data/hash;
//                           |list_| is emptied.
//   RECALL_SUCCESS        - every entry was read.
void PersistedLogs::ReadLogsFromPrefList(const base::ListValue& list_value) {
  if (list_value.empty()) {
    metrics_->RecordLogReadStatus(PersistedLogsMetrics::LIST_EMPTY);
    return;
  }

  const size_t entry_count = list_value.GetSize();
  DCHECK(list_.empty());
  list_.resize(entry_count);

  for (size_t index = 0; index < entry_count; ++index) {
    auto& entry = list_[index];

    const base::DictionaryValue* fields = nullptr;
    const bool has_required_fields =
        list_value.GetDictionary(index, &fields) &&
        fields->GetString(kLogDataKey, &entry.compressed_log_data) &&
        fields->GetString(kLogHashKey, &entry.hash);
    if (!has_required_fields) {
      // A single bad entry invalidates everything read so far.
      list_.clear();
      metrics_->RecordLogReadStatus(
          PersistedLogsMetrics::LOG_STRING_CORRUPTION);
      return;
    }

    // Both fields are stored Base64-encoded; decode them in place.
    entry.compressed_log_data = DecodeFromBase64(entry.compressed_log_data);
    entry.hash = DecodeFromBase64(entry.hash);

    // Ignoring the success of this step as timestamp might not be there for
    // older logs.
    // NOTE: Should be added to the check with other fields once migration is
    // over.
    fields->GetString(kLogTimestampKey, &entry.timestamp);
  }

  metrics_->RecordLogReadStatus(PersistedLogsMetrics::RECALL_SUCCESS);
}
// Replaces the contents of |list_value| with the logs that should be
// persisted. Each persisted log becomes a dictionary holding the
// Base64-encoded hash and compressed data plus the timestamp string.
//
// Logs are selected from newest (end of |list_|) to oldest until both
// |min_log_bytes_| and |min_log_count_| are satisfied; everything older is
// dropped. Logs larger than |max_log_size_| are never persisted and do not
// count towards either minimum. The size of each oversized log and the total
// number of dropped logs are reported through |metrics_|.
void PersistedLogs::WriteLogsToPrefList(base::ListValue* list_value) const {
  list_value->Clear();

  // Keep the most recent logs which are smaller than |max_log_size_|.
  // We keep at least |min_log_bytes_| and |min_log_count_| of logs before
  // discarding older logs.
  size_t start = list_.size();
  size_t saved_log_count = 0;
  size_t bytes_used = 0;
  for (; start > 0; --start) {
    const size_t log_size = list_[start - 1].compressed_log_data.length();
    if (bytes_used >= min_log_bytes_ && saved_log_count >= min_log_count_)
      break;
    // Oversized logs won't be persisted, so don't count them.
    if (log_size > max_log_size_)
      continue;
    bytes_used += log_size;
    ++saved_log_count;
  }

  // Every log at an index in [0, start) is older than the retained window and
  // is discarded, which is exactly |start| logs. (Using |start - 1| here
  // under-counts by one and wraps to -1 when nothing was trimmed, which in
  // turn hides the first oversized drop counted below.)
  int dropped_logs_num = static_cast<int>(start);

  for (size_t i = start; i < list_.size(); ++i) {
    const size_t log_size = list_[i].compressed_log_data.length();
    if (log_size > max_log_size_) {
      metrics_->RecordDroppedLogSize(log_size);
      ++dropped_logs_num;
      continue;
    }
    std::unique_ptr<base::DictionaryValue> dict_value(
        new base::DictionaryValue);
    dict_value->SetString(kLogHashKey, EncodeToBase64(list_[i].hash));
    dict_value->SetString(kLogDataKey,
                          EncodeToBase64(list_[i].compressed_log_data));
    dict_value->SetString(kLogTimestampKey, list_[i].timestamp);
    list_value->Append(std::move(dict_value));
  }

  if (dropped_logs_num > 0)
    metrics_->RecordDroppedLogsNum(dropped_logs_num);
}
} // namespace metrics