// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "components/variations/variations_http_header_provider.h"
#include <vector>
#include "base/base64.h"
#include "base/memory/singleton.h"
#include "base/metrics/histogram.h"
#include "base/strings/string_number_conversions.h"
#include "base/strings/string_split.h"
#include "base/strings/string_util.h"
#include "components/google/core/browser/google_util.h"
#include "components/variations/proto/client_variations.pb.h"
#include "net/base/registry_controlled_domains/registry_controlled_domain.h"
#include "net/http/http_request_headers.h"
#include "url/gurl.h"
namespace variations {
namespace {

// Host suffixes for which ShouldAppendHeaders() returns true when the request
// host ends with one of them. Every entry begins with '.', so a host only
// matches when the listed domain is preceded by at least one more label.
//
// Both the characters and the pointers are const: the table is never modified
// at runtime, and declaring the pointers const prevents accidental
// reassignment of an entry.
const char* const kSuffixesToSetHeadersFor[] = {
  ".android.com",
  ".doubleclick.com",
  ".doubleclick.net",
  ".ggpht.com",
  ".googleadservices.com",
  ".googleapis.com",
  ".googlesyndication.com",
  ".googleusercontent.com",
  ".googlevideo.com",
  ".gstatic.com",
  ".ytimg.com",
};

}  // namespace
// Returns the instance managed by Singleton<VariationsHttpHeaderProvider>.
VariationsHttpHeaderProvider* VariationsHttpHeaderProvider::GetInstance() {
  VariationsHttpHeaderProvider* const instance =
      Singleton<VariationsHttpHeaderProvider>::get();
  return instance;
}
void VariationsHttpHeaderProvider::AppendHeaders(
const GURL& url,
bool incognito,
bool uma_enabled,
net::HttpRequestHeaders* headers) {
// Note the criteria for attaching client experiment headers:
// 1. We only transmit to Google owned domains which can evaluate experiments.
// 1a. These include hosts which have a standard postfix such as:
// *.doubleclick.net or *.googlesyndication.com or
// exactly www.googleadservices.com or
// international TLD domains *.google.<TLD> or *.youtube.<TLD>.
// 2. Only transmit for non-Incognito profiles.
// 3. For the X-Chrome-UMA-Enabled bit, only set it if UMA is in fact enabled
// for this install of Chrome.
// 4. For the X-Client-Data header, only include non-empty variation IDs.
if (incognito || !ShouldAppendHeaders(url))
return;
if (uma_enabled)
headers->SetHeaderIfMissing("X-Chrome-UMA-Enabled", "1");
// Lazily initialize the header, if not already done, before attempting to
// transmit it.
InitVariationIDsCacheIfNeeded();
std::string variation_ids_header_copy;
{
base::AutoLock scoped_lock(lock_);
variation_ids_header_copy = variation_ids_header_;
}
if (!variation_ids_header_copy.empty()) {
// Note that prior to M33 this header was named X-Chrome-Variations.
headers->SetHeaderIfMissing("X-Client-Data",
variation_ids_header_copy);
}
}
// Replaces the default ID sets with the IDs listed in |variation_ids|.
//
// |variation_ids| is split on ','. An entry that starts with "t" has that
// prefix removed and is stored in the default trigger ID set; every other
// entry is stored in the default variation ID set. Each entry (after prefix
// removal) must parse as an int.
//
// Any previously stored defaults are discarded up front. Returns true when all
// entries were accepted. If an entry is empty or fails to parse, both default
// sets are left empty and false is returned.
bool VariationsHttpHeaderProvider::SetDefaultVariationIds(
    const std::string& variation_ids) {
  default_variation_ids_set_.clear();
  default_trigger_id_set_.clear();

  std::vector<std::string> tokens;
  base::SplitString(variation_ids, ',', &tokens);

  bool all_parsed = true;
  for (size_t index = 0; index < tokens.size(); ++index) {
    const std::string& token = tokens[index];
    if (token.empty()) {
      all_parsed = false;
      break;
    }

    const bool is_trigger = StartsWithASCII(token, "t", true);
    // Drop the leading "t" marker, if any, before parsing the number.
    const std::string digits = is_trigger ? token.substr(1) : token;

    int parsed_id = 0;
    if (!base::StringToInt(digits, &parsed_id)) {
      all_parsed = false;
      break;
    }

    if (is_trigger)
      default_trigger_id_set_.insert(parsed_id);
    else
      default_variation_ids_set_.insert(parsed_id);
  }

  if (!all_parsed) {
    // Do not keep a partially parsed list.
    default_variation_ids_set_.clear();
    default_trigger_id_set_.clear();
  }
  return all_parsed;
}
// Marks the variation ID cache as not yet initialized; it is populated later
// by InitVariationIDsCacheIfNeeded().
VariationsHttpHeaderProvider::VariationsHttpHeaderProvider()
    : variation_ids_cache_initialized_(false) {}
// Nothing to release explicitly.
// NOTE(review): the base::FieldTrialList observer registered in
// InitVariationIDsCacheIfNeeded() is not unregistered here - confirm that this
// is intended for the object's lifetime.
VariationsHttpHeaderProvider::~VariationsHttpHeaderProvider() {}
void VariationsHttpHeaderProvider::OnFieldTrialGroupFinalized(
const std::string& trial_name,
const std::string& group_name) {
VariationID new_id =
GetGoogleVariationID(GOOGLE_WEB_PROPERTIES, trial_name, group_name);
VariationID new_trigger_id = GetGoogleVariationID(
GOOGLE_WEB_PROPERTIES_TRIGGER, trial_name, group_name);
if (new_id == EMPTY_ID && new_trigger_id == EMPTY_ID)
return;
base::AutoLock scoped_lock(lock_);
if (new_id != EMPTY_ID)
variation_ids_set_.insert(new_id);
if (new_trigger_id != EMPTY_ID)
variation_trigger_ids_set_.insert(new_trigger_id);
UpdateVariationIDsHeaderValue();
}
void VariationsHttpHeaderProvider::InitVariationIDsCacheIfNeeded() {
base::AutoLock scoped_lock(lock_);
if (variation_ids_cache_initialized_)
return;
// Register for additional cache updates. This is done first to avoid a race
// that could cause registered FieldTrials to be missed.
DCHECK(base::MessageLoop::current());
base::FieldTrialList::AddObserver(this);
base::TimeTicks before_time = base::TimeTicks::Now();
base::FieldTrial::ActiveGroups initial_groups;
base::FieldTrialList::GetActiveFieldTrialGroups(&initial_groups);
for (base::FieldTrial::ActiveGroups::const_iterator it =
initial_groups.begin();
it != initial_groups.end(); ++it) {
const VariationID id =
GetGoogleVariationID(GOOGLE_WEB_PROPERTIES, it->trial_name,
it->group_name);
if (id != EMPTY_ID)
variation_ids_set_.insert(id);
const VariationID trigger_id =
GetGoogleVariationID(GOOGLE_WEB_PROPERTIES_TRIGGER, it->trial_name,
it->group_name);
if (trigger_id != EMPTY_ID)
variation_trigger_ids_set_.insert(trigger_id);
}
UpdateVariationIDsHeaderValue();
UMA_HISTOGRAM_CUSTOM_COUNTS(
"Variations.HeaderConstructionTime",
(base::TimeTicks::Now() - before_time).InMicroseconds(),
0,
base::TimeDelta::FromSeconds(1).InMicroseconds(),
50);
variation_ids_cache_initialized_ = true;
}
void VariationsHttpHeaderProvider::UpdateVariationIDsHeaderValue() {
lock_.AssertAcquired();
// The header value is a serialized protobuffer of Variation IDs which is
// base64 encoded before transmitting as a string.
variation_ids_header_.clear();
if (variation_ids_set_.empty() && default_variation_ids_set_.empty() &&
variation_trigger_ids_set_.empty() && default_trigger_id_set_.empty()) {
return;
}
// This is the bottleneck for the creation of the header, so validate the size
// here. Force a hard maximum on the ID count in case the Variations server
// returns too many IDs and DOSs receiving servers with large requests.
const size_t total_id_count =
variation_ids_set_.size() + variation_trigger_ids_set_.size();
DCHECK_LE(total_id_count, 10U);
UMA_HISTOGRAM_COUNTS_100("Variations.Headers.ExperimentCount",
total_id_count);
if (total_id_count > 20)
return;
// Merge the two sets of experiment ids.
std::set<VariationID> all_variation_ids_set = default_variation_ids_set_;
for (std::set<VariationID>::const_iterator it = variation_ids_set_.begin();
it != variation_ids_set_.end(); ++it) {
all_variation_ids_set.insert(*it);
}
ClientVariations proto;
for (std::set<VariationID>::const_iterator it = all_variation_ids_set.begin();
it != all_variation_ids_set.end(); ++it) {
proto.add_variation_id(*it);
}
std::set<VariationID> all_trigger_ids_set = default_trigger_id_set_;
for (std::set<VariationID>::const_iterator it =
variation_trigger_ids_set_.begin();
it != variation_trigger_ids_set_.end(); ++it) {
all_trigger_ids_set.insert(*it);
}
for (std::set<VariationID>::const_iterator it = all_trigger_ids_set.begin();
it != all_trigger_ids_set.end(); ++it) {
proto.add_trigger_variation_id(*it);
}
std::string serialized;
proto.SerializeToString(&serialized);
std::string hashed;
base::Base64Encode(serialized, &hashed);
// If successful, swap the header value with the new one.
// Note that the list of IDs and the header could be temporarily out of sync
// if IDs are added as the header is recreated. The receiving servers are OK
// with such discrepancies.
variation_ids_header_ = hashed;
}
// static
// Decides whether the experiment headers may be attached to a request for
// |url|. Returns true when any of the following holds:
//   - google_util::IsGoogleDomainUrl() accepts the URL (subdomains and
//     non-standard ports allowed);
//   - the URL is a valid HTTP(S) URL whose host ends with an entry of
//     kSuffixesToSetHeadersFor;
//   - the URL is a valid HTTP(S) URL that google_util::IsYoutubeDomainUrl()
//     accepts (subdomains and non-standard ports allowed).
bool VariationsHttpHeaderProvider::ShouldAppendHeaders(const GURL& url) {
  const bool is_google_domain = google_util::IsGoogleDomainUrl(
      url, google_util::ALLOW_SUBDOMAIN,
      google_util::ALLOW_NON_STANDARD_PORTS);
  if (is_google_domain)
    return true;

  if (!(url.is_valid() && url.SchemeIsHTTPOrHTTPS()))
    return false;

  // Some domains don't have international TLD extensions, so a plain suffix
  // comparison against the host is enough for them.
  const std::string host = url.host();
  const size_t suffix_count = arraysize(kSuffixesToSetHeadersFor);
  for (size_t index = 0; index != suffix_count; ++index) {
    const bool host_matches =
        EndsWith(host, kSuffixesToSetHeadersFor[index], false);
    if (host_matches)
      return true;
  }

  return google_util::IsYoutubeDomainUrl(url, google_util::ALLOW_SUBDOMAIN,
                                         google_util::ALLOW_NON_STANDARD_PORTS);
}
} // namespace variations