blob: 79a935ab32182498e502438b2923c80c38928172 [file] [log] [blame]
// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4
isherman3be67db2014-10-24 05:57:445#include "components/variations/net/variations_http_header_provider.h"
[email protected]bd3b4712012-12-18 17:01:306
horoe09b6c82014-11-01 02:08:287#include <set>
8#include <string>
[email protected]1bd918d2013-10-13 18:23:099#include <vector>
10
[email protected]bd3b4712012-12-18 17:01:3011#include "base/base64.h"
12#include "base/memory/singleton.h"
[email protected]999f7b42013-02-04 16:14:2513#include "base/metrics/histogram.h"
[email protected]1bd918d2013-10-13 18:23:0914#include "base/strings/string_number_conversions.h"
15#include "base/strings/string_split.h"
[email protected]7f8a9932013-07-26 20:43:3416#include "base/strings/string_util.h"
[email protected]8e44a5b02014-06-19 19:03:2417#include "components/google/core/browser/google_util.h"
[email protected]ea15bd52014-07-14 22:42:5018#include "components/variations/proto/client_variations.pb.h"
[email protected]7f8a9932013-07-26 20:43:3419#include "net/base/registry_controlled_domains/registry_controlled_domain.h"
[email protected]bd3b4712012-12-18 17:01:3020#include "net/http/http_request_headers.h"
[email protected]7f8a9932013-07-26 20:43:3421#include "url/gurl.h"
[email protected]bd3b4712012-12-18 17:01:3022
[email protected]71011c1682014-07-09 17:19:1623namespace variations {
[email protected]ab7780792013-01-10 01:26:0924
namespace {

// Host suffixes that receive the variations headers. ShouldAppendHeaders()
// compares the end of the request host against each entry, ignoring case.
// Both the array and the pointers it holds are const so that no entry can be
// reassigned at runtime.
const char* const kSuffixesToSetHeadersFor[] = {
  ".android.com",
  ".doubleclick.com",
  ".doubleclick.net",
  ".ggpht.com",
  ".googleadservices.com",
  ".googleapis.com",
  ".googlesyndication.com",
  ".googleusercontent.com",
  ".googlevideo.com",
  ".gstatic.com",
  ".ytimg.com",
};

// Name of the header that is set to "1" when UMA is enabled.
const char kChromeUMAEnabled[] = "X-Chrome-UMA-Enabled";

// Name of the header that carries the base64-encoded variation IDs.
const char kClientData[] = "X-Client-Data";

}  // namespace
45
[email protected]ab7780792013-01-10 01:26:0946VariationsHttpHeaderProvider* VariationsHttpHeaderProvider::GetInstance() {
47 return Singleton<VariationsHttpHeaderProvider>::get();
[email protected]bd3b4712012-12-18 17:01:3048}
49
[email protected]ab7780792013-01-10 01:26:0950void VariationsHttpHeaderProvider::AppendHeaders(
51 const GURL& url,
52 bool incognito,
53 bool uma_enabled,
54 net::HttpRequestHeaders* headers) {
[email protected]ea15bd52014-07-14 22:42:5055 // Note the criteria for attaching client experiment headers:
[email protected]0eea1cf72014-04-01 19:39:1956 // 1. We only transmit to Google owned domains which can evaluate experiments.
57 // 1a. These include hosts which have a standard postfix such as:
58 // *.doubleclick.net or *.googlesyndication.com or
59 // exactly www.googleadservices.com or
60 // international TLD domains *.google.<TLD> or *.youtube.<TLD>.
[email protected]bd3b4712012-12-18 17:01:3061 // 2. Only transmit for non-Incognito profiles.
62 // 3. For the X-Chrome-UMA-Enabled bit, only set it if UMA is in fact enabled
63 // for this install of Chrome.
[email protected]05ef1f22013-12-05 22:24:3464 // 4. For the X-Client-Data header, only include non-empty variation IDs.
[email protected]7f8a9932013-07-26 20:43:3465 if (incognito || !ShouldAppendHeaders(url))
[email protected]bd3b4712012-12-18 17:01:3066 return;
[email protected]bd3b4712012-12-18 17:01:3067
68 if (uma_enabled)
horoe09b6c82014-11-01 02:08:2869 headers->SetHeaderIfMissing(kChromeUMAEnabled, "1");
[email protected]bd3b4712012-12-18 17:01:3070
71 // Lazily initialize the header, if not already done, before attempting to
72 // transmit it.
73 InitVariationIDsCacheIfNeeded();
[email protected]ab7780792013-01-10 01:26:0974
75 std::string variation_ids_header_copy;
76 {
77 base::AutoLock scoped_lock(lock_);
78 variation_ids_header_copy = variation_ids_header_;
79 }
80
81 if (!variation_ids_header_copy.empty()) {
[email protected]05ef1f22013-12-05 22:24:3482 // Note that prior to M33 this header was named X-Chrome-Variations.
horoe09b6c82014-11-01 02:08:2883 headers->SetHeaderIfMissing(kClientData, variation_ids_header_copy);
[email protected]ab7780792013-01-10 01:26:0984 }
[email protected]bd3b4712012-12-18 17:01:3085}
86
[email protected]1bd918d2013-10-13 18:23:0987bool VariationsHttpHeaderProvider::SetDefaultVariationIds(
88 const std::string& variation_ids) {
89 default_variation_ids_set_.clear();
[email protected]8c2c5442014-04-04 18:55:2990 default_trigger_id_set_.clear();
[email protected]1bd918d2013-10-13 18:23:0991 std::vector<std::string> entries;
92 base::SplitString(variation_ids, ',', &entries);
93 for (std::vector<std::string>::const_iterator it = entries.begin();
94 it != entries.end(); ++it) {
[email protected]8c2c5442014-04-04 18:55:2995 if (it->empty()) {
[email protected]1bd918d2013-10-13 18:23:0996 default_variation_ids_set_.clear();
[email protected]8c2c5442014-04-04 18:55:2997 default_trigger_id_set_.clear();
[email protected]1bd918d2013-10-13 18:23:0998 return false;
99 }
[email protected]8c2c5442014-04-04 18:55:29100 bool trigger_id = StartsWithASCII(*it, "t", true);
101 // Remove the "t" prefix if it's there.
102 std::string entry = trigger_id ? it->substr(1) : *it;
103
104 int variation_id = 0;
105 if (!base::StringToInt(entry, &variation_id)) {
106 default_variation_ids_set_.clear();
107 default_trigger_id_set_.clear();
108 return false;
109 }
110 if (trigger_id)
111 default_trigger_id_set_.insert(variation_id);
112 else
113 default_variation_ids_set_.insert(variation_id);
[email protected]1bd918d2013-10-13 18:23:09114 }
115 return true;
116}
117
[email protected]ab7780792013-01-10 01:26:09118VariationsHttpHeaderProvider::VariationsHttpHeaderProvider()
[email protected]bd3b4712012-12-18 17:01:30119 : variation_ids_cache_initialized_(false) {
120}
121
[email protected]ab7780792013-01-10 01:26:09122VariationsHttpHeaderProvider::~VariationsHttpHeaderProvider() {
[email protected]bd3b4712012-12-18 17:01:30123}
124
[email protected]ab7780792013-01-10 01:26:09125void VariationsHttpHeaderProvider::OnFieldTrialGroupFinalized(
[email protected]bd3b4712012-12-18 17:01:30126 const std::string& trial_name,
127 const std::string& group_name) {
[email protected]ab7780792013-01-10 01:26:09128 VariationID new_id =
129 GetGoogleVariationID(GOOGLE_WEB_PROPERTIES, trial_name, group_name);
[email protected]e51dcb0c2014-05-06 16:56:10130 VariationID new_trigger_id = GetGoogleVariationID(
131 GOOGLE_WEB_PROPERTIES_TRIGGER, trial_name, group_name);
132 if (new_id == EMPTY_ID && new_trigger_id == EMPTY_ID)
[email protected]bd3b4712012-12-18 17:01:30133 return;
[email protected]ab7780792013-01-10 01:26:09134
[email protected]bd3b4712012-12-18 17:01:30135 base::AutoLock scoped_lock(lock_);
[email protected]e51dcb0c2014-05-06 16:56:10136 if (new_id != EMPTY_ID)
137 variation_ids_set_.insert(new_id);
138 if (new_trigger_id != EMPTY_ID)
139 variation_trigger_ids_set_.insert(new_trigger_id);
140
[email protected]bd3b4712012-12-18 17:01:30141 UpdateVariationIDsHeaderValue();
142}
143
asvitkinee0dbdbe2014-10-31 21:59:57144void VariationsHttpHeaderProvider::OnSyntheticTrialsChanged(
145 const std::vector<metrics::SyntheticTrialGroup>& groups) {
146 base::AutoLock scoped_lock(lock_);
147
148 synthetic_variation_ids_set_.clear();
149 for (const metrics::SyntheticTrialGroup& group : groups) {
150 const VariationID id =
151 GetGoogleVariationIDFromHashes(GOOGLE_WEB_PROPERTIES, group.id);
152 if (id != EMPTY_ID)
153 synthetic_variation_ids_set_.insert(id);
154 }
155 UpdateVariationIDsHeaderValue();
156}
157
[email protected]ab7780792013-01-10 01:26:09158void VariationsHttpHeaderProvider::InitVariationIDsCacheIfNeeded() {
[email protected]bd3b4712012-12-18 17:01:30159 base::AutoLock scoped_lock(lock_);
160 if (variation_ids_cache_initialized_)
161 return;
162
163 // Register for additional cache updates. This is done first to avoid a race
164 // that could cause registered FieldTrials to be missed.
[email protected]b3a25092013-05-28 22:08:16165 DCHECK(base::MessageLoop::current());
[email protected]bd3b4712012-12-18 17:01:30166 base::FieldTrialList::AddObserver(this);
167
[email protected]999f7b42013-02-04 16:14:25168 base::TimeTicks before_time = base::TimeTicks::Now();
169
[email protected]bd3b4712012-12-18 17:01:30170 base::FieldTrial::ActiveGroups initial_groups;
171 base::FieldTrialList::GetActiveFieldTrialGroups(&initial_groups);
172 for (base::FieldTrial::ActiveGroups::const_iterator it =
[email protected]ab7780792013-01-10 01:26:09173 initial_groups.begin();
174 it != initial_groups.end(); ++it) {
175 const VariationID id =
176 GetGoogleVariationID(GOOGLE_WEB_PROPERTIES, it->trial_name,
177 it->group_name);
[email protected]90acad02013-01-16 17:17:54178 if (id != EMPTY_ID)
[email protected]bd3b4712012-12-18 17:01:30179 variation_ids_set_.insert(id);
[email protected]e51dcb0c2014-05-06 16:56:10180
181 const VariationID trigger_id =
182 GetGoogleVariationID(GOOGLE_WEB_PROPERTIES_TRIGGER, it->trial_name,
183 it->group_name);
184 if (trigger_id != EMPTY_ID)
185 variation_trigger_ids_set_.insert(trigger_id);
[email protected]bd3b4712012-12-18 17:01:30186 }
187 UpdateVariationIDsHeaderValue();
188
[email protected]999f7b42013-02-04 16:14:25189 UMA_HISTOGRAM_CUSTOM_COUNTS(
190 "Variations.HeaderConstructionTime",
191 (base::TimeTicks::Now() - before_time).InMicroseconds(),
192 0,
193 base::TimeDelta::FromSeconds(1).InMicroseconds(),
194 50);
195
[email protected]bd3b4712012-12-18 17:01:30196 variation_ids_cache_initialized_ = true;
197}
198
[email protected]ab7780792013-01-10 01:26:09199void VariationsHttpHeaderProvider::UpdateVariationIDsHeaderValue() {
200 lock_.AssertAcquired();
201
[email protected]bd3b4712012-12-18 17:01:30202 // The header value is a serialized protobuffer of Variation IDs which is
203 // base64 encoded before transmitting as a string.
[email protected]1bd918d2013-10-13 18:23:09204 variation_ids_header_.clear();
205
[email protected]8c2c5442014-04-04 18:55:29206 if (variation_ids_set_.empty() && default_variation_ids_set_.empty() &&
asvitkinee0dbdbe2014-10-31 21:59:57207 variation_trigger_ids_set_.empty() && default_trigger_id_set_.empty() &&
208 synthetic_variation_ids_set_.empty()) {
[email protected]bd3b4712012-12-18 17:01:30209 return;
[email protected]8c2c5442014-04-04 18:55:29210 }
[email protected]bd3b4712012-12-18 17:01:30211
212 // This is the bottleneck for the creation of the header, so validate the size
213 // here. Force a hard maximum on the ID count in case the Variations server
214 // returns too many IDs and DOSs receiving servers with large requests.
[email protected]e51dcb0c2014-05-06 16:56:10215 const size_t total_id_count =
216 variation_ids_set_.size() + variation_trigger_ids_set_.size();
217 DCHECK_LE(total_id_count, 10U);
[email protected]a27ae2a2014-08-01 16:17:52218 UMA_HISTOGRAM_COUNTS_100("Variations.Headers.ExperimentCount",
219 total_id_count);
[email protected]e51dcb0c2014-05-06 16:56:10220 if (total_id_count > 20)
[email protected]bd3b4712012-12-18 17:01:30221 return;
[email protected]bd3b4712012-12-18 17:01:30222
[email protected]1bd918d2013-10-13 18:23:09223 // Merge the two sets of experiment ids.
224 std::set<VariationID> all_variation_ids_set = default_variation_ids_set_;
asvitkinee0dbdbe2014-10-31 21:59:57225 for (VariationID id : variation_ids_set_)
226 all_variation_ids_set.insert(id);
227 for (VariationID id : synthetic_variation_ids_set_)
228 all_variation_ids_set.insert(id);
[email protected]bd3b4712012-12-18 17:01:30229
[email protected]e51dcb0c2014-05-06 16:56:10230 std::set<VariationID> all_trigger_ids_set = default_trigger_id_set_;
asvitkinee0dbdbe2014-10-31 21:59:57231 for (VariationID id : variation_trigger_ids_set_)
232 all_trigger_ids_set.insert(id);
233
234 ClientVariations proto;
235 for (VariationID id : all_variation_ids_set)
236 proto.add_variation_id(id);
237 for (VariationID id : all_trigger_ids_set)
238 proto.add_trigger_variation_id(id);
[email protected]8c2c5442014-04-04 18:55:29239
[email protected]bd3b4712012-12-18 17:01:30240 std::string serialized;
241 proto.SerializeToString(&serialized);
242
243 std::string hashed;
[email protected]33fca122013-12-11 01:48:50244 base::Base64Encode(serialized, &hashed);
245 // If successful, swap the header value with the new one.
246 // Note that the list of IDs and the header could be temporarily out of sync
247 // if IDs are added as the header is recreated. The receiving servers are OK
248 // with such discrepancies.
249 variation_ids_header_ = hashed;
[email protected]bd3b4712012-12-18 17:01:30250}
[email protected]ab7780792013-01-10 01:26:09251
[email protected]7f8a9932013-07-26 20:43:34252// static
253bool VariationsHttpHeaderProvider::ShouldAppendHeaders(const GURL& url) {
254 if (google_util::IsGoogleDomainUrl(url, google_util::ALLOW_SUBDOMAIN,
255 google_util::ALLOW_NON_STANDARD_PORTS)) {
256 return true;
257 }
258
[email protected]91f5689032013-08-22 01:43:33259 if (!url.is_valid() || !url.SchemeIsHTTPOrHTTPS())
[email protected]7f8a9932013-07-26 20:43:34260 return false;
261
[email protected]0eea1cf72014-04-01 19:39:19262 // Some domains don't have international TLD extensions, so testing for them
263 // is very straight forward.
[email protected]7f8a9932013-07-26 20:43:34264 const std::string host = url.host();
[email protected]64d617e2014-05-31 04:37:54265 for (size_t i = 0; i < arraysize(kSuffixesToSetHeadersFor); ++i) {
266 if (EndsWith(host, kSuffixesToSetHeadersFor[i], false))
267 return true;
[email protected]0eea1cf72014-04-01 19:39:19268 }
269
[email protected]87abe9ea2014-06-17 03:29:54270 return google_util::IsYoutubeDomainUrl(url, google_util::ALLOW_SUBDOMAIN,
271 google_util::ALLOW_NON_STANDARD_PORTS);
[email protected]7f8a9932013-07-26 20:43:34272}
273
horoe09b6c82014-11-01 02:08:28274std::set<std::string> VariationsHttpHeaderProvider::GetVariationHeaderNames()
275 const {
276 std::set<std::string> headers;
277 headers.insert(kChromeUMAEnabled);
278 headers.insert(kClientData);
279 return headers;
280}
281
[email protected]71011c1682014-07-09 17:19:16282} // namespace variations