zero_suggest_provider.cc revision 424c4d7b64af9d0d8fd9624f381f469654d5e3d2
1// Copyright (c) 2012 The Chromium Authors. All rights reserved. 2// Use of this source code is governed by a BSD-style license that can be 3// found in the LICENSE file. 4 5#include "chrome/browser/autocomplete/zero_suggest_provider.h" 6 7#include "base/callback.h" 8#include "base/i18n/case_conversion.h" 9#include "base/json/json_string_value_serializer.h" 10#include "base/metrics/histogram.h" 11#include "base/prefs/pref_service.h" 12#include "base/strings/string16.h" 13#include "base/strings/string_util.h" 14#include "base/strings/utf_string_conversions.h" 15#include "base/time/time.h" 16#include "chrome/browser/autocomplete/autocomplete_classifier.h" 17#include "chrome/browser/autocomplete/autocomplete_classifier_factory.h" 18#include "chrome/browser/autocomplete/autocomplete_input.h" 19#include "chrome/browser/autocomplete/autocomplete_match.h" 20#include "chrome/browser/autocomplete/autocomplete_provider_listener.h" 21#include "chrome/browser/autocomplete/history_url_provider.h" 22#include "chrome/browser/autocomplete/search_provider.h" 23#include "chrome/browser/autocomplete/url_prefix.h" 24#include "chrome/browser/google/google_util.h" 25#include "chrome/browser/metrics/variations/variations_http_header_provider.h" 26#include "chrome/browser/omnibox/omnibox_field_trial.h" 27#include "chrome/browser/profiles/profile.h" 28#include "chrome/browser/search/search.h" 29#include "chrome/browser/search_engines/template_url_service.h" 30#include "chrome/browser/search_engines/template_url_service_factory.h" 31#include "chrome/browser/sync/profile_sync_service.h" 32#include "chrome/browser/sync/profile_sync_service_factory.h" 33#include "chrome/common/net/url_fixer_upper.h" 34#include "chrome/common/pref_names.h" 35#include "chrome/common/url_constants.h" 36#include "net/base/escape.h" 37#include "net/base/load_flags.h" 38#include "net/base/net_util.h" 39#include "net/http/http_request_headers.h" 40#include "net/http/http_response_headers.h" 41#include "net/url_request/url_fetcher.h" 42#include "net/url_request/url_request_status.h" 43#include "url/gurl.h" 44 45namespace { 46 47// TODO(hfung): The histogram code was copied and modified from 48// search_provider.cc. Refactor and consolidate the code. 49// We keep track in a histogram how many suggest requests we send, how 50// many suggest requests we invalidate (e.g., due to a user typing 51// another character), and how many replies we receive. 52// *** ADD NEW ENUMS AFTER ALL PREVIOUSLY DEFINED ONES! *** 53// (excluding the end-of-list enum value) 54// We do not want values of existing enums to change or else it screws 55// up the statistics. 56enum ZeroSuggestRequestsHistogramValue { 57 ZERO_SUGGEST_REQUEST_SENT = 1, 58 ZERO_SUGGEST_REQUEST_INVALIDATED, 59 ZERO_SUGGEST_REPLY_RECEIVED, 60 ZERO_SUGGEST_MAX_REQUEST_HISTOGRAM_VALUE 61}; 62 63void LogOmniboxZeroSuggestRequest( 64 ZeroSuggestRequestsHistogramValue request_value) { 65 UMA_HISTOGRAM_ENUMERATION("Omnibox.ZeroSuggestRequests", request_value, 66 ZERO_SUGGEST_MAX_REQUEST_HISTOGRAM_VALUE); 67} 68 69// The maximum relevance of the top match from this provider. 70const int kDefaultVerbatimZeroSuggestRelevance = 1300; 71 72// Relevance value to use if it was not set explicitly by the server. 73const int kDefaultZeroSuggestRelevance = 100; 74 75} // namespace 76 77// static 78ZeroSuggestProvider* ZeroSuggestProvider::Create( 79 AutocompleteProviderListener* listener, 80 Profile* profile) { 81 return new ZeroSuggestProvider(listener, profile); 82} 83 84void ZeroSuggestProvider::Start(const AutocompleteInput& input, 85 bool /*minimal_changes*/) { 86} 87 88void ZeroSuggestProvider::Stop(bool clear_cached_results) { 89 if (have_pending_request_) 90 LogOmniboxZeroSuggestRequest(ZERO_SUGGEST_REQUEST_INVALIDATED); 91 have_pending_request_ = false; 92 fetcher_.reset(); 93 done_ = true; 94 if (clear_cached_results) { 95 query_matches_map_.clear(); 96 navigation_results_.clear(); 97 current_query_.clear(); 98 matches_.clear(); 99 } 100} 101 102void ZeroSuggestProvider::AddProviderInfo(ProvidersInfo* provider_info) const { 103 provider_info->push_back(metrics::OmniboxEventProto_ProviderInfo()); 104 metrics::OmniboxEventProto_ProviderInfo& new_entry = provider_info->back(); 105 new_entry.set_provider(AsOmniboxEventProviderType()); 106 new_entry.set_provider_done(done_); 107 std::vector<uint32> field_trial_hashes; 108 OmniboxFieldTrial::GetActiveSuggestFieldTrialHashes(&field_trial_hashes); 109 for (size_t i = 0; i < field_trial_hashes.size(); ++i) { 110 if (field_trial_triggered_) 111 new_entry.mutable_field_trial_triggered()->Add(field_trial_hashes[i]); 112 if (field_trial_triggered_in_session_) { 113 new_entry.mutable_field_trial_triggered_in_session()->Add( 114 field_trial_hashes[i]); 115 } 116 } 117} 118 119void ZeroSuggestProvider::ResetSession() { 120 // The user has started editing in the omnibox, so leave 121 // |field_trial_triggered_in_session_| unchanged and set 122 // |field_trial_triggered_| to false since zero suggest is inactive now. 123 field_trial_triggered_ = false; 124 Stop(true); 125} 126 127void ZeroSuggestProvider::OnURLFetchComplete(const net::URLFetcher* source) { 128 have_pending_request_ = false; 129 LogOmniboxZeroSuggestRequest(ZERO_SUGGEST_REPLY_RECEIVED); 130 131 std::string json_data; 132 source->GetResponseAsString(&json_data); 133 const bool request_succeeded = 134 source->GetStatus().is_success() && source->GetResponseCode() == 200; 135 136 bool have_results = false; 137 if (request_succeeded) { 138 JSONStringValueSerializer deserializer(json_data); 139 deserializer.set_allow_trailing_comma(true); 140 scoped_ptr<Value> data(deserializer.Deserialize(NULL, NULL)); 141 if (data.get()) { 142 ParseSuggestResults(*data.get()); 143 have_results = !query_matches_map_.empty() || 144 !navigation_results_.empty(); 145 } 146 } 147 done_ = true; 148 149 if (have_results) { 150 ConvertResultsToAutocompleteMatches(); 151 listener_->OnProviderUpdate(true); 152 } 153} 154 155void ZeroSuggestProvider::StartZeroSuggest( 156 const GURL& url, 157 AutocompleteInput::PageClassification page_classification, 158 const string16& permanent_text) { 159 Stop(true); 160 field_trial_triggered_ = false; 161 field_trial_triggered_in_session_ = false; 162 if (!ShouldRunZeroSuggest(url)) 163 return; 164 verbatim_relevance_ = kDefaultVerbatimZeroSuggestRelevance; 165 done_ = false; 166 permanent_text_ = permanent_text; 167 current_query_ = url.spec(); 168 current_page_classification_ = page_classification; 169 current_url_match_ = MatchForCurrentURL(); 170 // TODO(jered): Consider adding locally-sourced zero-suggestions here too. 171 // These may be useful on the NTP or more relevant to the user than server 172 // suggestions, if based on local browsing history. 173 Run(); 174} 175 176ZeroSuggestProvider::ZeroSuggestProvider( 177 AutocompleteProviderListener* listener, 178 Profile* profile) 179 : AutocompleteProvider(listener, profile, 180 AutocompleteProvider::TYPE_ZERO_SUGGEST), 181 template_url_service_(TemplateURLServiceFactory::GetForProfile(profile)), 182 have_pending_request_(false), 183 verbatim_relevance_(kDefaultVerbatimZeroSuggestRelevance), 184 field_trial_triggered_(false), 185 field_trial_triggered_in_session_(false) { 186} 187 188ZeroSuggestProvider::~ZeroSuggestProvider() { 189} 190 191bool ZeroSuggestProvider::ShouldRunZeroSuggest(const GURL& url) const { 192 if (!ShouldSendURL(url)) 193 return false; 194 195 // Don't run if there's no profile or in incognito mode. 196 if (profile_ == NULL || profile_->IsOffTheRecord()) 197 return false; 198 199 // Don't run if we can't get preferences or search suggest is not enabled. 200 PrefService* prefs = profile_->GetPrefs(); 201 if (prefs == NULL || !prefs->GetBoolean(prefs::kSearchSuggestEnabled)) 202 return false; 203 204 ProfileSyncService* service = 205 ProfileSyncServiceFactory::GetInstance()->GetForProfile(profile_); 206 browser_sync::SyncPrefs sync_prefs(prefs); 207 // The user has needs to have Chrome Sync enabled (for permissions to 208 // transmit their current URL) and be in the field trial. 209 if (!OmniboxFieldTrial::InZeroSuggestFieldTrial() || 210 service == NULL || 211 !service->IsSyncEnabledAndLoggedIn() || 212 !sync_prefs.HasKeepEverythingSynced()) { 213 return false; 214 } 215 return true; 216} 217 218bool ZeroSuggestProvider::ShouldSendURL(const GURL& url) const { 219 if (!url.is_valid()) 220 return false; 221 222 // Only allow HTTP URLs or Google HTTPS URLs (including Google search 223 // result pages). For the latter case, Google was already sent the HTTPS 224 // URLs when requesting the page, so the information is just re-sent. 225 return (url.scheme() == chrome::kHttpScheme) || 226 google_util::IsGoogleDomainUrl(url, google_util::ALLOW_SUBDOMAIN, 227 google_util::ALLOW_NON_STANDARD_PORTS); 228} 229 230void ZeroSuggestProvider::FillResults( 231 const Value& root_val, 232 int* verbatim_relevance, 233 SearchProvider::SuggestResults* suggest_results, 234 SearchProvider::NavigationResults* navigation_results) { 235 string16 query; 236 const ListValue* root_list = NULL; 237 const ListValue* results = NULL; 238 const ListValue* relevances = NULL; 239 // The response includes the query, which should be empty for ZeroSuggest 240 // responses. 241 if (!root_val.GetAsList(&root_list) || !root_list->GetString(0, &query) || 242 (!query.empty()) || !root_list->GetList(1, &results)) 243 return; 244 245 // 3rd element: Description list. 246 const ListValue* descriptions = NULL; 247 root_list->GetList(2, &descriptions); 248 249 // 4th element: Disregard the query URL list for now. 250 251 // Reset suggested relevance information from the provider. 252 *verbatim_relevance = kDefaultVerbatimZeroSuggestRelevance; 253 254 // 5th element: Optional key-value pairs from the Suggest server. 255 const ListValue* types = NULL; 256 const DictionaryValue* extras = NULL; 257 if (root_list->GetDictionary(4, &extras)) { 258 extras->GetList("google:suggesttype", &types); 259 260 // Discard this list if its size does not match that of the suggestions. 261 if (extras->GetList("google:suggestrelevance", &relevances) && 262 relevances->GetSize() != results->GetSize()) 263 relevances = NULL; 264 extras->GetInteger("google:verbatimrelevance", verbatim_relevance); 265 266 // Check if the active suggest field trial (if any) has triggered. 267 bool triggered = false; 268 extras->GetBoolean("google:fieldtrialtriggered", &triggered); 269 field_trial_triggered_ |= triggered; 270 field_trial_triggered_in_session_ |= triggered; 271 } 272 273 // Clear the previous results now that new results are available. 274 suggest_results->clear(); 275 navigation_results->clear(); 276 277 string16 result, title; 278 std::string type; 279 for (size_t index = 0; results->GetString(index, &result); ++index) { 280 // Google search may return empty suggestions for weird input characters, 281 // they make no sense at all and can cause problems in our code. 282 if (result.empty()) 283 continue; 284 285 int relevance = kDefaultZeroSuggestRelevance; 286 287 // Apply valid suggested relevance scores; discard invalid lists. 288 if (relevances != NULL && !relevances->GetInteger(index, &relevance)) 289 relevances = NULL; 290 if (types && types->GetString(index, &type) && (type == "NAVIGATION")) { 291 // Do not blindly trust the URL coming from the server to be valid. 292 GURL url(URLFixerUpper::FixupURL(UTF16ToUTF8(result), std::string())); 293 if (url.is_valid()) { 294 if (descriptions != NULL) 295 descriptions->GetString(index, &title); 296 navigation_results->push_back(SearchProvider::NavigationResult( 297 *this, url, title, false, relevance, relevances != NULL)); 298 } 299 } else { 300 suggest_results->push_back(SearchProvider::SuggestResult( 301 result, false, relevance, relevances != NULL, false)); 302 } 303 } 304} 305 306void ZeroSuggestProvider::AddSuggestResultsToMap( 307 const SearchProvider::SuggestResults& results, 308 const TemplateURL* template_url, 309 SearchProvider::MatchMap* map) { 310 for (size_t i = 0; i < results.size(); ++i) { 311 AddMatchToMap(results[i].relevance(), AutocompleteMatchType::SEARCH_SUGGEST, 312 template_url, results[i].suggestion(), i, map); 313 } 314} 315 316void ZeroSuggestProvider::AddMatchToMap(int relevance, 317 AutocompleteMatch::Type type, 318 const TemplateURL* template_url, 319 const string16& query_string, 320 int accepted_suggestion, 321 SearchProvider::MatchMap* map) { 322 // Pass in query_string as the input_text since we don't want any bolding. 323 // TODO(samarth|melevin): use the actual omnibox margin here as well instead 324 // of passing in -1. 325 AutocompleteMatch match = SearchProvider::CreateSearchSuggestion( 326 this, relevance, type, template_url, query_string, query_string, 327 AutocompleteInput(), false, accepted_suggestion, -1, true); 328 if (!match.destination_url.is_valid()) 329 return; 330 331 // Try to add |match| to |map|. If a match for |query_string| is already in 332 // |map|, replace it if |match| is more relevant. 333 // NOTE: Keep this ToLower() call in sync with url_database.cc. 334 const std::pair<SearchProvider::MatchMap::iterator, bool> i(map->insert( 335 std::make_pair(base::i18n::ToLower(query_string), match))); 336 // NOTE: We purposefully do a direct relevance comparison here instead of 337 // using AutocompleteMatch::MoreRelevant(), so that we'll prefer "items added 338 // first" rather than "items alphabetically first" when the scores are equal. 339 // The only case this matters is when a user has results with the same score 340 // that differ only by capitalization; because the history system returns 341 // results sorted by recency, this means we'll pick the most recent such 342 // result even if the precision of our relevance score is too low to 343 // distinguish the two. 344 if (!i.second && (match.relevance > i.first->second.relevance)) 345 i.first->second = match; 346} 347 348AutocompleteMatch ZeroSuggestProvider::NavigationToMatch( 349 const SearchProvider::NavigationResult& navigation) { 350 AutocompleteMatch match(this, navigation.relevance(), false, 351 AutocompleteMatchType::NAVSUGGEST); 352 match.destination_url = navigation.url(); 353 354 const std::string languages( 355 profile_->GetPrefs()->GetString(prefs::kAcceptLanguages)); 356 match.contents = net::FormatUrl(navigation.url(), languages, 357 net::kFormatUrlOmitAll, net::UnescapeRule::SPACES, NULL, NULL, NULL); 358 match.fill_into_edit += 359 AutocompleteInput::FormattedStringWithEquivalentMeaning(navigation.url(), 360 match.contents); 361 362 AutocompleteMatch::ClassifyLocationInString(string16::npos, 0, 363 match.contents.length(), ACMatchClassification::URL, 364 &match.contents_class); 365 366 match.description = 367 AutocompleteMatch::SanitizeString(navigation.description()); 368 AutocompleteMatch::ClassifyLocationInString(string16::npos, 0, 369 match.description.length(), ACMatchClassification::NONE, 370 &match.description_class); 371 return match; 372} 373 374void ZeroSuggestProvider::Run() { 375 have_pending_request_ = false; 376 const int kFetcherID = 1; 377 378 const TemplateURL* default_provider = 379 template_url_service_->GetDefaultSearchProvider(); 380 // TODO(hfung): Generalize if the default provider supports zero suggest. 381 // Only make the request if we know that the provider supports zero suggest 382 // (currently only the prepopulated Google provider). 383 if (default_provider == NULL || !default_provider->SupportsReplacement() || 384 default_provider->prepopulate_id() != 1) { 385 Stop(true); 386 return; 387 } 388 string16 prefix; 389 TemplateURLRef::SearchTermsArgs search_term_args(prefix); 390 search_term_args.zero_prefix_url = current_query_; 391 std::string req_url = default_provider->suggestions_url_ref(). 392 ReplaceSearchTerms(search_term_args); 393 GURL suggest_url(req_url); 394 // Make sure we are sending the suggest request through HTTPS. 395 if (!suggest_url.SchemeIs(content::kHttpsScheme)) { 396 Stop(true); 397 return; 398 } 399 400 fetcher_.reset( 401 net::URLFetcher::Create(kFetcherID, 402 suggest_url, 403 net::URLFetcher::GET, this)); 404 fetcher_->SetRequestContext(profile_->GetRequestContext()); 405 fetcher_->SetLoadFlags(net::LOAD_DO_NOT_SAVE_COOKIES); 406 // Add Chrome experiment state to the request headers. 407 net::HttpRequestHeaders headers; 408 chrome_variations::VariationsHttpHeaderProvider::GetInstance()->AppendHeaders( 409 fetcher_->GetOriginalURL(), profile_->IsOffTheRecord(), false, &headers); 410 fetcher_->SetExtraRequestHeaders(headers.ToString()); 411 412 fetcher_->Start(); 413 have_pending_request_ = true; 414 LogOmniboxZeroSuggestRequest(ZERO_SUGGEST_REQUEST_SENT); 415} 416 417void ZeroSuggestProvider::ParseSuggestResults(const Value& root_val) { 418 SearchProvider::SuggestResults suggest_results; 419 FillResults(root_val, &verbatim_relevance_, 420 &suggest_results, &navigation_results_); 421 422 query_matches_map_.clear(); 423 AddSuggestResultsToMap(suggest_results, 424 template_url_service_->GetDefaultSearchProvider(), 425 &query_matches_map_); 426} 427 428void ZeroSuggestProvider::ConvertResultsToAutocompleteMatches() { 429 matches_.clear(); 430 431 const TemplateURL* default_provider = 432 template_url_service_->GetDefaultSearchProvider(); 433 // Fail if we can't set the clickthrough URL for query suggestions. 434 if (default_provider == NULL || !default_provider->SupportsReplacement()) 435 return; 436 437 const int num_query_results = query_matches_map_.size(); 438 const int num_nav_results = navigation_results_.size(); 439 const int num_results = num_query_results + num_nav_results; 440 UMA_HISTOGRAM_COUNTS("ZeroSuggest.QueryResults", num_query_results); 441 UMA_HISTOGRAM_COUNTS("ZeroSuggest.URLResults", num_nav_results); 442 UMA_HISTOGRAM_COUNTS("ZeroSuggest.AllResults", num_results); 443 444 if (num_results == 0) 445 return; 446 447 // TODO(jered): Rip this out once the first match is decoupled from the 448 // current typing in the omnibox. 449 matches_.push_back(current_url_match_); 450 451 for (SearchProvider::MatchMap::const_iterator it(query_matches_map_.begin()); 452 it != query_matches_map_.end(); ++it) 453 matches_.push_back(it->second); 454 455 for (SearchProvider::NavigationResults::const_iterator it( 456 navigation_results_.begin()); it != navigation_results_.end(); ++it) 457 matches_.push_back(NavigationToMatch(*it)); 458} 459 460AutocompleteMatch ZeroSuggestProvider::MatchForCurrentURL() { 461 AutocompleteInput input(permanent_text_, string16::npos, string16(), 462 GURL(current_query_), current_page_classification_, 463 false, false, true, AutocompleteInput::ALL_MATCHES); 464 465 AutocompleteMatch match; 466 AutocompleteClassifierFactory::GetForProfile(profile_)->Classify( 467 permanent_text_, false, true, &match, NULL); 468 match.is_history_what_you_typed_match = false; 469 match.allowed_to_be_default_match = true; 470 471 // The placeholder suggestion for the current URL has high relevance so 472 // that it is in the first suggestion slot and inline autocompleted. It 473 // gets dropped as soon as the user types something. 474 match.relevance = verbatim_relevance_; 475 476 return match; 477} 478