blob: b5a6f48296c744aaed7aec6ce2dcbee41c19fc5f [file] [log] [blame]
[email protected]e41982a72012-11-20 07:16:511// Copyright 2012 The Chromium Authors. All rights reserved.
license.botbf09a502008-08-24 00:55:552// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
initial.commit09911bf2008-07-26 23:55:294
5#include "chrome/browser/autocomplete/search_provider.h"
6
[email protected]1cb2dac2010-03-08 21:49:157#include <algorithm>
[email protected]c3a4bd992010-08-18 20:25:018#include <cmath>
[email protected]1cb2dac2010-03-08 21:49:159
[email protected]2041cf342010-02-19 03:15:5910#include "base/callback.h"
[email protected]51124552011-07-16 01:37:1011#include "base/i18n/break_iterator.h"
[email protected]503d03872011-05-06 08:36:2612#include "base/i18n/case_conversion.h"
[email protected]d6e58c6e2009-10-10 20:40:5013#include "base/i18n/icu_string_conversions.h"
[email protected]ffbec692012-02-26 20:26:4214#include "base/json/json_string_value_serializer.h"
[email protected]fa1e0e12013-07-18 00:10:1415#include "base/message_loop/message_loop.h"
[email protected]f5b95ba92012-03-27 14:05:1916#include "base/metrics/histogram.h"
[email protected]3853a4c2013-02-11 17:15:5717#include "base/prefs/pref_service.h"
[email protected]98570e12013-06-10 19:54:2218#include "base/strings/string16.h"
19#include "base/strings/string_util.h"
[email protected]135cb802013-06-09 16:44:2020#include "base/strings/utf_string_conversions.h"
[email protected]ea3b9a502011-04-04 14:19:3721#include "chrome/browser/autocomplete/autocomplete_classifier.h"
[email protected]810ffba2012-06-12 01:07:4822#include "chrome/browser/autocomplete/autocomplete_classifier_factory.h"
[email protected]9ac40092010-10-27 23:05:2623#include "chrome/browser/autocomplete/autocomplete_match.h"
[email protected]5af9bc82012-06-29 00:53:4824#include "chrome/browser/autocomplete/autocomplete_provider_listener.h"
[email protected]73c2b1632012-07-02 22:51:3825#include "chrome/browser/autocomplete/autocomplete_result.h"
[email protected]2c812ba02011-07-14 00:23:1526#include "chrome/browser/autocomplete/keyword_provider.h"
[email protected]371dab12012-06-01 03:23:5527#include "chrome/browser/autocomplete/url_prefix.h"
[email protected]6a2c09f2013-01-25 04:50:0728#include "chrome/browser/history/history_service.h"
[email protected]9d2db762012-06-19 00:01:1029#include "chrome/browser/history/history_service_factory.h"
[email protected]10c2d692012-05-11 05:32:2330#include "chrome/browser/history/in_memory_database.h"
[email protected]ab7780792013-01-10 01:26:0931#include "chrome/browser/metrics/variations/variations_http_header_provider.h"
[email protected]684fcc12013-03-08 22:50:0232#include "chrome/browser/omnibox/omnibox_field_trial.h"
[email protected]8ecad5e2010-12-02 21:18:3333#include "chrome/browser/profiles/profile.h"
[email protected]a7b8e43d2013-03-18 18:52:4334#include "chrome/browser/search/search.h"
[email protected]9899a612012-08-21 23:50:0435#include "chrome/browser/search_engines/template_url_prepopulate_data.h"
[email protected]8e5c89a2011-06-07 18:13:3336#include "chrome/browser/search_engines/template_url_service.h"
37#include "chrome/browser/search_engines/template_url_service_factory.h"
[email protected]c4a9d4c2013-08-10 07:06:2738#include "chrome/browser/ui/browser.h"
39#include "chrome/browser/ui/browser_finder.h"
40#include "chrome/browser/ui/browser_instant_controller.h"
41#include "chrome/browser/ui/search/instant_controller.h"
[email protected]4f3b4462013-07-27 19:20:1842#include "chrome/common/net/url_fixer_upper.h"
initial.commit09911bf2008-07-26 23:55:2943#include "chrome/common/pref_names.h"
[email protected]dcf7d352009-02-26 01:56:0244#include "chrome/common/url_constants.h"
[email protected]34ac8f32009-02-22 23:03:2745#include "grit/generated_resources.h"
initial.commit09911bf2008-07-26 23:55:2946#include "net/base/escape.h"
[email protected]d3cf8682f02012-02-29 23:29:3447#include "net/base/load_flags.h"
[email protected]371dab12012-06-01 03:23:5548#include "net/base/net_util.h"
[email protected]bd3b4712012-12-18 17:01:3049#include "net/http/http_request_headers.h"
[email protected]319d9e6f2009-02-18 19:47:2150#include "net/http/http_response_headers.h"
[email protected]3dc1bc42012-06-19 08:20:5351#include "net/url_request/url_fetcher.h"
[email protected]319d9e6f2009-02-18 19:47:2152#include "net/url_request/url_request_status.h"
[email protected]c051a1b2011-01-21 23:30:1753#include "ui/base/l10n/l10n_util.h"
[email protected]761fa4702013-07-02 15:25:1554#include "url/url_util.h"
initial.commit09911bf2008-07-26 23:55:2955
[email protected]bc8bb0cd2013-06-24 21:50:2356
57// Helpers --------------------------------------------------------------------
[email protected]e1acf6f2008-10-27 20:43:3358
[email protected]51124552011-07-16 01:37:1059namespace {
60
// Buckets recorded in the "Omnibox.SuggestRequests" histogram: how many
// suggest requests we send, how many we invalidate (e.g., because the user
// typed another character), and how many replies we receive.
// *** ADD NEW VALUES AFTER ALL PREVIOUSLY DEFINED ONES! ***
// (i.e., immediately before the end-of-list value)
// The numeric value of an existing entry must never change, or else the
// recorded statistics get mixed up.  The values are spelled out explicitly to
// make that harder to do by accident.
enum SuggestRequestsHistogramValue {
  REQUEST_SENT = 1,
  REQUEST_INVALIDATED = 2,
  REPLY_RECEIVED = 3,
  MAX_SUGGEST_REQUEST_HISTOGRAM_VALUE = 4
};
74
// Relevance score of the verbatim match for an input that is not a URL.
const int kNonURLVerbatimRelevance = 1300;
77
[email protected]7706a522012-08-16 17:42:2578// Increments the appropriate value in the histogram by one.
79void LogOmniboxSuggestRequest(
80 SuggestRequestsHistogramValue request_value) {
81 UMA_HISTOGRAM_ENUMERATION("Omnibox.SuggestRequests", request_value,
82 MAX_SUGGEST_REQUEST_HISTOGRAM_VALUE);
83}
84
[email protected]51124552011-07-16 01:37:1085bool HasMultipleWords(const string16& text) {
86 base::i18n::BreakIterator i(text, base::i18n::BreakIterator::BREAK_WORD);
87 bool found_word = false;
88 if (i.Init()) {
89 while (i.Advance()) {
90 if (i.IsWord()) {
91 if (found_word)
92 return true;
93 found_word = true;
94 }
95 }
96 }
97 return false;
98}
99
[email protected]d1f0a7f2012-06-05 10:26:42100} // namespace
[email protected]51124552011-07-16 01:37:10101
[email protected]033f3422012-03-13 21:24:18102
[email protected]3954c3a2012-04-10 20:17:55103// SearchProvider::Providers --------------------------------------------------
[email protected]b547666d2009-04-23 16:37:58104
[email protected]85b8d6f2012-05-08 20:53:47105SearchProvider::Providers::Providers(TemplateURLService* template_url_service)
106 : template_url_service_(template_url_service) {
107}
108
109const TemplateURL* SearchProvider::Providers::GetDefaultProviderURL() const {
110 return default_provider_.empty() ? NULL :
111 template_url_service_->GetTemplateURLForKeyword(default_provider_);
112}
113
114const TemplateURL* SearchProvider::Providers::GetKeywordProviderURL() const {
115 return keyword_provider_.empty() ? NULL :
116 template_url_service_->GetTemplateURLForKeyword(keyword_provider_);
[email protected]257ab712009-04-14 17:16:24117}
118
[email protected]3954c3a2012-04-10 20:17:55119
[email protected]bc8bb0cd2013-06-24 21:50:23120// SearchProvider::Result -----------------------------------------------------
121
122SearchProvider::Result::Result(bool from_keyword_provider,
[email protected]d30268a2013-06-25 22:31:07123 int relevance,
124 bool relevance_from_server)
[email protected]bc8bb0cd2013-06-24 21:50:23125 : from_keyword_provider_(from_keyword_provider),
[email protected]d30268a2013-06-25 22:31:07126 relevance_(relevance),
127 relevance_from_server_(relevance_from_server) {
[email protected]bc8bb0cd2013-06-24 21:50:23128}
129
130SearchProvider::Result::~Result() {
131}
132
133
134// SearchProvider::SuggestResult ----------------------------------------------
135
136SearchProvider::SuggestResult::SuggestResult(const string16& suggestion,
137 bool from_keyword_provider,
[email protected]d30268a2013-06-25 22:31:07138 int relevance,
139 bool relevance_from_server)
140 : Result(from_keyword_provider, relevance, relevance_from_server),
[email protected]bc8bb0cd2013-06-24 21:50:23141 suggestion_(suggestion) {
142}
143
144SearchProvider::SuggestResult::~SuggestResult() {
145}
146
147bool SearchProvider::SuggestResult::IsInlineable(const string16& input) const {
148 return StartsWith(suggestion_, input, false);
149}
150
151int SearchProvider::SuggestResult::CalculateRelevance(
152 const AutocompleteInput& input,
153 bool keyword_provider_requested) const {
154 if (!from_keyword_provider_ && keyword_provider_requested)
155 return 100;
156 return ((input.type() == AutocompleteInput::URL) ? 300 : 600);
157}
158
159
160// SearchProvider::NavigationResult -------------------------------------------
161
162SearchProvider::NavigationResult::NavigationResult(
163 const AutocompleteProvider& provider,
164 const GURL& url,
165 const string16& description,
166 bool from_keyword_provider,
[email protected]d30268a2013-06-25 22:31:07167 int relevance,
168 bool relevance_from_server)
169 : Result(from_keyword_provider, relevance, relevance_from_server),
[email protected]bc8bb0cd2013-06-24 21:50:23170 url_(url),
171 formatted_url_(AutocompleteInput::FormattedStringWithEquivalentMeaning(
172 url, provider.StringForURLDisplay(url, true, false))),
173 description_(description) {
174 DCHECK(url_.is_valid());
175}
176
177SearchProvider::NavigationResult::~NavigationResult() {
178}
179
180bool SearchProvider::NavigationResult::IsInlineable(
181 const string16& input) const {
182 return URLPrefix::BestURLPrefix(formatted_url_, input) != NULL;
183}
184
185int SearchProvider::NavigationResult::CalculateRelevance(
186 const AutocompleteInput& input,
187 bool keyword_provider_requested) const {
188 return (from_keyword_provider_ || !keyword_provider_requested) ? 800 : 150;
189}
190
191
192// SearchProvider::CompareScoredResults ---------------------------------------
193
194class SearchProvider::CompareScoredResults {
195 public:
196 bool operator()(const Result& a, const Result& b) {
197 // Sort in descending relevance order.
198 return a.relevance() > b.relevance();
199 }
200};
201
202
203// SearchProvider::Results ----------------------------------------------------
204
[email protected]d30268a2013-06-25 22:31:07205SearchProvider::Results::Results() : verbatim_relevance(-1) {
[email protected]bc8bb0cd2013-06-24 21:50:23206}
207
208SearchProvider::Results::~Results() {
209}
210
211void SearchProvider::Results::Clear() {
212 suggest_results.clear();
213 navigation_results.clear();
[email protected]bc8bb0cd2013-06-24 21:50:23214 verbatim_relevance = -1;
215}
216
217bool SearchProvider::Results::HasServerProvidedScores() const {
218 if (verbatim_relevance >= 0)
219 return true;
220
[email protected]d30268a2013-06-25 22:31:07221 // Right now either all results of one type will be server-scored or they will
222 // all be locally scored, but in case we change this later, we'll just check
223 // them all.
224 for (SuggestResults::const_iterator i(suggest_results.begin());
225 i != suggest_results.end(); ++i) {
226 if (i->relevance_from_server())
227 return true;
228 }
229 for (NavigationResults::const_iterator i(navigation_results.begin());
230 i != navigation_results.end(); ++i) {
231 if (i->relevance_from_server())
232 return true;
233 }
234
235 return false;
[email protected]bc8bb0cd2013-06-24 21:50:23236}
[email protected]d30268a2013-06-25 22:31:07237
238
[email protected]3954c3a2012-04-10 20:17:55239// SearchProvider -------------------------------------------------------------
240
241// static
242const int SearchProvider::kDefaultProviderURLFetcherID = 1;
[email protected]3954c3a2012-04-10 20:17:55243const int SearchProvider::kKeywordProviderURLFetcherID = 2;
[email protected]24dbf2302013-04-05 16:59:25244int SearchProvider::kMinimumTimeBetweenSuggestQueriesMs = 100;
[email protected]d30268a2013-06-25 22:31:07245const char SearchProvider::kRelevanceFromServerKey[] = "relevance_from_server";
246const char SearchProvider::kTrue[] = "true";
247const char SearchProvider::kFalse[] = "false";
[email protected]3954c3a2012-04-10 20:17:55248
[email protected]bc8bb0cd2013-06-24 21:50:23249SearchProvider::SearchProvider(AutocompleteProviderListener* listener,
250 Profile* profile)
251 : AutocompleteProvider(listener, profile,
252 AutocompleteProvider::TYPE_SEARCH),
253 providers_(TemplateURLServiceFactory::GetForProfile(profile)),
254 suggest_results_pending_(0),
[email protected]bc8bb0cd2013-06-24 21:50:23255 field_trial_triggered_(false),
[email protected]c4a9d4c2013-08-10 07:06:27256 field_trial_triggered_in_session_(false) {
[email protected]bc8bb0cd2013-06-24 21:50:23257}
258
[email protected]cb86ee6f2013-04-28 16:58:15259// static
260AutocompleteMatch SearchProvider::CreateSearchSuggestion(
[email protected]cb86ee6f2013-04-28 16:58:15261 AutocompleteProvider* autocomplete_provider,
[email protected]cb86ee6f2013-04-28 16:58:15262 int relevance,
263 AutocompleteMatch::Type type,
[email protected]bba9e632013-06-28 22:52:19264 const TemplateURL* template_url,
265 const string16& query_string,
266 const string16& input_text,
267 const AutocompleteInput& input,
[email protected]cb86ee6f2013-04-28 16:58:15268 bool is_keyword,
[email protected]bba9e632013-06-28 22:52:19269 int accepted_suggestion,
[email protected]56fa29592013-07-02 20:25:53270 int omnibox_start_margin,
271 bool append_extra_query_params) {
[email protected]cb86ee6f2013-04-28 16:58:15272 AutocompleteMatch match(autocomplete_provider, relevance, false, type);
273
[email protected]bba9e632013-06-28 22:52:19274 if (!template_url)
[email protected]cb86ee6f2013-04-28 16:58:15275 return match;
[email protected]bba9e632013-06-28 22:52:19276 match.keyword = template_url->keyword();
[email protected]cb86ee6f2013-04-28 16:58:15277
278 match.contents.assign(query_string);
279 // We do intra-string highlighting for suggestions - the suggested segment
280 // will be highlighted, e.g. for input_text = "you" the suggestion may be
281 // "youtube", so we'll bold the "tube" section: you*tube*.
282 if (input_text != query_string) {
283 size_t input_position = match.contents.find(input_text);
284 if (input_position == string16::npos) {
285 // The input text is not a substring of the query string, e.g. input
286 // text is "slasdot" and the query string is "slashdot", so we bold the
287 // whole thing.
288 match.contents_class.push_back(
289 ACMatchClassification(0, ACMatchClassification::MATCH));
290 } else {
291 // TODO(beng): ACMatchClassification::MATCH now seems to just mean
292 // "bold" this. Consider modifying the terminology.
293 // We don't iterate over the string here annotating all matches because
294 // it looks odd to have every occurrence of a substring that may be as
295 // short as a single character highlighted in a query suggestion result,
296 // e.g. for input text "s" and query string "southwest airlines", it
297 // looks odd if both the first and last s are highlighted.
298 if (input_position != 0) {
299 match.contents_class.push_back(
[email protected]4b6d916e2013-06-07 05:02:08300 ACMatchClassification(0, ACMatchClassification::MATCH));
[email protected]cb86ee6f2013-04-28 16:58:15301 }
302 match.contents_class.push_back(
[email protected]4b6d916e2013-06-07 05:02:08303 ACMatchClassification(input_position, ACMatchClassification::NONE));
[email protected]cb86ee6f2013-04-28 16:58:15304 size_t next_fragment_position = input_position + input_text.length();
305 if (next_fragment_position < query_string.length()) {
306 match.contents_class.push_back(
307 ACMatchClassification(next_fragment_position,
[email protected]4b6d916e2013-06-07 05:02:08308 ACMatchClassification::MATCH));
[email protected]cb86ee6f2013-04-28 16:58:15309 }
310 }
311 } else {
312 // Otherwise, we're dealing with the "default search" result which has no
313 // completion.
314 match.contents_class.push_back(
315 ACMatchClassification(0, ACMatchClassification::NONE));
316 }
317
318 // When the user forced a query, we need to make sure all the fill_into_edit
319 // values preserve that property. Otherwise, if the user starts editing a
320 // suggestion, non-Search results will suddenly appear.
321 if (input.type() == AutocompleteInput::FORCED_QUERY)
322 match.fill_into_edit.assign(ASCIIToUTF16("?"));
323 if (is_keyword)
324 match.fill_into_edit.append(match.keyword + char16(' '));
325 if (!input.prevent_inline_autocomplete() &&
326 StartsWith(query_string, input_text, false)) {
[email protected]518024c2013-07-19 23:40:25327 match.inline_autocompletion = query_string.substr(input_text.length());
[email protected]cb86ee6f2013-04-28 16:58:15328 }
329 match.fill_into_edit.append(query_string);
330
[email protected]bba9e632013-06-28 22:52:19331 const TemplateURLRef& search_url = template_url->url_ref();
[email protected]cb86ee6f2013-04-28 16:58:15332 DCHECK(search_url.SupportsReplacement());
333 match.search_terms_args.reset(
334 new TemplateURLRef::SearchTermsArgs(query_string));
335 match.search_terms_args->original_query = input_text;
336 match.search_terms_args->accepted_suggestion = accepted_suggestion;
[email protected]f3e46eec2013-06-11 14:46:28337 match.search_terms_args->omnibox_start_margin = omnibox_start_margin;
[email protected]56fa29592013-07-02 20:25:53338 match.search_terms_args->append_extra_query_params =
339 append_extra_query_params;
[email protected]cb86ee6f2013-04-28 16:58:15340 // This is the destination URL sans assisted query stats. This must be set
341 // so the AutocompleteController can properly de-dupe; the controller will
342 // eventually overwrite it before it reaches the user.
343 match.destination_url =
344 GURL(search_url.ReplaceSearchTerms(*match.search_terms_args.get()));
345
346 // Search results don't look like URLs.
347 match.transition = is_keyword ?
348 content::PAGE_TRANSITION_KEYWORD : content::PAGE_TRANSITION_GENERATED;
349
350 return match;
351}
352
[email protected]bc8bb0cd2013-06-24 21:50:23353void SearchProvider::AddProviderInfo(ProvidersInfo* provider_info) const {
354 provider_info->push_back(metrics::OmniboxEventProto_ProviderInfo());
355 metrics::OmniboxEventProto_ProviderInfo& new_entry = provider_info->back();
356 new_entry.set_provider(AsOmniboxEventProviderType());
357 new_entry.set_provider_done(done_);
358 std::vector<uint32> field_trial_hashes;
359 OmniboxFieldTrial::GetActiveSuggestFieldTrialHashes(&field_trial_hashes);
360 for (size_t i = 0; i < field_trial_hashes.size(); ++i) {
361 if (field_trial_triggered_)
362 new_entry.mutable_field_trial_triggered()->Add(field_trial_hashes[i]);
363 if (field_trial_triggered_in_session_) {
364 new_entry.mutable_field_trial_triggered_in_session()->Add(
365 field_trial_hashes[i]);
366 }
367 }
368}
369
370void SearchProvider::ResetSession() {
371 field_trial_triggered_in_session_ = false;
[email protected]4ab4c7c2010-11-24 04:49:34372}
373
[email protected]bc8bb0cd2013-06-24 21:50:23374SearchProvider::~SearchProvider() {
375}
376
377// static
378void SearchProvider::RemoveStaleResults(const string16& input,
379 int verbatim_relevance,
380 SuggestResults* suggest_results,
381 NavigationResults* navigation_results) {
382 DCHECK_GE(verbatim_relevance, 0);
383 // Keep pointers to the head of (the highest scoring elements of)
384 // |suggest_results| and |navigation_results|. Iterate down the lists
385 // removing non-inlineable results in order of decreasing relevance
386 // scores. Stop when the highest scoring element among those remaining
387 // is inlineable or the element is less than |verbatim_relevance|.
388 // This allows non-inlineable lower-scoring results to remain
389 // because (i) they are guaranteed to not be inlined and (ii)
390 // letting them remain reduces visual jank. For instance, as the
391 // user types the mis-spelled query "fpobar" (for foobar), the
392 // suggestion "foobar" will be suggested on every keystroke. If the
393 // SearchProvider always removes all non-inlineable results, the user will
394 // see visual jitter/jank as the result disappears and re-appears moments
395 // later as the suggest server returns results.
396 SuggestResults::iterator sug_it = suggest_results->begin();
397 NavigationResults::iterator nav_it = navigation_results->begin();
398 while ((sug_it != suggest_results->end()) ||
399 (nav_it != navigation_results->end())) {
400 const int sug_rel =
401 (sug_it != suggest_results->end()) ? sug_it->relevance() : -1;
402 const int nav_rel =
403 (nav_it != navigation_results->end()) ? nav_it->relevance() : -1;
404 if (std::max(sug_rel, nav_rel) < verbatim_relevance)
405 break;
406 if (sug_rel > nav_rel) {
407 // The current top result is a search suggestion.
408 if (sug_it->IsInlineable(input))
409 break;
410 sug_it = suggest_results->erase(sug_it);
411 } else if (sug_rel == nav_rel) {
412 // Have both results and they're tied.
413 const bool sug_inlineable = sug_it->IsInlineable(input);
414 const bool nav_inlineable = nav_it->IsInlineable(input);
415 if (!sug_inlineable)
416 sug_it = suggest_results->erase(sug_it);
417 if (!nav_inlineable)
418 nav_it = navigation_results->erase(nav_it);
419 if (sug_inlineable || nav_inlineable)
420 break;
421 } else {
422 // The current top result is a navigational suggestion.
423 if (nav_it->IsInlineable(input))
424 break;
425 nav_it = navigation_results->erase(nav_it);
426 }
427 }
428}
429
430// static
431int SearchProvider::CalculateRelevanceForKeywordVerbatim(
432 AutocompleteInput::Type type,
433 bool prefer_keyword) {
434 // This function is responsible for scoring verbatim query matches
435 // for non-extension keywords. KeywordProvider::CalculateRelevance()
436 // scores verbatim query matches for extension keywords, as well as
437 // for keyword matches (i.e., suggestions of a keyword itself, not a
438 // suggestion of a query on a keyword search engine). These two
439 // functions are currently in sync, but there's no reason we
440 // couldn't decide in the future to score verbatim matches
441 // differently for extension and non-extension keywords. If you
442 // make such a change, however, you should update this comment to
443 // describe it, so it's clear why the functions diverge.
444 if (prefer_keyword)
445 return 1500;
446 return (type == AutocompleteInput::QUERY) ? 1450 : 1100;
447}
448
initial.commit09911bf2008-07-26 23:55:29449void SearchProvider::Start(const AutocompleteInput& input,
[email protected]8deeb952008-10-09 18:21:27450 bool minimal_changes) {
[email protected]04504c242013-01-22 21:08:55451 // Do our best to load the model as early as possible. This will reduce
452 // odds of having the model not ready when really needed (a non-empty input).
453 TemplateURLService* model = providers_.template_url_service();
454 DCHECK(model);
455 model->Load();
456
initial.commit09911bf2008-07-26 23:55:29457 matches_.clear();
[email protected]618d6e62012-12-16 05:55:57458 field_trial_triggered_ = false;
initial.commit09911bf2008-07-26 23:55:29459
[email protected]6c85aa02009-02-27 12:08:09460 // Can't return search/suggest results for bogus input or without a profile.
initial.commit09911bf2008-07-26 23:55:29461 if (!profile_ || (input.type() == AutocompleteInput::INVALID)) {
[email protected]e29249dc52012-07-19 17:33:50462 Stop(false);
initial.commit09911bf2008-07-26 23:55:29463 return;
464 }
465
[email protected]14710852013-02-05 23:45:41466 keyword_input_ = input;
[email protected]257ab712009-04-14 17:16:24467 const TemplateURL* keyword_provider =
[email protected]14710852013-02-05 23:45:41468 KeywordProvider::GetSubstitutingTemplateURLForInput(model,
469 &keyword_input_);
470 if (keyword_provider == NULL)
471 keyword_input_.Clear();
472 else if (keyword_input_.text().empty())
[email protected]257ab712009-04-14 17:16:24473 keyword_provider = NULL;
[email protected]257ab712009-04-14 17:16:24474
[email protected]85b8d6f2012-05-08 20:53:47475 const TemplateURL* default_provider = model->GetDefaultSearchProvider();
[email protected]9b74ab52012-03-30 16:08:07476 if (default_provider && !default_provider->SupportsReplacement())
[email protected]257ab712009-04-14 17:16:24477 default_provider = NULL;
478
479 if (keyword_provider == default_provider)
[email protected]e17511f2011-07-13 14:09:18480 default_provider = NULL; // No use in querying the same provider twice.
[email protected]257ab712009-04-14 17:16:24481
482 if (!default_provider && !keyword_provider) {
483 // No valid providers.
[email protected]e29249dc52012-07-19 17:33:50484 Stop(false);
initial.commit09911bf2008-07-26 23:55:29485 return;
486 }
487
488 // If we're still running an old query but have since changed the query text
[email protected]257ab712009-04-14 17:16:24489 // or the providers, abort the query.
[email protected]85b8d6f2012-05-08 20:53:47490 string16 default_provider_keyword(default_provider ?
491 default_provider->keyword() : string16());
492 string16 keyword_provider_keyword(keyword_provider ?
493 keyword_provider->keyword() : string16());
[email protected]9e789742011-01-10 23:27:32494 if (!minimal_changes ||
[email protected]85b8d6f2012-05-08 20:53:47495 !providers_.equal(default_provider_keyword, keyword_provider_keyword)) {
[email protected]bb900e02013-03-14 14:15:29496 // Cancel any in-flight suggest requests.
[email protected]e1290ee62013-06-26 18:31:15497 if (!done_)
[email protected]e29249dc52012-07-19 17:33:50498 Stop(false);
[email protected]257ab712009-04-14 17:16:24499 }
initial.commit09911bf2008-07-26 23:55:29500
[email protected]85b8d6f2012-05-08 20:53:47501 providers_.set(default_provider_keyword, keyword_provider_keyword);
initial.commit09911bf2008-07-26 23:55:29502
503 if (input.text().empty()) {
504 // User typed "?" alone. Give them a placeholder result indicating what
505 // this syntax does.
[email protected]257ab712009-04-14 17:16:24506 if (default_provider) {
[email protected]69c579e2010-04-23 20:01:00507 AutocompleteMatch match;
508 match.provider = this;
[email protected]a2fedb1e2011-01-25 15:23:36509 match.contents.assign(l10n_util::GetStringUTF16(IDS_EMPTY_KEYWORD_VALUE));
[email protected]257ab712009-04-14 17:16:24510 match.contents_class.push_back(
[email protected]2c33dd22010-02-11 21:46:35511 ACMatchClassification(0, ACMatchClassification::NONE));
[email protected]85b8d6f2012-05-08 20:53:47512 match.keyword = providers_.default_provider();
[email protected]257ab712009-04-14 17:16:24513 matches_.push_back(match);
514 }
[email protected]e29249dc52012-07-19 17:33:50515 Stop(false);
initial.commit09911bf2008-07-26 23:55:29516 return;
517 }
518
519 input_ = input;
520
[email protected]e1290ee62013-06-26 18:31:15521 DoHistoryQuery(minimal_changes);
522 StartOrStopSuggestQuery(minimal_changes);
[email protected]344946a12012-12-20 12:03:42523 UpdateMatches();
initial.commit09911bf2008-07-26 23:55:29524}
525
[email protected]e29249dc52012-07-19 17:33:50526void SearchProvider::Stop(bool clear_cached_results) {
initial.commit09911bf2008-07-26 23:55:29527 StopSuggest();
528 done_ = true;
[email protected]e29249dc52012-07-19 17:33:50529
530 if (clear_cached_results)
[email protected]71b46152013-05-03 16:39:20531 ClearAllResults();
initial.commit09911bf2008-07-26 23:55:29532}
533
[email protected]10c2d692012-05-11 05:32:23534void SearchProvider::OnURLFetchComplete(const net::URLFetcher* source) {
initial.commit09911bf2008-07-26 23:55:29535 DCHECK(!done_);
[email protected]257ab712009-04-14 17:16:24536 suggest_results_pending_--;
[email protected]7706a522012-08-16 17:42:25537 LogOmniboxSuggestRequest(REPLY_RECEIVED);
[email protected]1cb2dac2010-03-08 21:49:15538 DCHECK_GE(suggest_results_pending_, 0); // Should never go negative.
[email protected]ec9207d32008-09-26 00:51:06539 const net::HttpResponseHeaders* const response_headers =
[email protected]7cc6e5632011-10-25 17:56:12540 source->GetResponseHeaders();
[email protected]c530c852011-10-24 18:18:34541 std::string json_data;
542 source->GetResponseAsString(&json_data);
[email protected]6c85aa02009-02-27 12:08:09543 // JSON is supposed to be UTF-8, but some suggest service providers send JSON
544 // files in non-UTF-8 encodings. The actual encoding is usually specified in
545 // the Content-Type header field.
[email protected]ec9207d32008-09-26 00:51:06546 if (response_headers) {
547 std::string charset;
548 if (response_headers->GetCharset(&charset)) {
[email protected]a2fedb1e2011-01-25 15:23:36549 string16 data_16;
[email protected]ec9207d32008-09-26 00:51:06550 // TODO(jungshik): Switch to CodePageToUTF8 after it's added.
[email protected]c530c852011-10-24 18:18:34551 if (base::CodepageToUTF16(json_data, charset.c_str(),
[email protected]a2fedb1e2011-01-25 15:23:36552 base::OnStringConversionError::FAIL,
553 &data_16))
554 json_data = UTF16ToUTF8(data_16);
[email protected]ec9207d32008-09-26 00:51:06555 }
556 }
557
[email protected]d7ad4772012-06-01 03:12:54558 const bool is_keyword = (source == keyword_fetcher_.get());
[email protected]f2916ea2013-01-26 02:20:14559 // Ensure the request succeeded and that the provider used is still available.
560 // A verbatim match cannot be generated without this provider, causing errors.
[email protected]013e9a02012-05-18 20:27:10561 const bool request_succeeded =
[email protected]bc8bb0cd2013-06-24 21:50:23562 source->GetStatus().is_success() && (source->GetResponseCode() == 200) &&
563 (is_keyword ?
564 providers_.GetKeywordProviderURL() :
565 providers_.GetDefaultProviderURL());
[email protected]a0ad93ea2012-05-07 22:11:53566
567 // Record response time for suggest requests sent to Google. We care
568 // only about the common case: the Google default provider used in
569 // non-keyword mode.
[email protected]85b8d6f2012-05-08 20:53:47570 const TemplateURL* default_url = providers_.GetDefaultProviderURL();
[email protected]55ce8f12012-05-09 04:44:08571 if (!is_keyword && default_url &&
[email protected]9899a612012-08-21 23:50:04572 (TemplateURLPrepopulateData::GetEngineType(default_url->url()) ==
573 SEARCH_ENGINE_GOOGLE)) {
[email protected]bc8bb0cd2013-06-24 21:50:23574 const base::TimeDelta elapsed_time =
[email protected]013e9a02012-05-18 20:27:10575 base::TimeTicks::Now() - time_suggest_request_sent_;
576 if (request_succeeded) {
577 UMA_HISTOGRAM_TIMES("Omnibox.SuggestRequest.Success.GoogleResponseTime",
578 elapsed_time);
579 } else {
580 UMA_HISTOGRAM_TIMES("Omnibox.SuggestRequest.Failure.GoogleResponseTime",
581 elapsed_time);
582 }
[email protected]b4cebf82008-12-29 19:59:08583 }
584
[email protected]d7ad4772012-06-01 03:12:54585 bool results_updated = false;
586 if (request_succeeded) {
587 JSONStringValueSerializer deserializer(json_data);
588 deserializer.set_allow_trailing_comma(true);
589 scoped_ptr<Value> data(deserializer.Deserialize(NULL, NULL));
590 results_updated = data.get() && ParseSuggestResults(data.get(), is_keyword);
591 }
592
[email protected]344946a12012-12-20 12:03:42593 UpdateMatches();
[email protected]d7ad4772012-06-01 03:12:54594 if (done_ || results_updated)
595 listener_->OnProviderUpdate(results_updated);
initial.commit09911bf2008-07-26 23:55:29596}
597
[email protected]bc8bb0cd2013-06-24 21:50:23598void SearchProvider::Run() {
599 // Start a new request with the current input.
600 suggest_results_pending_ = 0;
601 time_suggest_request_sent_ = base::TimeTicks::Now();
[email protected]abe441e2013-05-06 12:35:05602
[email protected]bc8bb0cd2013-06-24 21:50:23603 default_fetcher_.reset(CreateSuggestFetcher(kDefaultProviderURLFetcherID,
604 providers_.GetDefaultProviderURL(), input_));
605 keyword_fetcher_.reset(CreateSuggestFetcher(kKeywordProviderURLFetcherID,
606 providers_.GetKeywordProviderURL(), keyword_input_));
607
608 // Both the above can fail if the providers have been modified or deleted
609 // since the query began.
610 if (suggest_results_pending_ == 0) {
611 UpdateDone();
612 // We only need to update the listener if we're actually done.
613 if (done_)
614 listener_->OnProviderUpdate(false);
615 }
[email protected]601858c02010-09-01 17:08:20616}
617
[email protected]8d457132010-11-04 18:13:40618void SearchProvider::DoHistoryQuery(bool minimal_changes) {
619 // The history query results are synchronous, so if minimal_changes is true,
620 // we still have the last results and don't need to do anything.
621 if (minimal_changes)
initial.commit09911bf2008-07-26 23:55:29622 return;
623
[email protected]8d457132010-11-04 18:13:40624 keyword_history_results_.clear();
625 default_history_results_.clear();
initial.commit09911bf2008-07-26 23:55:29626
[email protected]78e5e432013-08-03 02:10:10627 if (OmniboxFieldTrial::SearchHistoryDisable(
628 input_.current_page_classification()))
[email protected]d8cd76b2013-07-10 09:46:16629 return;
630
[email protected]8d457132010-11-04 18:13:40631 HistoryService* const history_service =
[email protected]9d2db762012-06-19 00:01:10632 HistoryServiceFactory::GetForProfile(profile_, Profile::EXPLICIT_ACCESS);
[email protected]8d457132010-11-04 18:13:40633 history::URLDatabase* url_db = history_service ?
634 history_service->InMemoryDatabase() : NULL;
635 if (!url_db)
initial.commit09911bf2008-07-26 23:55:29636 return;
637
[email protected]51124552011-07-16 01:37:10638 // Request history for both the keyword and default provider. We grab many
639 // more matches than we'll ultimately clamp to so that if there are several
640 // recent multi-word matches who scores are lowered (see
641 // AddHistoryResultsToMap()), they won't crowd out older, higher-scoring
642 // matches. Note that this doesn't fix the problem entirely, but merely
643 // limits it to cases with a very large number of such multi-word matches; for
644 // now, this seems OK compared with the complexity of a real fix, which would
645 // require multiple searches and tracking of "single- vs. multi-word" in the
646 // database.
647 int num_matches = kMaxMatches * 5;
[email protected]85b8d6f2012-05-08 20:53:47648 const TemplateURL* default_url = providers_.GetDefaultProviderURL();
649 if (default_url) {
650 url_db->GetMostRecentKeywordSearchTerms(default_url->id(), input_.text(),
651 num_matches, &default_history_results_);
[email protected]257ab712009-04-14 17:16:24652 }
[email protected]85b8d6f2012-05-08 20:53:47653 const TemplateURL* keyword_url = providers_.GetKeywordProviderURL();
654 if (keyword_url) {
655 url_db->GetMostRecentKeywordSearchTerms(keyword_url->id(),
[email protected]14710852013-02-05 23:45:41656 keyword_input_.text(), num_matches, &keyword_history_results_);
[email protected]3954c3a2012-04-10 20:17:55657 }
initial.commit09911bf2008-07-26 23:55:29658}
659
[email protected]6dc950f2012-07-16 19:49:08660void SearchProvider::StartOrStopSuggestQuery(bool minimal_changes) {
[email protected]83c726482008-09-10 06:36:34661 if (!IsQuerySuitableForSuggest()) {
initial.commit09911bf2008-07-26 23:55:29662 StopSuggest();
[email protected]71b46152013-05-03 16:39:20663 ClearAllResults();
initial.commit09911bf2008-07-26 23:55:29664 return;
665 }
666
667 // For the minimal_changes case, if we finished the previous query and still
668 // have its results, or are allowed to keep running it, just do that, rather
669 // than starting a new query.
670 if (minimal_changes &&
[email protected]cc1526e2013-05-17 04:04:24671 (!default_results_.suggest_results.empty() ||
672 !default_results_.navigation_results.empty() ||
673 !keyword_results_.suggest_results.empty() ||
674 !keyword_results_.navigation_results.empty() ||
[email protected]ea3b9a502011-04-04 14:19:37675 (!done_ &&
676 input_.matches_requested() == AutocompleteInput::ALL_MATCHES)))
initial.commit09911bf2008-07-26 23:55:29677 return;
678
679 // We can't keep running any previous query, so halt it.
680 StopSuggest();
[email protected]d1f0a7f2012-06-05 10:26:42681
682 // Remove existing results that cannot inline autocomplete the new input.
[email protected]71b46152013-05-03 16:39:20683 RemoveAllStaleResults();
initial.commit09911bf2008-07-26 23:55:29684
685 // We can't start a new query if we're only allowed synchronous results.
[email protected]ea3b9a502011-04-04 14:19:37686 if (input_.matches_requested() != AutocompleteInput::ALL_MATCHES)
initial.commit09911bf2008-07-26 23:55:29687 return;
688
[email protected]24dbf2302013-04-05 16:59:25689 // To avoid flooding the suggest server, don't send a query until at
690 // least 100 ms since the last query.
[email protected]515ffa942012-11-27 20:18:24691 base::TimeTicks next_suggest_time(time_suggest_request_sent_ +
[email protected]bc8bb0cd2013-06-24 21:50:23692 base::TimeDelta::FromMilliseconds(kMinimumTimeBetweenSuggestQueriesMs));
[email protected]515ffa942012-11-27 20:18:24693 base::TimeTicks now(base::TimeTicks::Now());
694 if (now >= next_suggest_time) {
695 Run();
696 return;
697 }
698 timer_.Start(FROM_HERE, next_suggest_time - now, this, &SearchProvider::Run);
initial.commit09911bf2008-07-26 23:55:29699}
700
[email protected]83c726482008-09-10 06:36:34701bool SearchProvider::IsQuerySuitableForSuggest() const {
[email protected]3954c3a2012-04-10 20:17:55702 // Don't run Suggest in incognito mode, if the engine doesn't support it, or
703 // if the user has disabled it.
[email protected]85b8d6f2012-05-08 20:53:47704 const TemplateURL* default_url = providers_.GetDefaultProviderURL();
705 const TemplateURL* keyword_url = providers_.GetKeywordProviderURL();
[email protected]83c726482008-09-10 06:36:34706 if (profile_->IsOffTheRecord() ||
[email protected]85b8d6f2012-05-08 20:53:47707 ((!default_url || default_url->suggestions_url().empty()) &&
708 (!keyword_url || keyword_url->suggestions_url().empty())) ||
[email protected]83c726482008-09-10 06:36:34709 !profile_->GetPrefs()->GetBoolean(prefs::kSearchSuggestEnabled))
710 return false;
711
[email protected]cac59d32010-08-09 23:23:14712 // If the input type might be a URL, we take extra care so that private data
[email protected]83c726482008-09-10 06:36:34713 // isn't sent to the server.
[email protected]83c726482008-09-10 06:36:34714
[email protected]cac59d32010-08-09 23:23:14715 // FORCED_QUERY means the user is explicitly asking us to search for this, so
716 // we assume it isn't a URL and/or there isn't private data.
717 if (input_.type() == AutocompleteInput::FORCED_QUERY)
718 return true;
[email protected]83c726482008-09-10 06:36:34719
[email protected]f608ea102013-03-18 15:08:09720 // Next we check the scheme. If this is UNKNOWN/URL with a scheme that isn't
721 // http/https/ftp, we shouldn't send it. Sending things like file: and data:
722 // is both a waste of time and a disclosure of potentially private, local
723 // data. Other "schemes" may actually be usernames, and we don't want to send
724 // passwords. If the scheme is OK, we still need to check other cases below.
725 // If this is QUERY, then the presence of these schemes means the user
726 // explicitly typed one, and thus this is probably a URL that's being entered
727 // and happens to currently be invalid -- in which case we again want to run
728 // our checks below. Other QUERY cases are less likely to be URLs and thus we
729 // assume we're OK.
[email protected]a2fedb1e2011-01-25 15:23:36730 if (!LowerCaseEqualsASCII(input_.scheme(), chrome::kHttpScheme) &&
731 !LowerCaseEqualsASCII(input_.scheme(), chrome::kHttpsScheme) &&
732 !LowerCaseEqualsASCII(input_.scheme(), chrome::kFtpScheme))
[email protected]cac59d32010-08-09 23:23:14733 return (input_.type() == AutocompleteInput::QUERY);
734
735 // Don't send URLs with usernames, queries or refs. Some of these are
736 // private, and the Suggest server is unlikely to have any useful results
737 // for any of them. Also don't send URLs with ports, as we may initially
738 // think that a username + password is a host + port (and we don't want to
739 // send usernames/passwords), and even if the port really is a port, the
740 // server is once again unlikely to have and useful results.
741 const url_parse::Parsed& parts = input_.parts();
742 if (parts.username.is_nonempty() || parts.port.is_nonempty() ||
743 parts.query.is_nonempty() || parts.ref.is_nonempty())
744 return false;
745
746 // Don't send anything for https except the hostname. Hostnames are OK
747 // because they are visible when the TCP connection is established, but the
748 // specific path may reveal private information.
[email protected]a2fedb1e2011-01-25 15:23:36749 if (LowerCaseEqualsASCII(input_.scheme(), chrome::kHttpsScheme) &&
750 parts.path.is_nonempty())
[email protected]cac59d32010-08-09 23:23:14751 return false;
[email protected]83c726482008-09-10 06:36:34752
753 return true;
754}
755
initial.commit09911bf2008-07-26 23:55:29756void SearchProvider::StopSuggest() {
[email protected]7706a522012-08-16 17:42:25757 // Increment the appropriate field in the histogram by the number of
758 // pending requests that were invalidated.
759 for (int i = 0; i < suggest_results_pending_; i++)
760 LogOmniboxSuggestRequest(REQUEST_INVALIDATED);
[email protected]257ab712009-04-14 17:16:24761 suggest_results_pending_ = 0;
[email protected]2d316662008-09-03 18:18:14762 timer_.Stop();
[email protected]257ab712009-04-14 17:16:24763 // Stop any in-progress URL fetches.
764 keyword_fetcher_.reset();
765 default_fetcher_.reset();
[email protected]55ce8f12012-05-09 04:44:08766}
767
[email protected]71b46152013-05-03 16:39:20768void SearchProvider::ClearAllResults() {
[email protected]cc1526e2013-05-17 04:04:24769 keyword_results_.Clear();
770 default_results_.Clear();
[email protected]1e1550e2013-05-02 17:37:51771}
772
[email protected]71b46152013-05-03 16:39:20773void SearchProvider::RemoveAllStaleResults() {
[email protected]1e1550e2013-05-02 17:37:51774 // In theory it would be better to run an algorithm like that in
775 // RemoveStaleResults(...) below that uses all four results lists
776 // and both verbatim scores at once. However, that will be much
777 // more complicated for little obvious gain. For code simplicity
778 // and ease in reasoning about the invariants involved, this code
779 // removes stales results from the keyword provider and default
780 // provider independently.
[email protected]d30268a2013-06-25 22:31:07781 RemoveStaleResults(input_.text(), GetVerbatimRelevance(NULL),
[email protected]cc1526e2013-05-17 04:04:24782 &default_results_.suggest_results,
783 &default_results_.navigation_results);
[email protected]1e1550e2013-05-02 17:37:51784 if (!keyword_input_.text().empty()) {
[email protected]d30268a2013-06-25 22:31:07785 RemoveStaleResults(keyword_input_.text(), GetKeywordVerbatimRelevance(NULL),
[email protected]cc1526e2013-05-17 04:04:24786 &keyword_results_.suggest_results,
787 &keyword_results_.navigation_results);
[email protected]1e1550e2013-05-02 17:37:51788 } else {
789 // User is either in keyword mode with a blank input or out of
790 // keyword mode entirely.
[email protected]cc1526e2013-05-17 04:04:24791 keyword_results_.Clear();
[email protected]1e1550e2013-05-02 17:37:51792 }
[email protected]d1f0a7f2012-06-05 10:26:42793}
794
[email protected]d1f0a7f2012-06-05 10:26:42795void SearchProvider::ApplyCalculatedRelevance() {
[email protected]cc1526e2013-05-17 04:04:24796 ApplyCalculatedSuggestRelevance(&keyword_results_.suggest_results);
797 ApplyCalculatedSuggestRelevance(&default_results_.suggest_results);
798 ApplyCalculatedNavigationRelevance(&keyword_results_.navigation_results);
799 ApplyCalculatedNavigationRelevance(&default_results_.navigation_results);
[email protected]cc1526e2013-05-17 04:04:24800 default_results_.verbatim_relevance = -1;
801 keyword_results_.verbatim_relevance = -1;
[email protected]d1f0a7f2012-06-05 10:26:42802}
803
[email protected]188b50c2013-03-28 07:19:42804void SearchProvider::ApplyCalculatedSuggestRelevance(SuggestResults* list) {
[email protected]d1f0a7f2012-06-05 10:26:42805 for (size_t i = 0; i < list->size(); ++i) {
[email protected]188b50c2013-03-28 07:19:42806 SuggestResult& result = (*list)[i];
807 result.set_relevance(
808 result.CalculateRelevance(input_, providers_.has_keyword_provider()) +
809 (list->size() - i - 1));
[email protected]d30268a2013-06-25 22:31:07810 result.set_relevance_from_server(false);
[email protected]d1f0a7f2012-06-05 10:26:42811 }
812}
813
[email protected]188b50c2013-03-28 07:19:42814void SearchProvider::ApplyCalculatedNavigationRelevance(
815 NavigationResults* list) {
[email protected]d1f0a7f2012-06-05 10:26:42816 for (size_t i = 0; i < list->size(); ++i) {
[email protected]188b50c2013-03-28 07:19:42817 NavigationResult& result = (*list)[i];
818 result.set_relevance(
819 result.CalculateRelevance(input_, providers_.has_keyword_provider()) +
820 (list->size() - i - 1));
[email protected]d30268a2013-06-25 22:31:07821 result.set_relevance_from_server(false);
[email protected]d1f0a7f2012-06-05 10:26:42822 }
823}
824
[email protected]15fb2aa2012-05-22 22:52:59825net::URLFetcher* SearchProvider::CreateSuggestFetcher(
[email protected]7cc6e5632011-10-25 17:56:12826 int id,
[email protected]9ff91722012-09-07 05:29:12827 const TemplateURL* template_url,
[email protected]14710852013-02-05 23:45:41828 const AutocompleteInput& input) {
[email protected]9ff91722012-09-07 05:29:12829 if (!template_url || template_url->suggestions_url().empty())
830 return NULL;
831
832 // Bail if the suggestion URL is invalid with the given replacements.
[email protected]14710852013-02-05 23:45:41833 TemplateURLRef::SearchTermsArgs search_term_args(input.text());
834 search_term_args.cursor_position = input.cursor_position();
[email protected]d5015ca2013-08-08 22:04:18835 search_term_args.page_classification = input.current_page_classification();
[email protected]9ff91722012-09-07 05:29:12836 GURL suggest_url(template_url->suggestions_url_ref().ReplaceSearchTerms(
[email protected]00790562012-12-14 09:57:16837 search_term_args));
[email protected]9ff91722012-09-07 05:29:12838 if (!suggest_url.is_valid())
839 return NULL;
840
841 suggest_results_pending_++;
842 LogOmniboxSuggestRequest(REQUEST_SENT);
843
844 net::URLFetcher* fetcher =
845 net::URLFetcher::Create(id, suggest_url, net::URLFetcher::GET, this);
[email protected]7cc6e5632011-10-25 17:56:12846 fetcher->SetRequestContext(profile_->GetRequestContext());
[email protected]d3cf8682f02012-02-29 23:29:34847 fetcher->SetLoadFlags(net::LOAD_DO_NOT_SAVE_COOKIES);
[email protected]bd3b4712012-12-18 17:01:30848 // Add Chrome experiment state to the request headers.
849 net::HttpRequestHeaders headers;
[email protected]ab7780792013-01-10 01:26:09850 chrome_variations::VariationsHttpHeaderProvider::GetInstance()->AppendHeaders(
[email protected]bd3b4712012-12-18 17:01:30851 fetcher->GetOriginalURL(), profile_->IsOffTheRecord(), false, &headers);
852 fetcher->SetExtraRequestHeaders(headers.ToString());
[email protected]257ab712009-04-14 17:16:24853 fetcher->Start();
854 return fetcher;
855}
856
[email protected]d7ad4772012-06-01 03:12:54857bool SearchProvider::ParseSuggestResults(Value* root_val, bool is_keyword) {
[email protected]d7ad4772012-06-01 03:12:54858 string16 query;
859 ListValue* root_list = NULL;
[email protected]cc1526e2013-05-17 04:04:24860 ListValue* results_list = NULL;
[email protected]14710852013-02-05 23:45:41861 const string16& input_text =
862 is_keyword ? keyword_input_.text() : input_.text();
[email protected]d7ad4772012-06-01 03:12:54863 if (!root_val->GetAsList(&root_list) || !root_list->GetString(0, &query) ||
[email protected]cc1526e2013-05-17 04:04:24864 (query != input_text) || !root_list->GetList(1, &results_list))
initial.commit09911bf2008-07-26 23:55:29865 return false;
866
[email protected]55ce8f12012-05-09 04:44:08867 // 3rd element: Description list.
[email protected]d7ad4772012-06-01 03:12:54868 ListValue* descriptions = NULL;
869 root_list->GetList(2, &descriptions);
initial.commit09911bf2008-07-26 23:55:29870
[email protected]55ce8f12012-05-09 04:44:08871 // 4th element: Disregard the query URL list for now.
initial.commit09911bf2008-07-26 23:55:29872
[email protected]d1f0a7f2012-06-05 10:26:42873 // Reset suggested relevance information from the default provider.
[email protected]cc1526e2013-05-17 04:04:24874 Results* results = is_keyword ? &keyword_results_ : &default_results_;
[email protected]cc1526e2013-05-17 04:04:24875 results->verbatim_relevance = -1;
[email protected]d1f0a7f2012-06-05 10:26:42876
[email protected]55ce8f12012-05-09 04:44:08877 // 5th element: Optional key-value pairs from the Suggest server.
[email protected]d7ad4772012-06-01 03:12:54878 ListValue* types = NULL;
[email protected]d1f0a7f2012-06-05 10:26:42879 ListValue* relevances = NULL;
880 DictionaryValue* extras = NULL;
881 if (root_list->GetDictionary(4, &extras)) {
882 extras->GetList("google:suggesttype", &types);
883
[email protected]eb8330d2013-06-15 00:55:08884 // Discard this list if its size does not match that of the suggestions.
885 if (extras->GetList("google:suggestrelevance", &relevances) &&
886 relevances->GetSize() != results_list->GetSize())
887 relevances = NULL;
888 extras->GetInteger("google:verbatimrelevance",
889 &results->verbatim_relevance);
[email protected]618d6e62012-12-16 05:55:57890
891 // Check if the active suggest field trial (if any) has triggered either
892 // for the default provider or keyword provider.
893 bool triggered = false;
894 extras->GetBoolean("google:fieldtrialtriggered", &triggered);
895 field_trial_triggered_ |= triggered;
896 field_trial_triggered_in_session_ |= triggered;
initial.commit09911bf2008-07-26 23:55:29897 }
898
[email protected]d1f0a7f2012-06-05 10:26:42899 // Clear the previous results now that new results are available.
[email protected]cc1526e2013-05-17 04:04:24900 results->suggest_results.clear();
901 results->navigation_results.clear();
[email protected]d1f0a7f2012-06-05 10:26:42902
903 string16 result, title;
904 std::string type;
905 int relevance = -1;
[email protected]cc1526e2013-05-17 04:04:24906 for (size_t index = 0; results_list->GetString(index, &result); ++index) {
[email protected]8e81f5092010-09-29 23:19:40907 // Google search may return empty suggestions for weird input characters,
[email protected]55ce8f12012-05-09 04:44:08908 // they make no sense at all and can cause problems in our code.
[email protected]d7ad4772012-06-01 03:12:54909 if (result.empty())
[email protected]8e81f5092010-09-29 23:19:40910 continue;
911
[email protected]d1f0a7f2012-06-05 10:26:42912 // Apply valid suggested relevance scores; discard invalid lists.
913 if (relevances != NULL && !relevances->GetInteger(index, &relevance))
914 relevances = NULL;
[email protected]d7ad4772012-06-01 03:12:54915 if (types && types->GetString(index, &type) && (type == "NAVIGATION")) {
[email protected]d1f0a7f2012-06-05 10:26:42916 // Do not blindly trust the URL coming from the server to be valid.
917 GURL url(URLFixerUpper::FixupURL(UTF16ToUTF8(result), std::string()));
918 if (url.is_valid()) {
919 if (descriptions != NULL)
920 descriptions->GetString(index, &title);
[email protected]d30268a2013-06-25 22:31:07921 results->navigation_results.push_back(NavigationResult(
922 *this, url, title, is_keyword, relevance, true));
initial.commit09911bf2008-07-26 23:55:29923 }
924 } else {
[email protected]d1f0a7f2012-06-05 10:26:42925 // TODO(kochi): Improve calculator result presentation.
[email protected]cc1526e2013-05-17 04:04:24926 results->suggest_results.push_back(
[email protected]d30268a2013-06-25 22:31:07927 SuggestResult(result, is_keyword, relevance, true));
initial.commit09911bf2008-07-26 23:55:29928 }
929 }
930
[email protected]d1f0a7f2012-06-05 10:26:42931 // Apply calculated relevance scores if a valid list was not provided.
932 if (relevances == NULL) {
[email protected]cc1526e2013-05-17 04:04:24933 ApplyCalculatedSuggestRelevance(&results->suggest_results);
934 ApplyCalculatedNavigationRelevance(&results->navigation_results);
[email protected]d1f0a7f2012-06-05 10:26:42935 }
[email protected]9dfb4d362013-04-05 02:15:12936 // Keep the result lists sorted.
937 const CompareScoredResults comparator = CompareScoredResults();
[email protected]cc1526e2013-05-17 04:04:24938 std::stable_sort(results->suggest_results.begin(),
939 results->suggest_results.end(),
[email protected]9dfb4d362013-04-05 02:15:12940 comparator);
[email protected]cc1526e2013-05-17 04:04:24941 std::stable_sort(results->navigation_results.begin(),
942 results->navigation_results.end(),
[email protected]9dfb4d362013-04-05 02:15:12943 comparator);
[email protected]d1f0a7f2012-06-05 10:26:42944 return true;
initial.commit09911bf2008-07-26 23:55:29945}
946
[email protected]344946a12012-12-20 12:03:42947void SearchProvider::ConvertResultsToAutocompleteMatches() {
initial.commit09911bf2008-07-26 23:55:29948 // Convert all the results to matches and add them to a map, so we can keep
949 // the most relevant match for each result.
950 MatchMap map;
[email protected]bc8bb0cd2013-06-24 21:50:23951 const base::Time no_time;
[email protected]cc1526e2013-05-17 04:04:24952 int did_not_accept_keyword_suggestion =
953 keyword_results_.suggest_results.empty() ?
initial.commit09911bf2008-07-26 23:55:29954 TemplateURLRef::NO_SUGGESTIONS_AVAILABLE :
955 TemplateURLRef::NO_SUGGESTION_CHOSEN;
initial.commit09911bf2008-07-26 23:55:29956
[email protected]d30268a2013-06-25 22:31:07957 bool relevance_from_server;
958 int verbatim_relevance = GetVerbatimRelevance(&relevance_from_server);
[email protected]cc1526e2013-05-17 04:04:24959 int did_not_accept_default_suggestion =
960 default_results_.suggest_results.empty() ?
[email protected]55ce8f12012-05-09 04:44:08961 TemplateURLRef::NO_SUGGESTIONS_AVAILABLE :
962 TemplateURLRef::NO_SUGGESTION_CHOSEN;
[email protected]d1f0a7f2012-06-05 10:26:42963 if (verbatim_relevance > 0) {
964 AddMatchToMap(input_.text(), input_.text(), verbatim_relevance,
[email protected]d30268a2013-06-25 22:31:07965 relevance_from_server,
[email protected]b7f64d742013-05-21 04:04:04966 AutocompleteMatchType::SEARCH_WHAT_YOU_TYPED,
[email protected]d1f0a7f2012-06-05 10:26:42967 did_not_accept_default_suggestion, false, &map);
968 }
[email protected]5423e562013-02-07 03:58:45969 if (!keyword_input_.text().empty()) {
970 const TemplateURL* keyword_url = providers_.GetKeywordProviderURL();
971 // We only create the verbatim search query match for a keyword
972 // if it's not an extension keyword. Extension keywords are handled
973 // in KeywordProvider::Start(). (Extensions are complicated...)
974 // Note: in this provider, SEARCH_OTHER_ENGINE must correspond
975 // to the keyword verbatim search query. Do not create other matches
976 // of type SEARCH_OTHER_ENGINE.
977 if (keyword_url && !keyword_url->IsExtensionKeyword()) {
[email protected]d30268a2013-06-25 22:31:07978 bool keyword_relevance_from_server;
979 const int keyword_verbatim_relevance =
980 GetKeywordVerbatimRelevance(&keyword_relevance_from_server);
[email protected]dab8d52d2013-03-05 07:35:28981 if (keyword_verbatim_relevance > 0) {
982 AddMatchToMap(keyword_input_.text(), keyword_input_.text(),
[email protected]d30268a2013-06-25 22:31:07983 keyword_verbatim_relevance, keyword_relevance_from_server,
[email protected]b7f64d742013-05-21 04:04:04984 AutocompleteMatchType::SEARCH_OTHER_ENGINE,
[email protected]dab8d52d2013-03-05 07:35:28985 did_not_accept_keyword_suggestion, true, &map);
986 }
[email protected]5423e562013-02-07 03:58:45987 }
988 }
[email protected]257ab712009-04-14 17:16:24989 AddHistoryResultsToMap(keyword_history_results_, true,
990 did_not_accept_keyword_suggestion, &map);
991 AddHistoryResultsToMap(default_history_results_, false,
992 did_not_accept_default_suggestion, &map);
993
[email protected]cc1526e2013-05-17 04:04:24994 AddSuggestResultsToMap(keyword_results_.suggest_results, &map);
995 AddSuggestResultsToMap(default_results_.suggest_results, &map);
initial.commit09911bf2008-07-26 23:55:29996
[email protected]d30268a2013-06-25 22:31:07997 ACMatches matches;
initial.commit09911bf2008-07-26 23:55:29998 for (MatchMap::const_iterator i(map.begin()); i != map.end(); ++i)
[email protected]d30268a2013-06-25 22:31:07999 matches.push_back(i->second);
initial.commit09911bf2008-07-26 23:55:291000
[email protected]d30268a2013-06-25 22:31:071001 AddNavigationResultsToMatches(keyword_results_.navigation_results, &matches);
1002 AddNavigationResultsToMatches(default_results_.navigation_results, &matches);
initial.commit09911bf2008-07-26 23:55:291003
[email protected]d30268a2013-06-25 22:31:071004 // Now add the most relevant matches to |matches_|. We take up to kMaxMatches
1005 // suggest/navsuggest matches, regardless of origin. If Instant Extended is
1006 // enabled and we have server-provided (and thus hopefully more accurate)
1007 // scores for some suggestions, we allow more of those, until we reach
1008 // AutocompleteResult::kMaxMatches total matches (that is, enough to fill the
1009 // whole popup).
1010 //
1011 // We will always return any verbatim matches, no matter how we obtained their
1012 // scores, unless we have already accepted AutocompleteResult::kMaxMatches
1013 // higher-scoring matches under the conditions above.
1014 std::sort(matches.begin(), matches.end(), &AutocompleteMatch::MoreRelevant);
1015 matches_.clear();
[email protected]3723e6e2012-06-11 21:06:561016
[email protected]d30268a2013-06-25 22:31:071017 size_t num_suggestions = 0;
1018 for (ACMatches::const_iterator i(matches.begin());
1019 (i != matches.end()) &&
1020 (matches_.size() < AutocompleteResult::kMaxMatches);
1021 ++i) {
1022 // SEARCH_OTHER_ENGINE is only used in the SearchProvider for the keyword
1023 // verbatim result, so this condition basically means "if this match is a
1024 // suggestion of some sort".
1025 if ((i->type != AutocompleteMatchType::SEARCH_WHAT_YOU_TYPED) &&
1026 (i->type != AutocompleteMatchType::SEARCH_OTHER_ENGINE)) {
1027 // If we've already hit the limit on non-server-scored suggestions, and
1028 // this isn't a server-scored suggestion we can add, skip it.
1029 if ((num_suggestions >= kMaxMatches) &&
1030 (!chrome::IsInstantExtendedAPIEnabled() ||
1031 (i->GetAdditionalInfo(kRelevanceFromServerKey) != kTrue))) {
1032 continue;
1033 }
1034
1035 ++num_suggestions;
1036 }
1037
1038 matches_.push_back(*i);
1039 }
[email protected]344946a12012-12-20 12:03:421040}
1041
[email protected]9dfb4d362013-04-05 02:15:121042bool SearchProvider::IsTopMatchNavigationInKeywordMode() const {
1043 return (!providers_.keyword_provider().empty() &&
[email protected]b7f64d742013-05-21 04:04:041044 (matches_.front().type == AutocompleteMatchType::NAVSUGGEST));
[email protected]9dfb4d362013-04-05 02:15:121045}
1046
[email protected]344946a12012-12-20 12:03:421047bool SearchProvider::IsTopMatchScoreTooLow() const {
[email protected]dab8d52d2013-03-05 07:35:281048 // Here we use CalculateRelevanceForVerbatimIgnoringKeywordModeState()
1049 // rather than CalculateRelevanceForVerbatim() because the latter returns
1050 // a very low score (250) if keyword mode is active. This is because
1051 // when keyword mode is active the user probably wants the keyword matches,
1052 // not matches from the default provider. Hence, we use the version of
1053 // the function that ignores whether keyword mode is active. This allows
1054 // SearchProvider to maintain its contract with the AutocompleteController
1055 // that it will always provide an inlineable match with a reasonable
1056 // score.
1057 return matches_.front().relevance <
1058 CalculateRelevanceForVerbatimIgnoringKeywordModeState();
[email protected]344946a12012-12-20 12:03:421059}
1060
[email protected]fb95251e2013-07-17 14:52:241061bool SearchProvider::IsTopMatchSearchWithURLInput() const {
[email protected]344946a12012-12-20 12:03:421062 return input_.type() == AutocompleteInput::URL &&
1063 matches_.front().relevance > CalculateRelevanceForVerbatim() &&
[email protected]fb95251e2013-07-17 14:52:241064 matches_.front().type != AutocompleteMatchType::NAVSUGGEST;
[email protected]344946a12012-12-20 12:03:421065}
1066
1067bool SearchProvider::IsTopMatchNotInlinable() const {
[email protected]5423e562013-02-07 03:58:451068 // Note: this test assumes the SEARCH_OTHER_ENGINE match corresponds to
1069 // the verbatim search query on the keyword engine. SearchProvider should
1070 // not create any other match of type SEARCH_OTHER_ENGINE.
[email protected]b7f64d742013-05-21 04:04:041071 return
1072 matches_.front().type != AutocompleteMatchType::SEARCH_WHAT_YOU_TYPED &&
[email protected]b7f64d742013-05-21 04:04:041073 matches_.front().type != AutocompleteMatchType::SEARCH_OTHER_ENGINE &&
[email protected]518024c2013-07-19 23:40:251074 matches_.front().inline_autocompletion.empty() &&
[email protected]b7f64d742013-05-21 04:04:041075 matches_.front().fill_into_edit != input_.text();
[email protected]344946a12012-12-20 12:03:421076}
1077
1078void SearchProvider::UpdateMatches() {
1079 ConvertResultsToAutocompleteMatches();
initial.commit09911bf2008-07-26 23:55:291080
[email protected]382a0642012-06-06 06:13:521081 // Check constraints that may be violated by suggested relevances.
[email protected]344946a12012-12-20 12:03:421082 if (!matches_.empty() &&
[email protected]bc8bb0cd2013-06-24 21:50:231083 (default_results_.HasServerProvidedScores() ||
1084 keyword_results_.HasServerProvidedScores())) {
[email protected]9dfb4d362013-04-05 02:15:121085 // These blocks attempt to repair undesirable behavior by suggested
[email protected]344946a12012-12-20 12:03:421086 // relevances with minimal impact, preserving other suggested relevances.
[email protected]9dfb4d362013-04-05 02:15:121087 if (IsTopMatchNavigationInKeywordMode()) {
1088 // Correct the suggested relevance scores if the top match is a
1089 // navigation in keyword mode, since inlining a navigation match
1090 // would break the user out of keyword mode. By the way, if the top
1091 // match is a non-keyword match (query or navsuggestion) in keyword
1092 // mode, the user would also break out of keyword mode. However,
1093 // that situation is impossible given the current scoring paradigm
1094 // and the fact that only one search engine (Google) provides suggested
1095 // relevance scores at this time.
1096 DemoteKeywordNavigationMatchesPastTopQuery();
1097 ConvertResultsToAutocompleteMatches();
1098 DCHECK(!IsTopMatchNavigationInKeywordMode());
1099 }
[email protected]344946a12012-12-20 12:03:421100 if (IsTopMatchScoreTooLow()) {
[email protected]1beee342012-06-19 22:22:281101 // Disregard the suggested verbatim relevance if the top score is below
1102 // the usual verbatim value. For example, a BarProvider may rely on
1103 // SearchProvider's verbatim or inlineable matches for input "foo" to
1104 // always outrank its own lowly-ranked non-inlineable "bar" match.
[email protected]cc1526e2013-05-17 04:04:241105 default_results_.verbatim_relevance = -1;
1106 keyword_results_.verbatim_relevance = -1;
[email protected]344946a12012-12-20 12:03:421107 ConvertResultsToAutocompleteMatches();
[email protected]e6acd002012-06-16 22:27:471108 }
[email protected]fb95251e2013-07-17 14:52:241109 if (IsTopMatchSearchWithURLInput()) {
[email protected]e6acd002012-06-16 22:27:471110 // Disregard the suggested search and verbatim relevances if the input
1111 // type is URL and the top match is a highly-ranked search suggestion.
1112 // For example, prevent a search for "foo.com" from outranking another
1113 // provider's navigation for "foo.com" or "foo.com/url_from_history".
[email protected]cc1526e2013-05-17 04:04:241114 ApplyCalculatedSuggestRelevance(&keyword_results_.suggest_results);
1115 ApplyCalculatedSuggestRelevance(&default_results_.suggest_results);
1116 default_results_.verbatim_relevance = -1;
1117 keyword_results_.verbatim_relevance = -1;
[email protected]344946a12012-12-20 12:03:421118 ConvertResultsToAutocompleteMatches();
[email protected]382a0642012-06-06 06:13:521119 }
[email protected]344946a12012-12-20 12:03:421120 if (IsTopMatchNotInlinable()) {
[email protected]d30268a2013-06-25 22:31:071121 // Disregard suggested relevances if the top match is not a verbatim match
1122 // or inlinable. For example, input "foo" should not invoke a search for
1123 // "bar", which would happen if the "bar" search match outranked all other
1124 // matches.
[email protected]344946a12012-12-20 12:03:421125 ApplyCalculatedRelevance();
1126 ConvertResultsToAutocompleteMatches();
[email protected]382a0642012-06-06 06:13:521127 }
[email protected]9dfb4d362013-04-05 02:15:121128 DCHECK(!IsTopMatchNavigationInKeywordMode());
[email protected]344946a12012-12-20 12:03:421129 DCHECK(!IsTopMatchScoreTooLow());
[email protected]fb95251e2013-07-17 14:52:241130 DCHECK(!IsTopMatchSearchWithURLInput());
[email protected]344946a12012-12-20 12:03:421131 DCHECK(!IsTopMatchNotInlinable());
[email protected]d1f0a7f2012-06-05 10:26:421132 }
1133
[email protected]cc63dea2008-08-21 20:56:311134 UpdateStarredStateOfMatches();
[email protected]4ab4c7c2010-11-24 04:49:341135 UpdateDone();
[email protected]257ab712009-04-14 17:16:241136}
1137
1138void SearchProvider::AddNavigationResultsToMatches(
[email protected]d30268a2013-06-25 22:31:071139 const NavigationResults& navigation_results,
1140 ACMatches* matches) {
[email protected]bc8bb0cd2013-06-24 21:50:231141 for (NavigationResults::const_iterator it = navigation_results.begin();
1142 it != navigation_results.end(); ++it) {
[email protected]d30268a2013-06-25 22:31:071143 matches->push_back(NavigationToMatch(*it));
[email protected]bc8bb0cd2013-06-24 21:50:231144 // In the absence of suggested relevance scores, use only the single
1145 // highest-scoring result. (The results are already sorted by relevance.)
[email protected]d30268a2013-06-25 22:31:071146 if (!it->relevance_from_server())
[email protected]bc8bb0cd2013-06-24 21:50:231147 return;
[email protected]257ab712009-04-14 17:16:241148 }
1149}
1150
1151void SearchProvider::AddHistoryResultsToMap(const HistoryResults& results,
1152 bool is_keyword,
1153 int did_not_accept_suggestion,
1154 MatchMap* map) {
[email protected]51124552011-07-16 01:37:101155 if (results.empty())
1156 return;
1157
[email protected]d7ad4772012-06-01 03:12:541158 bool prevent_inline_autocomplete = input_.prevent_inline_autocomplete() ||
1159 (input_.type() == AutocompleteInput::URL);
[email protected]14710852013-02-05 23:45:411160 const string16& input_text =
1161 is_keyword ? keyword_input_.text() : input_.text();
[email protected]51124552011-07-16 01:37:101162 bool input_multiple_words = HasMultipleWords(input_text);
1163
[email protected]55ce8f12012-05-09 04:44:081164 SuggestResults scored_results;
1165 if (!prevent_inline_autocomplete && input_multiple_words) {
1166 // ScoreHistoryResults() allows autocompletion of multi-word, 1-visit
1167 // queries if the input also has multiple words. But if we were already
[email protected]51124552011-07-16 01:37:101168 // autocompleting a multi-word, multi-visit query, and the current input is
1169 // still a prefix of it, then changing the autocompletion suddenly feels
1170 // wrong. To detect this case, first score as if only one word has been
1171 // typed, then check for a best result that is an autocompleted, multi-word
1172 // query. If we find one, then just keep that score set.
[email protected]55ce8f12012-05-09 04:44:081173 scored_results = ScoreHistoryResults(results, prevent_inline_autocomplete,
1174 false, input_text, is_keyword);
[email protected]9dfb4d362013-04-05 02:15:121175 if ((scored_results.front().relevance() <
[email protected]55ce8f12012-05-09 04:44:081176 AutocompleteResult::kLowestDefaultScore) ||
[email protected]9dfb4d362013-04-05 02:15:121177 !HasMultipleWords(scored_results.front().suggestion()))
[email protected]55ce8f12012-05-09 04:44:081178 scored_results.clear(); // Didn't detect the case above, score normally.
[email protected]51124552011-07-16 01:37:101179 }
[email protected]55ce8f12012-05-09 04:44:081180 if (scored_results.empty())
1181 scored_results = ScoreHistoryResults(results, prevent_inline_autocomplete,
1182 input_multiple_words, input_text,
1183 is_keyword);
1184 for (SuggestResults::const_iterator i(scored_results.begin());
1185 i != scored_results.end(); ++i) {
[email protected]d30268a2013-06-25 22:31:071186 AddMatchToMap(i->suggestion(), input_text, i->relevance(), false,
[email protected]b7f64d742013-05-21 04:04:041187 AutocompleteMatchType::SEARCH_HISTORY,
1188 did_not_accept_suggestion,
[email protected]55ce8f12012-05-09 04:44:081189 is_keyword, map);
[email protected]51124552011-07-16 01:37:101190 }
1191}
1192
[email protected]55ce8f12012-05-09 04:44:081193SearchProvider::SuggestResults SearchProvider::ScoreHistoryResults(
[email protected]51124552011-07-16 01:37:101194 const HistoryResults& results,
1195 bool base_prevent_inline_autocomplete,
1196 bool input_multiple_words,
1197 const string16& input_text,
1198 bool is_keyword) {
[email protected]810ffba2012-06-12 01:07:481199 AutocompleteClassifier* classifier =
1200 AutocompleteClassifierFactory::GetForProfile(profile_);
[email protected]55ce8f12012-05-09 04:44:081201 SuggestResults scored_results;
[email protected]78e5e432013-08-03 02:10:101202 const bool prevent_search_history_inlining =
1203 OmniboxFieldTrial::SearchHistoryPreventInlining(
1204 input_.current_page_classification());
[email protected]257ab712009-04-14 17:16:241205 for (HistoryResults::const_iterator i(results.begin()); i != results.end();
1206 ++i) {
[email protected]51124552011-07-16 01:37:101207 // Don't autocomplete multi-word queries that have only been seen once
1208 // unless the user has typed more than one word.
1209 bool prevent_inline_autocomplete = base_prevent_inline_autocomplete ||
1210 (!input_multiple_words && (i->visits < 2) && HasMultipleWords(i->term));
1211
[email protected]ea3b9a502011-04-04 14:19:371212 // Don't autocomplete search terms that would normally be treated as URLs
[email protected]51124552011-07-16 01:37:101213 // when typed. For example, if the user searched for "google.com" and types
1214 // "goog", don't autocomplete to the search term "google.com". Otherwise,
1215 // the input will look like a URL but act like a search, which is confusing.
[email protected]cc447362011-04-06 03:57:481216 // NOTE: We don't check this in the following cases:
1217 // * When inline autocomplete is disabled, we won't be inline
1218 // autocompleting this term, so we don't need to worry about confusion as
1219 // much. This also prevents calling Classify() again from inside the
1220 // classifier (which will corrupt state and likely crash), since the
[email protected]51124552011-07-16 01:37:101221 // classifier always disables inline autocomplete.
[email protected]cc447362011-04-06 03:57:481222 // * When the user has typed the whole term, the "what you typed" history
1223 // match will outrank us for URL-like inputs anyway, so we need not do
1224 // anything special.
[email protected]51124552011-07-16 01:37:101225 if (!prevent_inline_autocomplete && classifier && (i->term != input_text)) {
[email protected]ea3b9a502011-04-04 14:19:371226 AutocompleteMatch match;
[email protected]f608ea102013-03-18 15:08:091227 classifier->Classify(i->term, false, false, &match, NULL);
[email protected]2905f742011-10-13 03:51:581228 prevent_inline_autocomplete =
[email protected]749e7ae02012-09-05 18:47:461229 !AutocompleteMatch::IsSearchType(match.type);
[email protected]ea3b9a502011-04-04 14:19:371230 }
[email protected]51124552011-07-16 01:37:101231
[email protected]78e5e432013-08-03 02:10:101232 int relevance = CalculateRelevanceForHistory(
1233 i->time, is_keyword, !prevent_inline_autocomplete,
1234 prevent_search_history_inlining);
[email protected]d30268a2013-06-25 22:31:071235 scored_results.push_back(
1236 SuggestResult(i->term, is_keyword, relevance, false));
[email protected]257ab712009-04-14 17:16:241237 }
[email protected]51124552011-07-16 01:37:101238
1239 // History returns results sorted for us. However, we may have docked some
1240 // results' scores, so things are no longer in order. Do a stable sort to get
1241 // things back in order without otherwise disturbing results with equal
1242 // scores, then force the scores to be unique, so that the order in which
1243 // they're shown is deterministic.
[email protected]55ce8f12012-05-09 04:44:081244 std::stable_sort(scored_results.begin(), scored_results.end(),
1245 CompareScoredResults());
[email protected]51124552011-07-16 01:37:101246 int last_relevance = 0;
[email protected]55ce8f12012-05-09 04:44:081247 for (SuggestResults::iterator i(scored_results.begin());
1248 i != scored_results.end(); ++i) {
1249 if ((i != scored_results.begin()) && (i->relevance() >= last_relevance))
1250 i->set_relevance(last_relevance - 1);
1251 last_relevance = i->relevance();
[email protected]51124552011-07-16 01:37:101252 }
1253
[email protected]55ce8f12012-05-09 04:44:081254 return scored_results;
[email protected]257ab712009-04-14 17:16:241255}
1256
[email protected]55ce8f12012-05-09 04:44:081257void SearchProvider::AddSuggestResultsToMap(const SuggestResults& results,
[email protected]55ce8f12012-05-09 04:44:081258 MatchMap* map) {
[email protected]55ce8f12012-05-09 04:44:081259 for (size_t i = 0; i < results.size(); ++i) {
[email protected]188b50c2013-03-28 07:19:421260 const bool is_keyword = results[i].from_keyword_provider();
1261 const string16& input = is_keyword ? keyword_input_.text() : input_.text();
1262 AddMatchToMap(results[i].suggestion(), input, results[i].relevance(),
[email protected]d30268a2013-06-25 22:31:071263 results[i].relevance_from_server(),
[email protected]b7f64d742013-05-21 04:04:041264 AutocompleteMatchType::SEARCH_SUGGEST, i, is_keyword, map);
[email protected]257ab712009-04-14 17:16:241265 }
initial.commit09911bf2008-07-26 23:55:291266}
1267
[email protected]d30268a2013-06-25 22:31:071268int SearchProvider::GetVerbatimRelevance(bool* relevance_from_server) const {
[email protected]dc6943b2012-06-19 06:39:561269 // Use the suggested verbatim relevance score if it is non-negative (valid),
1270 // if inline autocomplete isn't prevented (always show verbatim on backspace),
[email protected]1beee342012-06-19 22:22:281271 // and if it won't suppress verbatim, leaving no default provider matches.
1272 // Otherwise, if the default provider returned no matches and was still able
[email protected]dc6943b2012-06-19 06:39:561273 // to suppress verbatim, the user would have no search/nav matches and may be
[email protected]1beee342012-06-19 22:22:281274 // left unable to search using their default provider from the omnibox.
[email protected]dc6943b2012-06-19 06:39:561275 // Check for results on each verbatim calculation, as results from older
1276 // queries (on previous input) may be trimmed for failing to inline new input.
[email protected]bc8bb0cd2013-06-24 21:50:231277 bool use_server_relevance =
1278 (default_results_.verbatim_relevance >= 0) &&
[email protected]dab8d52d2013-03-05 07:35:281279 !input_.prevent_inline_autocomplete() &&
[email protected]bc8bb0cd2013-06-24 21:50:231280 ((default_results_.verbatim_relevance > 0) ||
[email protected]cc1526e2013-05-17 04:04:241281 !default_results_.suggest_results.empty() ||
[email protected]bc8bb0cd2013-06-24 21:50:231282 !default_results_.navigation_results.empty());
[email protected]d30268a2013-06-25 22:31:071283 if (relevance_from_server)
1284 *relevance_from_server = use_server_relevance;
[email protected]bc8bb0cd2013-06-24 21:50:231285 return use_server_relevance ?
1286 default_results_.verbatim_relevance : CalculateRelevanceForVerbatim();
[email protected]382a0642012-06-06 06:13:521287}
[email protected]d1f0a7f2012-06-05 10:26:421288
[email protected]382a0642012-06-06 06:13:521289int SearchProvider::CalculateRelevanceForVerbatim() const {
[email protected]85b8d6f2012-05-08 20:53:471290 if (!providers_.keyword_provider().empty())
[email protected]52d08b12009-10-19 18:42:361291 return 250;
[email protected]dab8d52d2013-03-05 07:35:281292 return CalculateRelevanceForVerbatimIgnoringKeywordModeState();
1293}
[email protected]52d08b12009-10-19 18:42:361294
[email protected]dab8d52d2013-03-05 07:35:281295int SearchProvider::
1296 CalculateRelevanceForVerbatimIgnoringKeywordModeState() const {
initial.commit09911bf2008-07-26 23:55:291297 switch (input_.type()) {
1298 case AutocompleteInput::UNKNOWN:
[email protected]52d08b12009-10-19 18:42:361299 case AutocompleteInput::QUERY:
1300 case AutocompleteInput::FORCED_QUERY:
[email protected]90fe2bb2013-01-15 03:42:131301 return kNonURLVerbatimRelevance;
initial.commit09911bf2008-07-26 23:55:291302
initial.commit09911bf2008-07-26 23:55:291303 case AutocompleteInput::URL:
[email protected]52d08b12009-10-19 18:42:361304 return 850;
initial.commit09911bf2008-07-26 23:55:291305
1306 default:
1307 NOTREACHED();
1308 return 0;
1309 }
1310}
1311
[email protected]d30268a2013-06-25 22:31:071312int SearchProvider::GetKeywordVerbatimRelevance(
1313 bool* relevance_from_server) const {
[email protected]dab8d52d2013-03-05 07:35:281314 // Use the suggested verbatim relevance score if it is non-negative (valid),
1315 // if inline autocomplete isn't prevented (always show verbatim on backspace),
1316 // and if it won't suppress verbatim, leaving no keyword provider matches.
1317 // Otherwise, if the keyword provider returned no matches and was still able
1318 // to suppress verbatim, the user would have no search/nav matches and may be
1319 // left unable to search using their keyword provider from the omnibox.
1320 // Check for results on each verbatim calculation, as results from older
1321 // queries (on previous input) may be trimmed for failing to inline new input.
[email protected]bc8bb0cd2013-06-24 21:50:231322 bool use_server_relevance =
1323 (keyword_results_.verbatim_relevance >= 0) &&
[email protected]dab8d52d2013-03-05 07:35:281324 !input_.prevent_inline_autocomplete() &&
[email protected]bc8bb0cd2013-06-24 21:50:231325 ((keyword_results_.verbatim_relevance > 0) ||
[email protected]cc1526e2013-05-17 04:04:241326 !keyword_results_.suggest_results.empty() ||
[email protected]bc8bb0cd2013-06-24 21:50:231327 !keyword_results_.navigation_results.empty());
[email protected]d30268a2013-06-25 22:31:071328 if (relevance_from_server)
1329 *relevance_from_server = use_server_relevance;
[email protected]bc8bb0cd2013-06-24 21:50:231330 return use_server_relevance ?
1331 keyword_results_.verbatim_relevance :
1332 CalculateRelevanceForKeywordVerbatim(keyword_input_.type(),
1333 keyword_input_.prefer_keyword());
[email protected]5423e562013-02-07 03:58:451334}
1335
[email protected]51124552011-07-16 01:37:101336int SearchProvider::CalculateRelevanceForHistory(
[email protected]bc8bb0cd2013-06-24 21:50:231337 const base::Time& time,
[email protected]51124552011-07-16 01:37:101338 bool is_keyword,
[email protected]78e5e432013-08-03 02:10:101339 bool use_aggressive_method,
1340 bool prevent_search_history_inlining) const {
[email protected]aa613d62010-11-09 20:40:181341 // The relevance of past searches falls off over time. There are two distinct
1342 // equations used. If the first equation is used (searches to the primary
[email protected]78e5e432013-08-03 02:10:101343 // provider that we want to score aggressively), the score is in the range
1344 // 1300-1599 (unless |prevent_search_history_inlining|, in which case
[email protected]d8cd76b2013-07-10 09:46:161345 // it's in the range 1200-1299). If the second equation is used the
1346 // relevance of a search 15 minutes ago is discounted 50 points, while the
1347 // relevance of a search two weeks ago is discounted 450 points.
[email protected]bc8bb0cd2013-06-24 21:50:231348 double elapsed_time = std::max((base::Time::Now() - time).InSecondsF(), 0.0);
[email protected]188b50c2013-03-28 07:19:421349 bool is_primary_provider = is_keyword || !providers_.has_keyword_provider();
[email protected]78e5e432013-08-03 02:10:101350 if (is_primary_provider && use_aggressive_method) {
[email protected]aa613d62010-11-09 20:40:181351 // Searches with the past two days get a different curve.
[email protected]51124552011-07-16 01:37:101352 const double autocomplete_time = 2 * 24 * 60 * 60;
[email protected]aa613d62010-11-09 20:40:181353 if (elapsed_time < autocomplete_time) {
[email protected]d8cd76b2013-07-10 09:46:161354 int max_score = is_keyword ? 1599 : 1399;
[email protected]78e5e432013-08-03 02:10:101355 if (prevent_search_history_inlining)
[email protected]d8cd76b2013-07-10 09:46:161356 max_score = 1299;
1357 return max_score - static_cast<int>(99 *
[email protected]aa613d62010-11-09 20:40:181358 std::pow(elapsed_time / autocomplete_time, 2.5));
1359 }
1360 elapsed_time -= autocomplete_time;
1361 }
1362
[email protected]c3a4bd992010-08-18 20:25:011363 const int score_discount =
1364 static_cast<int>(6.5 * std::pow(elapsed_time, 0.3));
initial.commit09911bf2008-07-26 23:55:291365
[email protected]6c85aa02009-02-27 12:08:091366 // Don't let scores go below 0. Negative relevance scores are meaningful in
1367 // a different way.
initial.commit09911bf2008-07-26 23:55:291368 int base_score;
[email protected]51124552011-07-16 01:37:101369 if (is_primary_provider)
[email protected]52d08b12009-10-19 18:42:361370 base_score = (input_.type() == AutocompleteInput::URL) ? 750 : 1050;
[email protected]51124552011-07-16 01:37:101371 else
1372 base_score = 200;
initial.commit09911bf2008-07-26 23:55:291373 return std::max(0, base_score - score_discount);
1374}
1375
[email protected]a2fedb1e2011-01-25 15:23:361376void SearchProvider::AddMatchToMap(const string16& query_string,
1377 const string16& input_text,
initial.commit09911bf2008-07-26 23:55:291378 int relevance,
[email protected]d30268a2013-06-25 22:31:071379 bool relevance_from_server,
[email protected]4c1fb7ec2008-11-13 00:19:001380 AutocompleteMatch::Type type,
initial.commit09911bf2008-07-26 23:55:291381 int accepted_suggestion,
[email protected]257ab712009-04-14 17:16:241382 bool is_keyword,
initial.commit09911bf2008-07-26 23:55:291383 MatchMap* map) {
[email protected]c4a9d4c2013-08-10 07:06:271384 // On non-mobile, ask the instant controller for the appropriate start margin.
1385 // On mobile the start margin is unused, so leave the value as default there.
1386 int omnibox_start_margin = chrome::kDisableStartMargin;
1387#if !defined(OS_ANDROID) && !defined(IOS)
1388 if (chrome::IsInstantExtendedAPIEnabled()) {
1389 Browser* browser =
1390 chrome::FindBrowserWithProfile(profile_, chrome::GetActiveDesktop());
1391 if (browser && browser->instant_controller() &&
1392 browser->instant_controller()->instant()) {
1393 omnibox_start_margin =
1394 browser->instant_controller()->instant()->omnibox_bounds().x();
1395 }
1396 }
1397#endif // !defined(OS_ANDROID) && !defined(IOS)
1398
[email protected]bba9e632013-06-28 22:52:191399 const TemplateURL* template_url = is_keyword ?
1400 providers_.GetKeywordProviderURL() : providers_.GetDefaultProviderURL();
1401 AutocompleteMatch match = CreateSearchSuggestion(this, relevance, type,
1402 template_url, query_string, input_text, input_, is_keyword,
[email protected]c4a9d4c2013-08-10 07:06:271403 accepted_suggestion, omnibox_start_margin,
[email protected]56fa29592013-07-02 20:25:531404 !is_keyword || providers_.default_provider().empty());
[email protected]cb86ee6f2013-04-28 16:58:151405 if (!match.destination_url.is_valid())
[email protected]85b8d6f2012-05-08 20:53:471406 return;
[email protected]d30268a2013-06-25 22:31:071407 match.RecordAdditionalInfo(kRelevanceFromServerKey,
1408 relevance_from_server ? kTrue : kFalse);
[email protected]85b8d6f2012-05-08 20:53:471409
initial.commit09911bf2008-07-26 23:55:291410 // Try to add |match| to |map|. If a match for |query_string| is already in
1411 // |map|, replace it if |match| is more relevant.
1412 // NOTE: Keep this ToLower() call in sync with url_database.cc.
[email protected]bc8bb0cd2013-06-24 21:50:231413 const std::pair<MatchMap::iterator, bool> i(
1414 map->insert(std::make_pair(base::i18n::ToLower(query_string), match)));
initial.commit09911bf2008-07-26 23:55:291415 // NOTE: We purposefully do a direct relevance comparison here instead of
1416 // using AutocompleteMatch::MoreRelevant(), so that we'll prefer "items added
1417 // first" rather than "items alphabetically first" when the scores are equal.
1418 // The only case this matters is when a user has results with the same score
1419 // that differ only by capitalization; because the history system returns
1420 // results sorted by recency, this means we'll pick the most recent such
1421 // result even if the precision of our relevance score is too low to
1422 // distinguish the two.
1423 if (!i.second && (match.relevance > i.first->second.relevance))
1424 i.first->second = match;
1425}
1426
1427AutocompleteMatch SearchProvider::NavigationToMatch(
[email protected]188b50c2013-03-28 07:19:421428 const NavigationResult& navigation) {
1429 const string16& input = navigation.from_keyword_provider() ?
1430 keyword_input_.text() : input_.text();
[email protected]55ce8f12012-05-09 04:44:081431 AutocompleteMatch match(this, navigation.relevance(), false,
[email protected]b7f64d742013-05-21 04:04:041432 AutocompleteMatchType::NAVSUGGEST);
[email protected]55ce8f12012-05-09 04:44:081433 match.destination_url = navigation.url();
[email protected]371dab12012-06-01 03:23:551434
1435 // First look for the user's input inside the fill_into_edit as it would be
1436 // without trimming the scheme, so we can find matches at the beginning of the
1437 // scheme.
[email protected]a1b5e862013-03-29 06:38:441438 const string16& untrimmed_fill_into_edit = navigation.formatted_url();
[email protected]371dab12012-06-01 03:23:551439 const URLPrefix* prefix =
1440 URLPrefix::BestURLPrefix(untrimmed_fill_into_edit, input);
1441 size_t match_start = (prefix == NULL) ?
1442 untrimmed_fill_into_edit.find(input) : prefix->prefix.length();
1443 size_t inline_autocomplete_offset = (prefix == NULL) ?
1444 string16::npos : (match_start + input.length());
1445 bool trim_http = !HasHTTPScheme(input) && (!prefix || (match_start != 0));
1446
1447 // Preserve the forced query '?' prefix in |match.fill_into_edit|.
1448 // Otherwise, user edits to a suggestion would show non-Search results.
1449 if (input_.type() == AutocompleteInput::FORCED_QUERY) {
1450 match.fill_into_edit = ASCIIToUTF16("?");
1451 if (inline_autocomplete_offset != string16::npos)
1452 ++inline_autocomplete_offset;
1453 }
1454
1455 const std::string languages(
1456 profile_->GetPrefs()->GetString(prefs::kAcceptLanguages));
1457 const net::FormatUrlTypes format_types =
1458 net::kFormatUrlOmitAll & ~(trim_http ? 0 : net::kFormatUrlOmitHTTP);
1459 match.fill_into_edit +=
1460 AutocompleteInput::FormattedStringWithEquivalentMeaning(navigation.url(),
1461 net::FormatUrl(navigation.url(), languages, format_types,
1462 net::UnescapeRule::SPACES, NULL, NULL,
1463 &inline_autocomplete_offset));
[email protected]518024c2013-07-19 23:40:251464 if (!input_.prevent_inline_autocomplete() &&
1465 (inline_autocomplete_offset != string16::npos)) {
1466 DCHECK(inline_autocomplete_offset <= match.fill_into_edit.length());
1467 match.inline_autocompletion =
1468 match.fill_into_edit.substr(inline_autocomplete_offset);
1469 }
[email protected]371dab12012-06-01 03:23:551470
1471 match.contents = net::FormatUrl(navigation.url(), languages,
1472 format_types, net::UnescapeRule::SPACES, NULL, NULL, &match_start);
1473 // If the first match in the untrimmed string was inside a scheme that we
1474 // trimmed, look for a subsequent match.
1475 if (match_start == string16::npos)
1476 match_start = match.contents.find(input);
1477 // Safe if |match_start| is npos; also safe if the input is longer than the
1478 // remaining contents after |match_start|.
1479 AutocompleteMatch::ClassifyLocationInString(match_start, input.length(),
1480 match.contents.length(), ACMatchClassification::URL,
1481 &match.contents_class);
initial.commit09911bf2008-07-26 23:55:291482
[email protected]55ce8f12012-05-09 04:44:081483 match.description = navigation.description();
[email protected]371dab12012-06-01 03:23:551484 AutocompleteMatch::ClassifyMatchInString(input, match.description,
1485 ACMatchClassification::NONE, &match.description_class);
[email protected]d30268a2013-06-25 22:31:071486
1487 match.RecordAdditionalInfo(
1488 kRelevanceFromServerKey,
1489 navigation.relevance_from_server() ? kTrue : kFalse);
1490
initial.commit09911bf2008-07-26 23:55:291491 return match;
1492}
[email protected]4ab4c7c2010-11-24 04:49:341493
[email protected]9dfb4d362013-04-05 02:15:121494void SearchProvider::DemoteKeywordNavigationMatchesPastTopQuery() {
[email protected]d519d392013-03-27 09:24:461495 // First, determine the maximum score of any keyword query match (verbatim or
1496 // query suggestion).
[email protected]d30268a2013-06-25 22:31:071497 bool relevance_from_server;
1498 int max_query_relevance = GetKeywordVerbatimRelevance(&relevance_from_server);
[email protected]cc1526e2013-05-17 04:04:241499 if (!keyword_results_.suggest_results.empty()) {
[email protected]d30268a2013-06-25 22:31:071500 const SuggestResult& top_keyword = keyword_results_.suggest_results.front();
1501 const int suggest_relevance = top_keyword.relevance();
1502 if (suggest_relevance > max_query_relevance) {
1503 max_query_relevance = suggest_relevance;
1504 relevance_from_server = top_keyword.relevance_from_server();
1505 } else if (suggest_relevance == max_query_relevance) {
1506 relevance_from_server |= top_keyword.relevance_from_server();
1507 }
[email protected]d519d392013-03-27 09:24:461508 }
1509 // If no query is supposed to appear, then navigational matches cannot
[email protected]9dfb4d362013-04-05 02:15:121510 // be demoted past it. Get rid of suggested relevance scores for
1511 // navsuggestions and introduce the verbatim results again. The keyword
1512 // verbatim match will outscore the navsuggest matches.
1513 if (max_query_relevance == 0) {
[email protected]cc1526e2013-05-17 04:04:241514 ApplyCalculatedNavigationRelevance(&keyword_results_.navigation_results);
1515 ApplyCalculatedNavigationRelevance(&default_results_.navigation_results);
1516 keyword_results_.verbatim_relevance = -1;
1517 default_results_.verbatim_relevance = -1;
[email protected]9dfb4d362013-04-05 02:15:121518 return;
1519 }
[email protected]d519d392013-03-27 09:24:461520 // Now we know we can enforce the minimum score constraint even after
1521 // the navigation matches are demoted. Proceed to demote the navigation
1522 // matches to enforce the query-must-come-first constraint.
[email protected]d519d392013-03-27 09:24:461523 // Cap the relevance score of all results.
[email protected]cc1526e2013-05-17 04:04:241524 for (NavigationResults::iterator it =
1525 keyword_results_.navigation_results.begin();
1526 it != keyword_results_.navigation_results.end(); ++it) {
[email protected]9dfb4d362013-04-05 02:15:121527 if (it->relevance() < max_query_relevance)
1528 return;
1529 max_query_relevance = std::max(max_query_relevance - 1, 0);
1530 it->set_relevance(max_query_relevance);
[email protected]d30268a2013-06-25 22:31:071531 it->set_relevance_from_server(relevance_from_server);
[email protected]d519d392013-03-27 09:24:461532 }
[email protected]d519d392013-03-27 09:24:461533}
1534
[email protected]4ab4c7c2010-11-24 04:49:341535void SearchProvider::UpdateDone() {
[email protected]2cdf1172012-08-26 12:21:331536 // We're done when the timer isn't running, there are no suggest queries
[email protected]5fac3782013-03-06 09:32:311537 // pending, and we're not waiting on Instant.
[email protected]e1290ee62013-06-26 18:31:151538 done_ = !timer_.IsRunning() && (suggest_results_pending_ == 0);
[email protected]4ab4c7c2010-11-24 04:49:341539}