// Copyright (c) 2012 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef CHROME_BROWSER_AUTOCOMPLETE_HISTORY_URL_PROVIDER_H_ #define CHROME_BROWSER_AUTOCOMPLETE_HISTORY_URL_PROVIDER_H_ #include <string> #include <vector> #include "base/compiler_specific.h" #include "base/synchronization/cancellation_flag.h" #include "chrome/browser/autocomplete/autocomplete_input.h" #include "chrome/browser/autocomplete/history_provider.h" #include "chrome/browser/autocomplete/history_provider_util.h" #include "chrome/browser/autocomplete/url_prefix.h" #include "chrome/browser/omnibox/omnibox_field_trial.h" #include "chrome/browser/search_engines/search_terms_data.h" #include "chrome/browser/search_engines/template_url.h" class Profile; namespace base { class MessageLoop; } namespace history { class HistoryBackend; class URLDatabase; } // How history autocomplete works // ============================== // // Read down this diagram for temporal ordering. // // Main thread History thread // ----------- -------------- // AutocompleteController::Start // -> HistoryURLProvider::Start // -> RunAutocompletePasses // -> SuggestExactInput // [params_ allocated] // -> DoAutocomplete (for inline autocomplete) // -> URLDatabase::AutocompleteForPrefix (on in-memory DB) // -> HistoryService::ScheduleAutocomplete // (return to controller) ---- // / // HistoryBackend::ScheduleAutocomplete // -> HistoryURLProvider::ExecuteWithDB // -> DoAutocomplete // -> URLDatabase::AutocompleteForPrefix // / // HistoryService::QueryComplete // [params_ destroyed] // -> AutocompleteProviderListener::OnProviderUpdate // // The autocomplete controller calls us, and must be called back, on the main // thread. When called, we run two autocomplete passes. The first pass runs // synchronously on the main thread and queries the in-memory URL database. // This pass promotes matches for inline autocomplete if applicable. We do // this synchronously so that users get consistent behavior when they type // quickly and hit enter, no matter how loaded the main history database is. // Doing this synchronously also prevents inline autocomplete from being // "flickery" in the AutocompleteEdit. Because the in-memory DB does not have // redirect data, results other than the top match might change between the // two passes, so we can't just decide to use this pass' matches as the final // results. // // The second autocomplete pass uses the full history database, which must be // queried on the history thread. Start() asks the history service schedule to // callback on the history thread with a pointer to the main database. When we // are done doing queries, we schedule a task on the main thread that notifies // the AutocompleteController that we're done. // // The communication between these threads is done using a // HistoryURLProviderParams object. This is allocated in the main thread, and // normally deleted in QueryComplete(). So that both autocomplete passes can // use the same code, we also use this to hold results during the first // autocomplete pass. // // While the second pass is running, the AutocompleteController may cancel the // request. This can happen frequently when the user is typing quickly. In // this case, the main thread sets params_->cancel, which the background thread // checks periodically. If it finds the flag set, it stops what it's doing // immediately and calls back to the main thread. (We don't delete the params // on the history thread, because we should only do that when we can safely // NULL out params_, and that must be done on the main thread.) // Used to communicate autocomplete parameters between threads via the history // service. struct HistoryURLProviderParams { HistoryURLProviderParams(const AutocompleteInput& input, bool trim_http, const std::string& languages, TemplateURL* default_search_provider, const SearchTermsData& search_terms_data); ~HistoryURLProviderParams(); base::MessageLoop* message_loop; // A copy of the autocomplete input. We need the copy since this object will // live beyond the original query while it runs on the history thread. AutocompleteInput input; // Should inline autocompletion be disabled? This is initalized from // |input.prevent_inline_autocomplete()|, but set to false is the input // contains trailing white space. bool prevent_inline_autocomplete; // Set when "http://" should be trimmed from the beginning of the URLs. bool trim_http; // Set by the main thread to cancel this request. If this flag is set when // the query runs, the query will be abandoned. This allows us to avoid // running queries that are no longer needed. Since we don't care if we run // the extra queries, the lack of signaling is not a problem. base::CancellationFlag cancel_flag; // Set by ExecuteWithDB() on the history thread when the query could not be // performed because the history system failed to properly init the database. // If this is set when the main thread is called back, it avoids changing // |matches_| at all, so it won't delete the default match // RunAutocompletePasses() creates. bool failed; // List of matches written by the history thread. We keep this separate list // to avoid having the main thread read the provider's matches while the // history thread is manipulating them. The provider copies this list back // to matches_ on the main thread in QueryComplete(). ACMatches matches; // Languages we should pass to gfx::GetCleanStringFromUrl. std::string languages; // When true, we should avoid calling SuggestExactInput(). bool dont_suggest_exact_input; // The default search provider and search terms data necessary to cull results // that correspond to searches (on the default engine). These can only be // obtained on the UI thread, so we have to copy them into here to pass them // to the history thread. We use a scoped_ptr<TemplateURL> for the DSP since // TemplateURLs can't be copied by value. We use a scoped_ptr<SearchTermsData> // so that we can store a snapshot of the SearchTermsData accessible from the // history thread. scoped_ptr<TemplateURL> default_search_provider; scoped_ptr<SearchTermsData> search_terms_data; private: DISALLOW_COPY_AND_ASSIGN(HistoryURLProviderParams); }; // This class is an autocomplete provider and is also a pseudo-internal // component of the history system. See comments above. class HistoryURLProvider : public HistoryProvider { public: // Various values used in scoring, made public so other providers // can insert results in appropriate ranges relative to these. static const int kScoreForBestInlineableResult; static const int kScoreForUnvisitedIntranetResult; static const int kScoreForWhatYouTypedResult; static const int kBaseScoreForNonInlineableResult; HistoryURLProvider(AutocompleteProviderListener* listener, Profile* profile); // HistoryProvider: virtual void Start(const AutocompleteInput& input, bool minimal_changes) OVERRIDE; virtual void Stop(bool clear_cached_results) OVERRIDE; // Returns a match representing a navigation to |destination_url| given user // input of |text|. |trim_http| controls whether the match's |fill_into_edit| // and |contents| should have any HTTP scheme stripped off, and should not be // set to true if |text| contains an http prefix. // NOTE: This does not set the relevance of the returned match, as different // callers want different behavior. Callers must set this manually. AutocompleteMatch SuggestExactInput(const base::string16& text, const GURL& destination_url, bool trim_http); // Runs the history query on the history thread, called by the history // system. The history database MAY BE NULL in which case it is not // available and we should return no data. Also schedules returning the // results to the main thread void ExecuteWithDB(history::HistoryBackend* backend, history::URLDatabase* db, HistoryURLProviderParams* params); // Actually runs the autocomplete job on the given database, which is // guaranteed not to be NULL. void DoAutocomplete(history::HistoryBackend* backend, history::URLDatabase* db, HistoryURLProviderParams* params); // Dispatches the results to the autocomplete controller. Called on the // main thread by ExecuteWithDB when the results are available. // Frees params_gets_deleted on exit. void QueryComplete(HistoryURLProviderParams* params_gets_deleted); private: FRIEND_TEST_ALL_PREFIXES(HistoryURLProviderTest, HUPScoringExperiment); enum MatchType { NORMAL, WHAT_YOU_TYPED, INLINE_AUTOCOMPLETE, UNVISITED_INTRANET, // An intranet site that has never been visited. }; class VisitClassifier; ~HistoryURLProvider(); // Determines the relevance for a match, given its type. If // |match_type| is NORMAL, |match_number| is a number [0, // kMaxSuggestions) indicating the relevance of the match (higher == // more relevant). For other values of |match_type|, |match_number| // is ignored. Only called some of the time; for some matches, // relevancy scores are assigned consecutively decreasing (1416, // 1415, 1414, ...). int CalculateRelevance(MatchType match_type, size_t match_number) const; // Helper function that actually launches the two autocomplete passes. void RunAutocompletePasses(const AutocompleteInput& input, bool fixup_input_and_run_pass_1); // Given a |match| containing the "what you typed" suggestion created by // SuggestExactInput(), looks up its info in the DB. If found, fills in the // title from the DB, promotes the match's priority to that of an inline // autocomplete match (maybe it should be slightly better?), and places it on // the front of |matches| (so we pick the right matches to throw away // when culling redirects to/from it). Returns whether a match was promoted. bool FixupExactSuggestion(history::URLDatabase* db, const AutocompleteInput& input, const VisitClassifier& classifier, AutocompleteMatch* match, history::HistoryMatches* matches) const; // Helper function for FixupExactSuggestion, this returns true if the input // corresponds to some intranet URL where the user has previously visited the // host in question. In this case the input should be treated as a URL. bool CanFindIntranetURL(history::URLDatabase* db, const AutocompleteInput& input) const; // Determines if |match| is suitable for inline autocomplete. If so, and if // |params| is non-NULL, promotes the match. Returns whether |match| is // suitable for inline autocomplete. bool PromoteMatchForInlineAutocomplete(const history::HistoryMatch& match, HistoryURLProviderParams* params); // Sees if a shorter version of the best match should be created, and if so // places it at the front of |matches|. This can suggest history URLs that // are prefixes of the best match (if they've been visited enough, compared to // the best match), or create host-only suggestions even when they haven't // been visited before: if the user visited http://example.com/asdf once, // we'll suggest http://example.com/ even if they've never been to it. void PromoteOrCreateShorterSuggestion( history::URLDatabase* db, const HistoryURLProviderParams& params, bool have_what_you_typed_match, const AutocompleteMatch& what_you_typed_match, history::HistoryMatches* matches); // Removes results that have been rarely typed or visited, and not any time // recently. The exact parameters for this heuristic can be found in the // function body. Also culls results corresponding to queries from the default // search engine. These are low-quality, difficult-to-understand matches for // users, and the SearchProvider should surface past queries in a better way // anyway. void CullPoorMatches(const HistoryURLProviderParams& params, history::HistoryMatches* matches) const; // Removes results that redirect to each other, leaving at most |max_results| // results. void CullRedirects(history::HistoryBackend* backend, history::HistoryMatches* matches, size_t max_results) const; // Helper function for CullRedirects, this removes all but the first // occurance of [any of the set of strings in |remove|] from the |matches| // list. // // The return value is the index of the item that is after the item in the // input identified by |source_index|. If |source_index| or an item before // is removed, the next item will be shifted, and this allows the caller to // pick up on the next one when this happens. size_t RemoveSubsequentMatchesOf(history::HistoryMatches* matches, size_t source_index, const std::vector<GURL>& remove) const; // Converts a line from the database into an autocomplete match for display. // If experimental scoring is enabled, the final relevance score might be // different from the given |relevance|. AutocompleteMatch HistoryMatchToACMatch( const HistoryURLProviderParams& params, const history::HistoryMatch& history_match, MatchType match_type, int relevance); // Returns a set of classifications that highlight all the occurrences // of |input_text| at word breaks in |description|. static ACMatchClassifications ClassifyDescription( const base::string16& input_text, const base::string16& description); // Returns a new relevance score for the given |match| based on the // |old_relevance| score and |scoring_params_|. The new relevance score is // guaranteed to be less than or equal to |old_relevance|. In other words, // this function can only demote a score, never boost it. // Returns |old_relevance| score if experimental scoring is disabled // or if the |match.promoted| is true. int CalculateRelevanceScoreUsingScoringParams( const history::HistoryMatch& match, int old_relevance) const; // Params for the current query. The provider should not free this directly; // instead, it is passed as a parameter through the history backend, and the // parameter itself is freed once it's no longer needed. The only reason we // keep this member is so we can set the cancel bit on it. HistoryURLProviderParams* params_; // Params controlling experimental behavior of this provider. HUPScoringParams scoring_params_; // If true, HistoryURL provider should lookup and cull redirects. If // false, it returns matches that may be redirects to each other and // simply hopes the default AutoCompleteController behavior to remove // URLs that are likely duplicates (http://google.com <-> // https://www.google.com/, etc.) will do a good enough job. bool cull_redirects_; // Used in PromoteOrCreateShorterSuggestion(). If true, we may create // shorter suggestions even when they haven't been visited before: // if the user visited http://example.com/asdf once, we'll suggest // http://example.com/ even if they've never been to it. bool create_shorter_match_; // Whether to query the history URL database to match. Even if // false, we still use the URL database to decide if the // URL-what-you-typed was visited before or not. If false, the only // possible result that HistoryURL provider can return is // URL-what-you-typed. This variable is not part of params_ because // it never changes after the HistoryURLProvider is initialized. // It's used to aid the transition to get all URLs from history to // be scored in the HistoryQuick provider only. bool search_url_database_; }; #endif // CHROME_BROWSER_AUTOCOMPLETE_HISTORY_URL_PROVIDER_H_