| // Copyright 2014 The Chromium Authors |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "components/omnibox/browser/autocomplete_provider.h" |
| |
| #include <algorithm> |
| #include <string> |
| |
| #include "base/i18n/time_formatting.h" |
| #include "base/notreached.h" |
| #include "base/strings/string_util.h" |
| #include "base/strings/utf_string_conversions.h" |
| #include "base/trace_event/memory_usage_estimator.h" |
| #include "components/bookmarks/browser/bookmark_utils.h" |
| #include "components/omnibox/browser/autocomplete_enums.h" |
| #include "components/omnibox/browser/autocomplete_i18n.h" |
| #include "components/omnibox/browser/autocomplete_input.h" |
| #include "components/omnibox/browser/autocomplete_match.h" |
| #include "components/omnibox/browser/autocomplete_match_classification.h" |
| #include "components/omnibox/browser/autocomplete_provider_listener.h" |
| #include "components/omnibox/browser/history_provider.h" |
| #include "components/omnibox/browser/omnibox_field_trial.h" |
| #include "components/url_formatter/url_fixer.h" |
| #include "url/gurl.h" |
| |
| AutocompleteProvider::AutocompleteProvider(Type type) |
| : provider_max_matches_(OmniboxFieldTrial::GetProviderMaxMatches(type)), |
| type_(type) {} |
| |
| // static |
| const char* AutocompleteProvider::TypeToString(Type type) { |
| // When creating a new provider, add the provider type to this function and |
| // make sure to also add the appropriate OmniboxProvider variant to the |
| // Omnibox.ProviderTime2 histogram (defined in omnibox/histograms.xml) so that |
| // the run-time metrics associated with the relevant provider can be properly |
| // analyzed. |
| switch (type) { |
| case TYPE_BOOKMARK: |
| return "Bookmark"; |
| case TYPE_BUILTIN: |
| return "Builtin"; |
| case TYPE_CLIPBOARD: |
| return "Clipboard"; |
| case TYPE_DOCUMENT: |
| return "Document"; |
| case TYPE_HISTORY_QUICK: |
| return "HistoryQuick"; |
| case TYPE_HISTORY_URL: |
| return "HistoryURL"; |
| case TYPE_KEYWORD: |
| return "Keyword"; |
| case TYPE_ON_DEVICE_HEAD: |
| return "OnDeviceHead"; |
| case TYPE_SEARCH: |
| return "Search"; |
| case TYPE_SHORTCUTS: |
| return "Shortcuts"; |
| case TYPE_ZERO_SUGGEST: |
| return "ZeroSuggest"; |
| case TYPE_ZERO_SUGGEST_LOCAL_HISTORY: |
| return "LocalHistoryZeroSuggest"; |
| case TYPE_QUERY_TILE: |
| return "QueryTile"; |
| case TYPE_MOST_VISITED_SITES: |
| return "MostVisitedSites"; |
| case TYPE_VERBATIM_MATCH: |
| return "VerbatimMatch"; |
| case TYPE_VOICE_SUGGEST: |
| return "VoiceSuggest"; |
| case TYPE_HISTORY_FUZZY: |
| return "HistoryFuzzy"; |
| case TYPE_OPEN_TAB: |
| return "OpenTab"; |
| case TYPE_HISTORY_CLUSTER_PROVIDER: |
| return "HistoryCluster"; |
| case TYPE_CALCULATOR: |
| return "Calculator"; |
| case TYPE_FEATURED_SEARCH: |
| return "FeaturedSearch"; |
| case TYPE_HISTORY_EMBEDDINGS: |
| return "HistoryEmbeddings"; |
| case TYPE_ENTERPRISE_SEARCH_AGGREGATOR: |
| return "EnterpriseSearchAggregator"; |
| case TYPE_UNSCOPED_EXTENSION: |
| return "UnscopedExtension"; |
| case TYPE_RECENTLY_CLOSED_TABS: |
| return "RecentlyClosedTabs"; |
| case TYPE_CONTEXTUAL_SEARCH: |
| return "ContextualSearch"; |
| case TYPE_TAB_GROUP: |
| return "TabGroup"; |
| default: |
| DUMP_WILL_BE_NOTREACHED() |
| << "Unhandled AutocompleteProvider::Type " << type; |
| return "Unknown"; |
| } |
| } |
| |
| const std::u16string AutocompleteProvider::LocalizedLastModifiedString( |
| base::Time now, |
| base::Time modified_time) { |
| // Use shorthand if the times fall on the same day or in the same year. |
| base::Time::Exploded exploded_modified_time; |
| base::Time::Exploded exploded_now; |
| modified_time.LocalExplode(&exploded_modified_time); |
| now.LocalExplode(&exploded_now); |
| if (exploded_modified_time.year == exploded_now.year) { |
| if (exploded_modified_time.month == exploded_now.month && |
| exploded_modified_time.day_of_month == exploded_now.day_of_month) { |
| // Same local calendar day - use localized time. |
| return base::TimeFormatTimeOfDay(modified_time); |
| } |
| |
| // Same year but not the same day: use abbreviated month/day ("Jan 1"). |
| return base::LocalizedTimeFormatWithPattern(modified_time, "MMMd"); |
| } |
| |
| // No shorthand; display full MM/DD/YYYY. |
| return base::TimeFormatShortDateNumeric(modified_time); |
| } |
| |
| void AutocompleteProvider::AddListener(AutocompleteProviderListener* listener) { |
| listeners_.push_back(listener); |
| } |
| |
| void AutocompleteProvider::NotifyListeners(bool updated_matches) const { |
| for (AutocompleteProviderListener* listener : listeners_) { |
| listener->OnProviderUpdate(updated_matches, this); |
| } |
| } |
| |
| void AutocompleteProvider::StartPrefetch(const AutocompleteInput& input) { |
| DCHECK(!input.omit_asynchronous_matches()); |
| } |
| |
| void AutocompleteProvider::Stop(AutocompleteStopReason stop_reason) { |
| done_ = true; |
| if (stop_reason == AutocompleteStopReason::kClobbered) { |
| matches_.clear(); |
| suggestion_groups_map_.clear(); |
| } |
| } |
| |
| const char* AutocompleteProvider::GetName() const { |
| return TypeToString(type_); |
| } |
| |
| metrics::OmniboxEventProto_ProviderType |
| AutocompleteProvider::AsOmniboxEventProviderType() const { |
| switch (type_) { |
| case TYPE_BOOKMARK: |
| return metrics::OmniboxEventProto::BOOKMARK; |
| case TYPE_BUILTIN: |
| return metrics::OmniboxEventProto::BUILTIN; |
| case TYPE_CLIPBOARD: |
| return metrics::OmniboxEventProto::CLIPBOARD; |
| case TYPE_DOCUMENT: |
| return metrics::OmniboxEventProto::DOCUMENT; |
| case TYPE_HISTORY_QUICK: |
| return metrics::OmniboxEventProto::HISTORY_QUICK; |
| case TYPE_HISTORY_URL: |
| return metrics::OmniboxEventProto::HISTORY_URL; |
| case TYPE_KEYWORD: |
| return metrics::OmniboxEventProto::KEYWORD; |
| case TYPE_ON_DEVICE_HEAD: |
| return metrics::OmniboxEventProto::ON_DEVICE_HEAD; |
| case TYPE_SEARCH: |
| return metrics::OmniboxEventProto::SEARCH; |
| case TYPE_SHORTCUTS: |
| return metrics::OmniboxEventProto::SHORTCUTS; |
| case TYPE_ZERO_SUGGEST: |
| return metrics::OmniboxEventProto::ZERO_SUGGEST; |
| case TYPE_ZERO_SUGGEST_LOCAL_HISTORY: |
| return metrics::OmniboxEventProto::ZERO_SUGGEST_LOCAL_HISTORY; |
| case TYPE_QUERY_TILE: |
| return metrics::OmniboxEventProto::QUERY_TILE; |
| case TYPE_MOST_VISITED_SITES: |
| return metrics::OmniboxEventProto::MOST_VISITED_SITES; |
| case TYPE_VERBATIM_MATCH: |
| return metrics::OmniboxEventProto::VERBATIM_MATCH; |
| case TYPE_VOICE_SUGGEST: |
| return metrics::OmniboxEventProto::SEARCH; |
| case TYPE_HISTORY_FUZZY: |
| return metrics::OmniboxEventProto::HISTORY_FUZZY; |
| case TYPE_OPEN_TAB: |
| return metrics::OmniboxEventProto::OPEN_TAB; |
| case TYPE_HISTORY_CLUSTER_PROVIDER: |
| return metrics::OmniboxEventProto::HISTORY_CLUSTER; |
| case TYPE_CALCULATOR: |
| return metrics::OmniboxEventProto::CALCULATOR; |
| case TYPE_FEATURED_SEARCH: |
| return metrics::OmniboxEventProto::FEATURED_SEARCH; |
| case TYPE_HISTORY_EMBEDDINGS: |
| return metrics::OmniboxEventProto::HISTORY_EMBEDDINGS; |
| case TYPE_ENTERPRISE_SEARCH_AGGREGATOR: |
| return metrics::OmniboxEventProto::ENTERPRISE_SEARCH_AGGREGATOR; |
| case TYPE_UNSCOPED_EXTENSION: |
| return metrics::OmniboxEventProto::UNSCOPED_EXTENSION; |
| case TYPE_RECENTLY_CLOSED_TABS: |
| return metrics::OmniboxEventProto::RECENTLY_CLOSED_TABS; |
| case TYPE_CONTEXTUAL_SEARCH: |
| return metrics::OmniboxEventProto::CONTEXTUAL_SEARCH_PROVIDER; |
| case TYPE_TAB_GROUP: |
| return metrics::OmniboxEventProto::TAB_GROUP_PROVIDER; |
| default: |
| // TODO(crbug.com/40940012) This was a NOTREACHED that we converted to |
| // help debug crbug.com/1499235 since NOTREACHED's don't log their |
| // message in crash reports. Should be reverted back to a NOTREACHED or |
| // NOTREACHED if their logs eventually begin being logged to |
| // crash reports. |
| DUMP_WILL_BE_NOTREACHED() |
| << "[NOTREACHED] Unhandled AutocompleteProvider::Type " << type_; |
| return metrics::OmniboxEventProto::UNKNOWN_PROVIDER; |
| } |
| } |
| |
| void AutocompleteProvider::DeleteMatch(const AutocompleteMatch& match) { |
| DLOG(WARNING) << "The AutocompleteProvider '" << GetName() |
| << "' has not implemented DeleteMatch."; |
| } |
| |
| void AutocompleteProvider::DeleteMatchElement(const AutocompleteMatch& match, |
| size_t element_index) { |
| DLOG(WARNING) << "The AutocompleteProvider '" << GetName() |
| << "' has not implemented DeleteMatchElement."; |
| } |
| |
| void AutocompleteProvider::AddProviderInfo(ProvidersInfo* provider_info) const { |
| } |
| |
| size_t AutocompleteProvider::EstimateMemoryUsage() const { |
| return base::trace_event::EstimateMemoryUsage(matches_); |
| } |
| |
| AutocompleteProvider::~AutocompleteProvider() { |
| // Don't bother using `kClobbered` to clear caches and state, since those will |
| // be destroyed with the provider. |
| Stop(AutocompleteStopReason::kInteraction); |
| } |
| |
| // static |
| AutocompleteProvider::AdjustedInputAndStarterPackKeyword |
| AutocompleteProvider::AdjustInputForStarterPackKeyword( |
| const AutocompleteInput& input, |
| const TemplateURLService* turl_service) { |
| if (input.prefer_keyword()) { |
| AutocompleteInput keyword_input = input; |
| const TemplateURL* template_url = |
| AutocompleteInput::GetSubstitutingTemplateURLForInput(turl_service, |
| &keyword_input); |
| if (template_url && template_url->starter_pack_id() > 0) { |
| return {keyword_input, template_url}; |
| } |
| } |
| return {input, nullptr}; |
| } |
| |
| // static |
| AutocompleteProvider::FixupReturn AutocompleteProvider::FixupUserInput( |
| const AutocompleteInput& input) { |
| const std::u16string& input_text = input.text(); |
| const FixupReturn failed(false, input_text); |
| |
| // Fixup and canonicalize user input. |
| const GURL canonical_gurl( |
| url_formatter::FixupURL(base::UTF16ToUTF8(input_text), std::string())); |
| std::string canonical_gurl_str(canonical_gurl.possibly_invalid_spec()); |
| if (canonical_gurl_str.empty()) { |
| // This probably won't happen, but there are no guarantees. |
| return failed; |
| } |
| |
| // If the user types a number, GURL will convert it to a dotted quad. |
| // However, if the parser did not mark this as a URL, then the user probably |
| // didn't intend this interpretation. Since this can break history matching |
| // for hostname beginning with numbers (e.g. input of "17173" will be matched |
| // against "0.0.67.21" instead of the original "17173", failing to find |
| // "17173.com"), swap the original hostname in for the fixed-up one. |
| if ((input.type() != metrics::OmniboxInputType::URL) && |
| canonical_gurl.HostIsIPAddress()) { |
| std::string original_hostname = base::UTF16ToUTF8( |
| input_text.substr(input.parts().host.begin, input.parts().host.len)); |
| const url::Parsed& parts = |
| canonical_gurl.parsed_for_possibly_invalid_spec(); |
| // parts.host must not be empty when HostIsIPAddress() is true. |
| DCHECK(parts.host.is_nonempty()); |
| canonical_gurl_str.replace(parts.host.begin, parts.host.len, |
| original_hostname); |
| } |
| std::u16string output(base::UTF8ToUTF16(canonical_gurl_str)); |
| // Don't prepend a scheme when the user didn't have one. Since the fixer |
| // upper only prepends the "http" scheme that's all we need to check for. |
| // Note that even if Defaulting Typed Omnibox Navigations to HTTPS feature is |
| // enabled, the https upgrade is done in AutocompleteInput::Parse() and not |
| // in the fixer upper, so we don't need to check for that case. |
| if (!AutocompleteInput::HasHTTPScheme(input_text)) |
| TrimSchemePrefix(&output, /*trim_https=*/false); |
| |
| // Make the number of trailing slashes on the output exactly match the input. |
| // Examples of why not doing this would matter: |
| // * The user types "a" and has this fixed up to "a/". Now no other sites |
| // beginning with "a" will match. |
| // * The user types "file:" and has this fixed up to "file://". Now inline |
| // autocomplete will append too few slashes, resulting in e.g. "file:/b..." |
| // instead of "file:///b..." |
| // * The user types "http:/" and has this fixed up to "http:". Now inline |
| // autocomplete will append too many slashes, resulting in e.g. |
| // "http:///c..." instead of "http://c...". |
| // NOTE: We do this after calling TrimHttpPrefix() since that can strip |
| // trailing slashes (if the scheme is the only thing in the input). It's not |
| // clear that the result of fixup really matters in this case, but there's no |
| // harm in making sure. |
| const size_t last_input_nonslash = input_text.find_last_not_of(u"/\\"); |
| size_t num_input_slashes = |
| (last_input_nonslash == std::u16string::npos) |
| ? input_text.length() |
| : (input_text.length() - 1 - last_input_nonslash); |
| // If we appended text, user slashes are irrelevant. |
| if (output.length() > input_text.length() && |
| base::StartsWith(output, input_text, base::CompareCase::SENSITIVE)) |
| num_input_slashes = 0; |
| const size_t last_output_nonslash = output.find_last_not_of(u"/\\"); |
| const size_t num_output_slashes = |
| (last_output_nonslash == std::u16string::npos) |
| ? output.length() |
| : (output.length() - 1 - last_output_nonslash); |
| if (num_output_slashes < num_input_slashes) |
| output.append(num_input_slashes - num_output_slashes, '/'); |
| else if (num_output_slashes > num_input_slashes) |
| output.erase(output.length() - num_output_slashes + num_input_slashes); |
| if (output.empty()) |
| return failed; |
| |
| return FixupReturn(true, output); |
| } |
| |
| // static |
| size_t AutocompleteProvider::TrimSchemePrefix(std::u16string* url, |
| bool trim_https) { |
| // Find any "http:" or "https:". |
| if (trim_https && !AutocompleteInput::HasHTTPSScheme(*url)) |
| return 0; |
| if (!trim_https && !AutocompleteInput::HasHTTPScheme(*url)) |
| return 0; |
| const char* scheme = trim_https ? url::kHttpsScheme : url::kHttpScheme; |
| size_t scheme_pos = url->find(base::ASCIIToUTF16(scheme) + u':'); |
| DCHECK_NE(std::u16string::npos, scheme_pos); |
| |
| // Erase scheme plus up to two slashes. |
| size_t prefix_end = scheme_pos + strlen(scheme) + 1; |
| const size_t after_slashes = std::min(url->length(), prefix_end + 2); |
| while ((prefix_end < after_slashes) && ((*url)[prefix_end] == '/')) |
| ++prefix_end; |
| url->erase(scheme_pos, prefix_end - scheme_pos); |
| return (scheme_pos == 0) ? prefix_end : 0; |
| } |
| |
| void AutocompleteProvider::ResizeMatches(size_t max_matches, |
| bool ml_scoring_enabled) { |
| if (matches_.size() <= max_matches) { |
| return; |
| } |
| |
| // When ML Scoring is not enabled, simply resize the `matches_` list. |
| if (!ml_scoring_enabled) { |
| matches_.resize(max_matches); |
| return; |
| } |
| |
| // The provider should pass all match candidates to the controller if ML |
| // scoring is enabled. Mark any matches over `max_matches` with zero relevance |
| // and `culled_by_provider` set to true to simulate the resizing. |
| std::ranges::for_each(std::next(matches_.begin(), max_matches), |
| matches_.end(), [&](auto& match) { |
| match.relevance = 0; |
| match.culled_by_provider = true; |
| }); |
| } |