| // Copyright 2012 The Chromium Authors |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "components/omnibox/browser/history_url_provider.h" |
| |
| #include <stddef.h> |
| |
| #include <algorithm> |
| #include <array> |
| #include <memory> |
| #include <string> |
| #include <utility> |
| #include <vector> |
| |
| #include "base/compiler_specific.h" |
| #include "base/containers/span.h" |
| #include "base/run_loop.h" |
| #include "base/strings/string_util.h" |
| #include "base/strings/stringprintf.h" |
| #include "base/strings/utf_string_conversions.h" |
| #include "base/test/bind.h" |
| #include "base/test/scoped_feature_list.h" |
| #include "base/test/task_environment.h" |
| #include "base/time/time.h" |
| #include "build/build_config.h" |
| #include "components/bookmarks/test/test_bookmark_client.h" |
| #include "components/history/core/browser/history_service.h" |
| #include "components/history/core/browser/url_database.h" |
| #include "components/history/core/test/history_service_test_util.h" |
| #include "components/omnibox/browser/autocomplete_enums.h" |
| #include "components/omnibox/browser/autocomplete_match.h" |
| #include "components/omnibox/browser/autocomplete_provider.h" |
| #include "components/omnibox/browser/autocomplete_provider_listener.h" |
| #include "components/omnibox/browser/autocomplete_result.h" |
| #include "components/omnibox/browser/fake_autocomplete_provider_client.h" |
| #include "components/omnibox/browser/history_quick_provider.h" |
| #include "components/omnibox/browser/verbatim_match.h" |
| #include "components/omnibox/common/omnibox_features.h" |
| #include "components/prefs/pref_service.h" |
| #include "components/search_engines/default_search_manager.h" |
| #include "components/search_engines/template_url.h" |
| #include "components/search_engines/template_url_service.h" |
| #include "components/search_engines/template_url_starter_pack_data.h" |
| #include "components/url_formatter/url_fixer.h" |
| #include "testing/gtest/include/gtest/gtest.h" |
| #include "third_party/metrics_proto/omnibox_event.pb.h" |
| #include "third_party/metrics_proto/omnibox_focus_type.pb.h" |
| #include "third_party/metrics_proto/omnibox_input_type.pb.h" |
| #include "ui/base/page_transition_types.h" |
| |
| using base::ASCIIToUTF16; |
| using base::Time; |
| |
| namespace { |
| |
| struct TestURLInfo { |
| const char* url; |
| const char* title; |
| int visit_count; |
| int typed_count; |
| int age_in_days; |
| bool hidden = false; |
| }; |
| auto test_db = std::to_array<TestURLInfo>({ |
| {"http://www.google.com/", "Google", 3, 3, 80}, |
| |
| // High-quality pages should get a host synthesized as a lower-quality |
| // match. |
| {"http://slashdot.org/favorite_page.html", "Favorite page", 200, 100, 80}, |
| |
| // Less popular pages should have hosts synthesized as higher-quality |
| // matches. |
| {"http://kerneltrap.org/not_very_popular.html", "Less popular", 4, 0, 80}, |
| |
| // Unpopular pages should not appear in the results at all. |
| {"http://freshmeat.net/unpopular.html", "Unpopular", 1, 0, 80}, |
| |
| // If a host has a match, we should pick it up during host synthesis. |
| {"http://news.google.com/?ned=us&topic=n", "Google News - U.S.", 2, 2, 80}, |
| {"http://news.google.com/", "Google News", 1, 1, 80}, |
| |
| // Matches that are normally not inline-autocompletable should be |
| // autocompleted if they are shorter substitutes for longer matches that |
| // would have been inline autocompleted. |
| {"http://synthesisatest.com/foo/", "Test A", 1, 1, 80}, |
| {"http://synthesisbtest.com/foo/", "Test B", 1, 1, 80}, |
| {"http://synthesisbtest.com/foo/bar.html", "Test B Bar", 2, 2, 80}, |
| |
| // Suggested short URLs must be "good enough" and must match user input. |
| {"http://foo.com/", "Dir", 5, 5, 80}, |
| {"http://foo.com/dir/", "Dir", 2, 2, 80}, |
| {"http://foo.com/dir/another/", "Dir", 5, 1, 80}, |
| {"http://foo.com/dir/another/again/", "Dir", 10, 0, 80}, |
| {"http://foo.com/dir/another/again/myfile.html", "File", 10, 2, 80}, |
| |
| // We throw in a lot of extra URLs here to make sure we're testing the |
| // history database's query, not just the autocomplete provider. |
| {"http://startest.com/y/a", "A", 2, 2, 80}, |
| {"http://startest.com/y/b", "B", 5, 2, 80}, |
| {"http://startest.com/x/c", "C", 5, 2, 80}, |
| {"http://startest.com/x/d", "D", 5, 5, 80}, |
| {"http://startest.com/y/e", "E", 4, 2, 80}, |
| {"http://startest.com/y/f", "F", 3, 2, 80}, |
| {"http://startest.com/y/g", "G", 3, 2, 80}, |
| {"http://startest.com/y/h", "H", 3, 2, 80}, |
| {"http://startest.com/y/i", "I", 3, 2, 80}, |
| {"http://startest.com/y/j", "J", 3, 2, 80}, |
| {"http://startest.com/y/k", "K", 3, 2, 80}, |
| {"http://startest.com/y/l", "L", 3, 2, 80}, |
| {"http://startest.com/y/m", "M", 3, 2, 80}, |
| |
| // A file: URL is useful for testing that fixup does the right thing w.r.t. |
| // the number of trailing slashes on the user's input. |
| {"file:///C:/foo.txt", "", 2, 2, 80}, |
| |
| // Results with absurdly high typed_counts so that very generic queries like |
| // "http" will give consistent results even if more data is added above. |
| {"http://bogussite.com/a", "Bogus A", 10002, 10000, 80}, |
| {"http://bogussite.com/b", "Bogus B", 10001, 10000, 80}, |
| {"http://bogussite.com/c", "Bogus C", 10000, 10000, 80}, |
| |
| // Domain name with number. |
| {"http://www.17173.com/", "Domain with number", 3, 3, 80}, |
| |
| // URLs to test exact-matching behavior. |
| {"http://go/", "Intranet URL", 1, 1, 80}, |
| {"http://gooey/", "Intranet URL 2", 5, 5, 80}, |
| // This entry is explicitly added as hidden |
| {"http://g/", "Intranet URL", 7, 7, 80, true}, |
| |
| // URLs for testing offset adjustment. |
| {"http://www.\xEA\xB5\x90\xEC\x9C\xA1.kr/", "Korean", 2, 2, 80}, |
| {"http://spaces.com/path%20with%20spaces/foo.html", "Spaces", 2, 2, 80}, |
| {"http://ms/c++%20style%20guide", "Style guide", 2, 2, 80}, |
| |
| // URLs for testing ctrl-enter behavior. |
| {"http://binky/", "Intranet binky", 2, 2, 80}, |
| {"http://winky/", "Intranet winky", 2, 2, 80}, |
| {"http://www.winky.com/", "Internet winky", 5, 0, 80}, |
| |
| // URLs used by EmptyVisits. |
| {"http://pandora.com/", "Pandora", 2, 2, 80}, |
| {"http://pa/", "pa", 0, 0, history::kLowQualityMatchAgeLimitInDays - 1}, |
| |
| // For intranet based tests. |
| {"http://intra/one", "Intranet", 2, 2, 80}, |
| {"http://intra/two", "Intranet two", 1, 1, 80}, |
| {"http://intra/three", "Intranet three", 2, 2, 80}, |
| {"https://www.prefixintra/one", "Intranet www", 1, 1, 80}, |
| {"http://moo/bar", "Intranet moo", 1, 1, 80}, |
| {"http://typedhost/typedpath", "Intranet typed", 1, 1, 80}, |
| {"http://typedhost/untypedpath", "Intranet untyped", 1, 0, 80}, |
| |
| {"http://x.com/one", "Internet", 2, 2, 80}, |
| {"http://x.com/two", "Internet two", 1, 1, 80}, |
| {"http://x.com/three", "Internet three", 2, 2, 80}, |
| |
| // For punycode tests. |
| {"http://puny.xn--h2by8byc123p.in/", "Punycode", 2, 2, 5}, |
| {"http://two_puny.xn--1lq90ic7f1rc.cn/", |
| "Punycode to be rendered in Unicode", 2, 2, 5}, |
| |
| // For experimental HUP scoring test. |
| {"http://7.com/1a", "One", 8, 4, 4}, |
| {"http://7.com/2a", "Two A", 4, 2, 8}, |
| {"http://7.com/2b", "Two B", 4, 1, 8}, |
| {"http://7.com/3a", "Three", 2, 1, 16}, |
| {"http://7.com/4a", "Four A", 1, 1, 32}, |
| {"http://7.com/4b", "Four B", 1, 1, 64}, |
| {"http://7.com/5a", "Five A", 8, 0, 64}, // never typed. |
| |
| // For match URL formatting test. |
| {"https://www.abc.def.com/path", "URL with subdomain", 10, 10, 80}, |
| {"https://www.hij.com/path", "URL with www only", 10, 10, 80}, |
| |
| // For URL-what-you-typed in history tests. |
| {"https://wytih/", "What you typed in history main", 1, 1, 80}, |
| {"https://www.wytih/", "What you typed in history www main", 2, 2, 80}, |
| {"https://www.wytih/page", "What you typed in history www page", 5, 5, 80}, |
| {"ftp://wytih/file", "What you typed in history ftp file", 6, 6, 80}, |
| {"https://www.wytih/file", "What you typed in history www file", 7, 7, 80}, |
| |
| // URLs containing whitespaces for inline autocompletion tests. |
| {"https://www.zebra.com/zebra", "zebra1", 7, 7, 80}, |
| {"https://www.zebra.com/zebras", "zebra2", 7, 7, 80}, |
| {"https://www.zebra.com/zebra s", "zebra3", 7, 7, 80}, |
| {"https://www.zebra.com/zebra s", "zebra4", 7, 7, 80}, |
| |
| // URL with "history" in it, to test the @history starter pack scope. |
| {"https://history.com/", "History.com", 1, 1, 80}, |
| }); |
| |
| } // namespace |
| |
| class HistoryURLProviderPublic : public HistoryURLProvider { |
| public: |
| HistoryURLProviderPublic(AutocompleteProviderClient* client, |
| AutocompleteProviderListener* listener) |
| : HistoryURLProvider(client, listener) {} |
| |
| using HistoryURLProvider::HistoryMatchToACMatch; |
| using HistoryURLProvider::scoring_params_; |
| |
| protected: |
| ~HistoryURLProviderPublic() override = default; |
| }; |
| |
| class HistoryURLProviderTest : public testing::Test, |
| public AutocompleteProviderListener { |
| public: |
| struct UrlAndLegalDefault { |
| std::string url; |
| bool allowed_to_be_default_match; |
| }; |
| |
| HistoryURLProviderTest() : sort_matches_(false) { |
| HistoryQuickProvider::set_disabled(true); |
| } |
| |
| ~HistoryURLProviderTest() override { |
| HistoryQuickProvider::set_disabled(false); |
| } |
| |
| HistoryURLProviderTest(const HistoryURLProviderTest&) = delete; |
| HistoryURLProviderTest& operator=(const HistoryURLProviderTest&) = delete; |
| |
| // AutocompleteProviderListener: |
| void OnProviderUpdate(bool updated_matches, |
| const AutocompleteProvider* provider) override; |
| |
| protected: |
| // testing::Test |
| void SetUp() override { ASSERT_TRUE(SetUpImpl(true)); } |
| void TearDown() override; |
| |
| // Does the real setup. |
| [[nodiscard]] bool SetUpImpl(bool create_history_db); |
| |
| // Fills test data into the history system. |
| void FillData(); |
| |
| // Runs an autocomplete query on |text| and checks to see that the returned |
| // results' destination URLs match those provided. Also allows checking |
| // that the input type was identified correctly. |
| void RunTest(const std::u16string& text, |
| const std::string& desired_tld, |
| bool prevent_inline_autocomplete, |
| base::span<const UrlAndLegalDefault> expected_urls, |
| metrics::OmniboxInputType* identified_input_type); |
| |
| // A version of the above without the final |type| output parameter. |
| void RunTest(const std::u16string& text, |
| const std::string& desired_tld, |
| bool prevent_inline_autocomplete, |
| base::span<const UrlAndLegalDefault> expected_urls) { |
| metrics::OmniboxInputType type; |
| return RunTest(text, desired_tld, prevent_inline_autocomplete, |
| expected_urls, &type); |
| } |
| |
| // Verifies that for the given |input_text|, the first match's contents |
| // are |expected_match_contents|. Also verifies that there is a correctly |
| // positioned match classification within the contents. |
| void ExpectFormattedFullMatch(const std::string& input_text, |
| const wchar_t* expected_match_contents, |
| size_t expected_match_location, |
| size_t expected_match_length); |
| |
| base::ScopedTempDir history_dir_; |
| base::test::TaskEnvironment task_environment_; |
| ACMatches matches_; |
| std::unique_ptr<FakeAutocompleteProviderClient> client_; |
| scoped_refptr<HistoryURLProviderPublic> provider_; |
| // Should the matches be sorted and duplicates removed? |
| bool sort_matches_; |
| base::OnceClosure quit_closure_; |
| }; |
| |
| class HistoryURLProviderTestNoDB : public HistoryURLProviderTest { |
| protected: |
| void SetUp() override { ASSERT_TRUE(SetUpImpl(false)); } |
| }; |
| |
| class HistoryURLProviderTestNoSearchProvider : public HistoryURLProviderTest { |
| protected: |
| void SetUp() override { |
| DefaultSearchManager::SetFallbackSearchEnginesDisabledForTesting(true); |
| HistoryURLProviderTest::SetUp(); |
| } |
| |
| void TearDown() override { |
| HistoryURLProviderTest::TearDown(); |
| DefaultSearchManager::SetFallbackSearchEnginesDisabledForTesting(false); |
| } |
| }; |
| |
| void HistoryURLProviderTest::OnProviderUpdate( |
| bool updated_matches, |
| const AutocompleteProvider* provider) { |
| if (provider_->done()) { |
| std::move(quit_closure_).Run(); |
| } |
| } |
| |
| bool HistoryURLProviderTest::SetUpImpl(bool create_history_db) { |
| client_ = std::make_unique<FakeAutocompleteProviderClient>(); |
| CHECK(history_dir_.CreateUniqueTempDir()); |
| client_->set_history_service( |
| history::CreateHistoryService(history_dir_.GetPath(), create_history_db)); |
| client_->set_bookmark_model(bookmarks::TestBookmarkClient::CreateModel()); |
| if (!client_->GetHistoryService()) |
| return false; |
| provider_ = |
| base::MakeRefCounted<HistoryURLProviderPublic>(client_.get(), this); |
| FillData(); |
| return true; |
| } |
| |
| void HistoryURLProviderTest::TearDown() { |
| matches_.clear(); |
| provider_ = nullptr; |
| client_.reset(); |
| task_environment_.RunUntilIdle(); |
| } |
| |
| void HistoryURLProviderTest::FillData() { |
| // Most visits are a long time ago (some tests require this since we do some |
| // special logic for things visited very recently). Note that this time must |
| // be more recent than the "expire history" threshold for the data to be kept |
| // in the main database. |
| // |
| // TODO(brettw) It would be nice if we could test this behavior, in which |
| // case the time would be specifed in the test_db structure. |
| const Time now = Time::Now(); |
| |
| for (size_t i = 0; i < std::size(test_db); ++i) { |
| const TestURLInfo& cur = test_db[i]; |
| const GURL current_url(cur.url); |
| client_->GetHistoryService()->AddPageWithDetails( |
| current_url, base::UTF8ToUTF16(cur.title), cur.visit_count, |
| cur.typed_count, now - base::Days(cur.age_in_days), cur.hidden, |
| history::SOURCE_BROWSED); |
| } |
| } |
| |
| void HistoryURLProviderTest::RunTest( |
| const std::u16string& text, |
| const std::string& desired_tld, |
| bool prevent_inline_autocomplete, |
| base::span<const UrlAndLegalDefault> expected_urls, |
| metrics::OmniboxInputType* identified_input_type) { |
| AutocompleteInput input(text, std::u16string::npos, desired_tld, |
| metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| input.set_prevent_inline_autocomplete(prevent_inline_autocomplete); |
| *identified_input_type = input.type(); |
| provider_->Start(input, false); |
| if (!provider_->done()) { |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| |
| matches_ = provider_->matches(); |
| if (sort_matches_) { |
| TemplateURLService* service = client_->GetTemplateURLService(); |
| AutocompleteResult::DeduplicateMatches(&matches_, input, service); |
| std::sort(matches_.begin(), matches_.end(), |
| &AutocompleteMatch::MoreRelevant); |
| } |
| SCOPED_TRACE(u"input = " + text); |
| ASSERT_EQ(expected_urls.size(), matches_.size()) |
| << "Input text: " << text << "\nTLD: \"" << desired_tld << "\""; |
| for (size_t i = 0; i < expected_urls.size(); ++i) { |
| EXPECT_EQ(expected_urls[i].url, matches_[i].destination_url.spec()); |
| EXPECT_EQ(expected_urls[i].allowed_to_be_default_match, |
| matches_[i].allowed_to_be_default_match); |
| } |
| } |
| |
| void HistoryURLProviderTest::ExpectFormattedFullMatch( |
| const std::string& input_text, |
| const wchar_t* expected_match_contents, |
| size_t expected_match_location, |
| size_t expected_match_length) { |
| std::u16string expected_match_contents_string = |
| base::WideToUTF16(expected_match_contents); |
| ASSERT_FALSE(expected_match_contents_string.empty()); |
| |
| SCOPED_TRACE("input = " + input_text); |
| SCOPED_TRACE(u"expected_match_contents = " + expected_match_contents_string); |
| |
| AutocompleteInput input(ASCIIToUTF16(input_text), |
| metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| provider_->Start(input, false); |
| if (!provider_->done()) { |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| |
| // Test the variations of URL formatting on the first match. |
| auto& match = provider_->matches().front(); |
| EXPECT_EQ(expected_match_contents_string, match.contents); |
| |
| // Verify pre-match portion classification, if it should exist. |
| auto classification_it = match.contents_class.begin(); |
| ASSERT_NE(classification_it, match.contents_class.end()); |
| if (expected_match_location > 0) { |
| EXPECT_EQ(ACMatchClassification::URL, classification_it->style); |
| EXPECT_EQ(0U, classification_it->offset); |
| ++classification_it; |
| } |
| |
| // Verify the match portion classification. |
| ASSERT_NE(classification_it, match.contents_class.end()); |
| EXPECT_EQ(ACMatchClassification::URL | ACMatchClassification::MATCH, |
| classification_it->style); |
| EXPECT_EQ(expected_match_location, classification_it->offset); |
| ++classification_it; |
| |
| // Verify post-match portion classification, if it should exist. |
| size_t post_match_offset = expected_match_location + expected_match_length; |
| if (post_match_offset < expected_match_contents_string.length()) { |
| ASSERT_NE(classification_it, match.contents_class.end()); |
| EXPECT_EQ(ACMatchClassification::URL, classification_it->style); |
| EXPECT_EQ(post_match_offset, classification_it->offset); |
| } |
| } |
| |
| TEST_F(HistoryURLProviderTest, PromoteShorterURLs) { |
| // Test that hosts get synthesized below popular pages. |
| const UrlAndLegalDefault expected_nonsynth[] = { |
| {"http://slashdot.org/favorite_page.html", false}, |
| {"http://slashdot.org/", false}}; |
| RunTest(u"slash", std::string(), true, expected_nonsynth); |
| |
| // Test that hosts get synthesized above less popular pages. |
| const UrlAndLegalDefault expected_synth[] = { |
| {"http://kerneltrap.org/", false}, |
| {"http://kerneltrap.org/not_very_popular.html", false}}; |
| RunTest(u"kernel", std::string(), true, expected_synth); |
| |
| // Test that unpopular pages are ignored completely. |
| RunTest(u"fresh", std::string(), true, {}); |
| |
| // Test that if we create or promote shorter suggestions that would not |
| // normally be inline autocompletable, we make them inline autocompletable if |
| // the original suggestion (that we replaced as "top") was inline |
| // autocompletable. |
| const UrlAndLegalDefault expected_synthesisa[] = { |
| {"http://synthesisatest.com/", true}, |
| {"http://synthesisatest.com/foo/", true}}; |
| RunTest(u"synthesisa", std::string(), false, expected_synthesisa); |
| EXPECT_LT(matches_.front().relevance, 1200); |
| const UrlAndLegalDefault expected_synthesisb[] = { |
| {"http://synthesisbtest.com/foo/", true}, |
| {"http://synthesisbtest.com/foo/bar.html", true}}; |
| RunTest(u"synthesisb", std::string(), false, expected_synthesisb); |
| EXPECT_GE(matches_.front().relevance, 1410); |
| |
| // Test that if we have a synthesized host that matches a suggestion, they |
| // get combined into one. |
| const UrlAndLegalDefault expected_combine[] = { |
| {"http://news.google.com/", false}, |
| {"http://news.google.com/?ned=us&topic=n", false}, |
| }; |
| ASSERT_NO_FATAL_FAILURE( |
| RunTest(u"news", std::string(), true, expected_combine)); |
| // The title should also have gotten set properly on the host for the |
| // synthesized one, since it was also in the results. |
| EXPECT_EQ(u"Google News", matches_.front().description); |
| |
| // Test that short URL matching works correctly as the user types more |
| // (several tests): |
| // The entry for foo.com is the best of all five foo.com* entries. |
| const UrlAndLegalDefault short_1[] = { |
| {"http://foo.com/", false}, |
| {"http://foo.com/dir/another/again/myfile.html", false}, |
| {"http://foo.com/dir/", false}}; |
| RunTest(u"foo", std::string(), true, short_1); |
| |
| // When the user types the whole host, make sure we don't get two results for |
| // it. |
| const UrlAndLegalDefault short_2[] = { |
| {"http://foo.com/", true}, |
| {"http://foo.com/dir/another/again/myfile.html", false}, |
| {"http://foo.com/dir/", false}, |
| {"http://foo.com/dir/another/", false}}; |
| RunTest(u"foo.com", std::string(), true, short_2); |
| RunTest(u"foo.com/", std::string(), true, short_2); |
| |
| // The filename is the second best of the foo.com* entries, but there is a |
| // shorter URL that's "good enough". The host doesn't match the user input |
| // and so should not appear. |
| const UrlAndLegalDefault short_3[] = { |
| {"http://foo.com/dir/another/", false}, |
| {"http://foo.com/d", true}, |
| {"http://foo.com/dir/another/again/myfile.html", false}, |
| {"http://foo.com/dir/", false}}; |
| RunTest(u"foo.com/d", std::string(), true, short_3); |
| // If prevent_inline_autocomplete is false, we won't bother creating the |
| // URL-what-you-typed match because we have promoted inline autocompletions. |
| const UrlAndLegalDefault short_3_allow_inline[] = { |
| {"http://foo.com/dir/another/", true}, |
| {"http://foo.com/dir/another/again/myfile.html", true}, |
| {"http://foo.com/dir/", true}}; |
| RunTest(u"foo.com/d", std::string(), false, short_3_allow_inline); |
| |
| // We shouldn't promote shorter URLs than the best if they're not good |
| // enough. |
| const UrlAndLegalDefault short_4[] = { |
| {"http://foo.com/dir/another/again/myfile.html", false}, |
| {"http://foo.com/dir/another/a", true}, |
| {"http://foo.com/dir/another/again/", false}}; |
| RunTest(u"foo.com/dir/another/a", std::string(), true, short_4); |
| // If prevent_inline_autocomplete is false, we won't bother creating the |
| // URL-what-you-typed match because we have promoted inline autocompletions. |
| const UrlAndLegalDefault short_4_allow_inline[] = { |
| {"http://foo.com/dir/another/again/myfile.html", true}, |
| {"http://foo.com/dir/another/again/", true}}; |
| RunTest(u"foo.com/dir/another/a", std::string(), false, short_4_allow_inline); |
| |
| // Exact matches should always be best no matter how much more another match |
| // has been typed. |
| const UrlAndLegalDefault short_5a[] = {{"http://gooey/", true}, |
| {"http://www.google.com/", true}, |
| {"http://go/", true}}; |
| const UrlAndLegalDefault short_5b[] = {{"http://go/", true}, |
| {"http://gooey/", true}, |
| {"http://www.google.com/", true}}; |
| // Note that there is an http://g/ URL that is marked as hidden. It shouldn't |
| // show up at all. This test implicitly tests this fact too. |
| RunTest(u"g", std::string(), false, short_5a); |
| RunTest(u"go", std::string(), false, short_5b); |
| } |
| |
| TEST_F(HistoryURLProviderTest, CullRedirects) { |
| // URLs we will be using, plus the visit counts they will initially get |
| // (the redirect set below will also increment the visit counts). We want |
| // the results to be in A,B,C order. Note also that our visit counts are |
| // all high enough so that domain synthesizing won't get triggered. |
| struct TestCase { |
| const char* url; |
| int count; |
| }; |
| auto test_cases = std::to_array<TestCase>({ |
| {"http://redirects/A", 30}, |
| {"http://redirects/B", 20}, |
| {"http://redirects/C", 10}, |
| }); |
| for (size_t i = 0; i < std::size(test_cases); ++i) { |
| client_->GetHistoryService()->AddPageWithDetails( |
| GURL(test_cases[i].url), u"Title", test_cases[i].count, |
| test_cases[i].count, Time::Now(), false, history::SOURCE_BROWSED); |
| } |
| |
| // Create a B->C->A redirect chain, but set the visit counts such that they |
| // will appear in A,B,C order in the results. The autocomplete query will |
| // search for the most recent visit when looking for redirects, so this will |
| // be found even though the previous visits had no redirects. |
| history::RedirectList redirects_to_a; |
| redirects_to_a.push_back(GURL(test_cases[1].url)); |
| redirects_to_a.push_back(GURL(test_cases[2].url)); |
| redirects_to_a.push_back(GURL(test_cases[0].url)); |
| client_->GetHistoryService()->AddPage( |
| GURL(test_cases[0].url), Time::Now(), 0, 0, GURL(), redirects_to_a, |
| ui::PAGE_TRANSITION_TYPED, history::SOURCE_BROWSED, true); |
| |
| // Because all the results are part of a redirect chain with other results, |
| // all but the first one (A) should be culled. We should get the default |
| // "what you typed" result, plus this one. |
| const std::u16string typing(u"http://redirects/"); |
| const UrlAndLegalDefault expected_results[] = { |
| {test_cases[0].url, false}, {base::UTF16ToUTF8(typing), true}}; |
| RunTest(typing, std::string(), true, expected_results); |
| |
| // If prevent_inline_autocomplete is false, we won't bother creating the |
| // URL-what-you-typed match because we have promoted inline autocompletions. |
| // The result set should instead consist of a single URL representing the |
| // whole set of redirects. |
| const UrlAndLegalDefault expected_results_allow_inlining[] = { |
| {test_cases[0].url, true}}; |
| RunTest(typing, std::string(), false, expected_results_allow_inlining); |
| } |
| |
| TEST_F(HistoryURLProviderTestNoSearchProvider, WhatYouTypedNoSearchProvider) { |
| // When no search provider is available, make sure we provide what-you-typed |
| // matches for text that could be a URL. |
| |
| const UrlAndLegalDefault results_1[] = {{"http://wytmatch/", true}}; |
| RunTest(u"wytmatch", std::string(), false, results_1); |
| |
| RunTest(u"wytmatch foo bar", std::string(), false, {}); |
| RunTest(u"wytmatch+foo+bar", std::string(), false, {}); |
| |
| const UrlAndLegalDefault results_2[] = { |
| {"http://wytmatch+foo+bar.com/", true}}; |
| RunTest(u"wytmatch+foo+bar.com", std::string(), false, results_2); |
| } |
| |
| TEST_F(HistoryURLProviderTest, WhatYouTyped) { |
| // Make sure we suggest a What You Typed match at the right times. |
| RunTest(u"wytmatch", std::string(), false, {}); |
| RunTest(u"wytmatch foo bar", std::string(), false, {}); |
| RunTest(u"wytmatch+foo+bar", std::string(), false, {}); |
| RunTest(u"wytmatch+foo+bar.com", std::string(), false, {}); |
| |
| const UrlAndLegalDefault results_1[] = {{"http://www.wytmatch.com/", true}}; |
| RunTest(u"wytmatch", "com", false, results_1); |
| |
| const UrlAndLegalDefault results_2[] = { |
| {"http://wytmatch%20foo%20bar/", false}}; |
| RunTest(u"http://wytmatch foo bar", std::string(), false, results_2); |
| |
| const UrlAndLegalDefault results_3[] = { |
| {"https://wytmatch%20foo%20bar/", false}}; |
| RunTest(u"https://wytmatch foo bar", std::string(), false, results_3); |
| |
| const UrlAndLegalDefault results_4[] = {{"https://wytih/", true}, |
| {"https://www.wytih/file", true}, |
| {"ftp://wytih/file", true}, |
| {"https://www.wytih/page", true}}; |
| RunTest(u"wytih", std::string(), false, results_4); |
| |
| const UrlAndLegalDefault results_5[] = {{"https://www.wytih/", true}, |
| {"https://www.wytih/file", true}, |
| {"https://www.wytih/page", true}}; |
| RunTest(u"www.wytih", std::string(), false, results_5); |
| |
| const UrlAndLegalDefault results_6[] = {{"ftp://wytih/file", true}, |
| {"https://www.wytih/file", true}}; |
| RunTest(u"wytih/file", std::string(), false, results_6); |
| } |
| |
| // Test that the exact history match does not lose username/password |
| // credentials. |
| TEST_F(HistoryURLProviderTest, |
| WhatYouTyped_Exact_URLPreservesUsernameAndPassword) { |
| const UrlAndLegalDefault results_1[] = {{"https://user@wytih/", true}}; |
| RunTest(u"https://user@wytih", std::string(), false, results_1); |
| |
| const UrlAndLegalDefault results_2[] = { |
| {"https://user:pass@www.wytih/file", true}}; |
| RunTest(u"https://user:pass@www.wytih/file", std::string(), false, results_2); |
| } |
| |
| // Test that file: URLs are handled appropriately on each platform. |
| // url_formatter has per-platform logic for Windows vs POSIX, and |
| // AutocompleteInput has special casing for iOS and Android. |
| TEST_F(HistoryURLProviderTest, Files) { |
| #if BUILDFLAG(IS_IOS) || BUILDFLAG(IS_ANDROID) |
| // On iOS, check that file URIs are treated like queries. |
| AutocompleteInput ios_input_1( |
| u"file:///foo", std::u16string::npos, std::string(), |
| metrics::OmniboxEventProto::OTHER, TestSchemeClassifier()); |
| provider_->Start(ios_input_1, false); |
| if (!provider_->done()) { |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| EXPECT_EQ(matches_.size(), 0u); |
| #endif // BUILDFLAG(IS_IOS) |
| |
| #if !BUILDFLAG(IS_IOS) && !BUILDFLAG(IS_ANDROID) |
| // For everything but iOS, fixing up "file:" should result in an inline |
| // autocomplete offset of just after "file:", not just after "file://". |
| const std::u16string input_1(u"file:"); |
| const UrlAndLegalDefault fixup_1[] = {{"file:///C:/foo.txt", true}}; |
| ASSERT_NO_FATAL_FAILURE(RunTest(input_1, std::string(), false, fixup_1)); |
| EXPECT_EQ(u"///C:/foo.txt", matches_.front().inline_autocompletion); |
| #endif // !BUILDFLAG(IS_IOS) |
| |
| #if BUILDFLAG(IS_POSIX) && !BUILDFLAG(IS_IOS) && !BUILDFLAG(IS_ANDROID) |
| // url_formatter::SegmentURLInternal does URL fixup differently depending on |
| // platform. On all POSIX systems including iOS, /foo --> file:///foo. |
| const std::u16string input_2(u"/foo"); |
| const UrlAndLegalDefault fixup_2[] = {{"file:///foo", true}}; |
| ASSERT_NO_FATAL_FAILURE(RunTest(input_2, std::string(), false, fixup_2)); |
| EXPECT_TRUE(matches_[0].destination_url.SchemeIsFile()); |
| #elif BUILDFLAG(IS_IOS) || BUILDFLAG(IS_ANDROID) |
| // However, AutocompleteInput ignores the URL fixup on iOS because it |
| // treates iOS like a query. |
| AutocompleteInput ios_input_2(u"/foo", std::u16string::npos, std::string(), |
| metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| provider_->Start(ios_input_2, false); |
| if (!provider_->done()) { |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| EXPECT_EQ(matches_.size(), 0u); |
| #endif // BUILDFLAG(IS_POSIX) && !BUILDFLAG(IS_IOS) |
| } |
| |
| TEST_F(HistoryURLProviderTest, Fixup) { |
| // Test for various past crashes we've had. |
| RunTest(u"\\", std::string(), false, {}); |
| RunTest(u"#", std::string(), false, {}); |
| RunTest(u"%20", std::string(), false, {}); |
| const UrlAndLegalDefault fixup_crash[] = {{"http://%EF%BD%A5@s/", false}}; |
| RunTest(u"\uff65@s", std::string(), false, fixup_crash); |
| RunTest(u"\u2015\u2015@ \uff7c", std::string(), false, {}); |
| |
| // Fixing up "http:/" should result in an inline autocomplete offset of just |
| // after "http:/", not just after "http:". |
| const std::u16string input_2(u"http:/"); |
| const UrlAndLegalDefault fixup_2[] = {{"http://bogussite.com/a", true}, |
| {"http://bogussite.com/b", true}, |
| {"http://bogussite.com/c", true}}; |
| ASSERT_NO_FATAL_FAILURE(RunTest(input_2, std::string(), false, fixup_2)); |
| EXPECT_EQ(u"/bogussite.com/a", matches_.front().inline_autocompletion); |
| |
| // Adding a TLD to a small number like "56" should result in "www.56.com" |
| // rather than "0.0.0.56.com". |
| const UrlAndLegalDefault fixup_3[] = {{"http://www.56.com/", true}}; |
| RunTest(u"56", "com", true, fixup_3); |
| |
| // An input looks like a IP address like "127.0.0.1" should result in |
| // "http://127.0.0.1/". |
| const UrlAndLegalDefault fixup_4[] = {{"http://127.0.0.1/", true}}; |
| RunTest(u"127.0.0.1", std::string(), false, fixup_4); |
| |
| // An number "17173" should result in "http://www.17173.com/" in db. |
| const UrlAndLegalDefault fixup_5[] = {{"http://www.17173.com/", true}}; |
| RunTest(u"17173", std::string(), false, fixup_5); |
| } |
| |
| // Make sure the results for the input 'p' don't change between the first and |
| // second passes. |
| TEST_F(HistoryURLProviderTest, EmptyVisits) { |
| // Wait for history to create the in memory DB. |
| history::BlockUntilHistoryProcessesPendingRequests( |
| client_->GetHistoryService()); |
| |
| AutocompleteInput input(u"pa", metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| provider_->Start(input, false); |
| // HistoryURLProvider shouldn't be done (waiting on async results). |
| EXPECT_FALSE(provider_->done()); |
| |
| // We should get back an entry for pandora. |
| matches_ = provider_->matches(); |
| ASSERT_GT(matches_.size(), 0u); |
| EXPECT_EQ(GURL("http://pandora.com/"), matches_[0].destination_url); |
| int pandora_relevance = matches_[0].relevance; |
| |
| // Run the message loop. When |autocomplete_| finishes the loop is quit. |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| EXPECT_TRUE(provider_->done()); |
| matches_ = provider_->matches(); |
| ASSERT_GT(matches_.size(), 0u); |
| EXPECT_EQ(GURL("http://pandora.com/"), matches_[0].destination_url); |
| EXPECT_EQ(pandora_relevance, matches_[0].relevance); |
| } |
| |
| TEST_F(HistoryURLProviderTestNoDB, NavigateWithoutDB) { |
| // Ensure that we will still produce matches for navigation when there is no |
| // database. |
| UrlAndLegalDefault navigation_1[] = {{"http://test.com/", true}}; |
| RunTest(u"test.com", std::string(), false, navigation_1); |
| |
| UrlAndLegalDefault navigation_2[] = {{"http://slash/", false}}; |
| RunTest(u"slash", std::string(), false, navigation_2); |
| |
| RunTest(u"this is a query", std::string(), false, {}); |
| } |
| |
| TEST_F(HistoryURLProviderTest, AutocompleteOnTrailingWhitespace) { |
| struct AutocompletionExpectation { |
| std::string fill_into_edit; |
| std::string inline_autocompletion; |
| bool allowed_to_be_default_match; |
| }; |
| |
| auto TestAutocompletion = |
| [this](std::string input_text, bool input_prevent_inline_autocomplete, |
| const std::vector<AutocompletionExpectation>& expectations) { |
| const std::string debug = base::StringPrintf( |
| "input text [%s], prevent inline [%d]", input_text.c_str(), |
| input_prevent_inline_autocomplete); |
| |
| AutocompleteInput input(ASCIIToUTF16(input_text), |
| metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| input.set_prevent_inline_autocomplete( |
| input_prevent_inline_autocomplete); |
| provider_->Start(input, false); |
| if (!provider_->done()) { |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| |
| matches_ = provider_->matches(); |
| EXPECT_EQ(matches_.size(), expectations.size()) << debug; |
| for (size_t i = 0; i < matches_.size(); ++i) { |
| EXPECT_EQ(matches_[i].fill_into_edit, |
| ASCIIToUTF16(expectations[i].fill_into_edit)) |
| << debug; |
| if (matches_[i].allowed_to_be_default_match) { |
| EXPECT_EQ(matches_[i].inline_autocompletion, |
| ASCIIToUTF16(expectations[i].inline_autocompletion)) |
| << debug; |
| } |
| EXPECT_EQ(matches_[i].allowed_to_be_default_match, |
| expectations[i].allowed_to_be_default_match) |
| << debug; |
| } |
| }; |
| |
| TestAutocompletion("zebra.com/zebra", false, |
| { |
| {"zebra.com/zebra", "", true}, |
| {"https://www.zebra.com/zebras", "s", true}, |
| {"https://www.zebra.com/zebra s", " s", true}, |
| {"https://www.zebra.com/zebra s", " s", true}, |
| }); |
| |
| TestAutocompletion("zebra.com/zebra ", false, |
| { |
| {"zebra.com/zebra", "", true}, |
| {"https://www.zebra.com/zebras", "", false}, |
| {"https://www.zebra.com/zebra s", "s", true}, |
| {"https://www.zebra.com/zebra s", " s", true}, |
| }); |
| |
| TestAutocompletion("zebra.com/zebra ", false, |
| { |
| {"zebra.com/zebra", "", true}, |
| {"https://www.zebra.com/zebras", "", false}, |
| {"https://www.zebra.com/zebra s", "", false}, |
| {"https://www.zebra.com/zebra s", "s", true}, |
| }); |
| |
| TestAutocompletion("zebra.com/zebra", true, |
| { |
| {"zebra.com/zebra", "", true}, |
| {"https://www.zebra.com/zebras", "", false}, |
| {"https://www.zebra.com/zebra s", "", false}, |
| {"https://www.zebra.com/zebra s", "", false}, |
| }); |
| |
| TestAutocompletion("zebra.com/zebras", false, |
| { |
| {"zebra.com/zebras", "", true}, |
| }); |
| |
| TestAutocompletion("zebra.com/zebra s", false, |
| { |
| {"zebra.com/zebra s", "", true}, |
| }); |
| } |
| |
| TEST_F(HistoryURLProviderTest, TreatEmailsAsSearches) { |
| // Visiting foo.com should not make this string be treated as a navigation. |
| // That means the result should not be allowed to be default, and it should |
| // be scored around 1200 rather than 1400+. |
| const UrlAndLegalDefault expected[] = {{"http://user@foo.com/", false}}; |
| ASSERT_NO_FATAL_FAILURE( |
| RunTest(u"user@foo.com", std::string(), false, expected)); |
| EXPECT_LE(1200, matches_[0].relevance); |
| EXPECT_LT(matches_[0].relevance, 1210); |
| } |
| |
| TEST_F(HistoryURLProviderTest, IntranetURLsWithPaths) { |
| struct TestCase { |
| const char* input; |
| int relevance; |
| bool allowed_to_be_default_match; |
| }; |
| auto test_cases = std::to_array<TestCase>({ |
| {"fooey", 0, false}, |
| {"fooey/", 1200, true}, // 1200 for URL would still navigate by default. |
| {"fooey/a", 1200, false}, // 1200 for UNKNOWN would not. |
| {"fooey/a b", 1200, false}, // Also UNKNOWN. |
| {"gooey", 1410, true}, |
| {"gooey/", 1410, true}, |
| {"gooey/a", 1400, true}, |
| {"gooey/a b", 1400, true}, |
| }); |
| for (size_t i = 0; i < std::size(test_cases); ++i) { |
| SCOPED_TRACE(test_cases[i].input); |
| if (test_cases[i].relevance == 0) { |
| RunTest(ASCIIToUTF16(test_cases[i].input), std::string(), false, {}); |
| } else { |
| const UrlAndLegalDefault output[] = { |
| {url_formatter::FixupURL(test_cases[i].input, std::string()).spec(), |
| test_cases[i].allowed_to_be_default_match}}; |
| ASSERT_NO_FATAL_FAILURE(RunTest(ASCIIToUTF16(test_cases[i].input), |
| std::string(), false, output)); |
| // Actual relevance should be at least what test_cases expects and |
| // and no more than 10 more. |
| EXPECT_LE(test_cases[i].relevance, matches_[0].relevance); |
| EXPECT_LT(matches_[0].relevance, test_cases[i].relevance + 10); |
| } |
| } |
| } |
| |
| // Makes sure autocompletion happens for intranet sites that have been |
| // previoulsy visited. |
| TEST_F(HistoryURLProviderTest, IntranetURLCompletion) { |
| sort_matches_ = true; |
| |
| const UrlAndLegalDefault expected1[] = {{"http://intra/three", true}, |
| {"http://intra/two", true}}; |
| ASSERT_NO_FATAL_FAILURE(RunTest(u"intra/t", std::string(), false, expected1)); |
| EXPECT_LE(1410, matches_[0].relevance); |
| EXPECT_LT(matches_[0].relevance, 1420); |
| // It uses the default scoring. |
| EXPECT_EQ(matches_[1].relevance, 1203); |
| |
| const UrlAndLegalDefault expected2[] = {{"http://moo/b", true}, |
| {"http://moo/bar", true}}; |
| ASSERT_NO_FATAL_FAILURE(RunTest(u"moo/b", std::string(), false, expected2)); |
| // The url what you typed match should be around 1400, otherwise the |
| // search what you typed match is going to be first. |
| EXPECT_LE(1400, matches_[0].relevance); |
| EXPECT_LT(matches_[0].relevance, 1410); |
| |
| const UrlAndLegalDefault expected3[] = {{"http://intra/three", true}, |
| {"http://intra/one", true}, |
| {"http://intra/two", true}}; |
| RunTest(u"intra", std::string(), false, expected3); |
| |
| const UrlAndLegalDefault expected4[] = {{"http://intra/three", true}, |
| {"http://intra/one", true}, |
| {"http://intra/two", true}}; |
| RunTest(u"intra/", std::string(), false, expected4); |
| |
| const UrlAndLegalDefault expected5[] = {{"http://intra/one", true}}; |
| ASSERT_NO_FATAL_FAILURE(RunTest(u"intra/o", std::string(), false, expected5)); |
| EXPECT_LE(1410, matches_[0].relevance); |
| EXPECT_LT(matches_[0].relevance, 1420); |
| |
| const UrlAndLegalDefault expected6[] = {{"http://intra/x", true}}; |
| ASSERT_NO_FATAL_FAILURE(RunTest(u"intra/x", std::string(), false, expected6)); |
| EXPECT_LE(1400, matches_[0].relevance); |
| EXPECT_LT(matches_[0].relevance, 1410); |
| |
| const UrlAndLegalDefault expected7[] = { |
| {"http://typedhost/untypedpath", true}}; |
| ASSERT_NO_FATAL_FAILURE( |
| RunTest(u"typedhost/untypedpath", std::string(), false, expected7)); |
| EXPECT_LE(1400, matches_[0].relevance); |
| EXPECT_LT(matches_[0].relevance, 1410); |
| |
| const UrlAndLegalDefault expected8[] = {{"https://www.prefixintra/x", true}}; |
| ASSERT_NO_FATAL_FAILURE( |
| RunTest(u"prefixintra/x", std::string(), false, expected8)); |
| } |
| |
| TEST_F(HistoryURLProviderTest, CrashDueToFixup) { |
| // This test passes if we don't crash. The results don't matter. |
| const auto test_cases = std::to_array<const char*>({ |
| "//c", |
| "\\@st", |
| "view-source:x", |
| }); |
| for (size_t i = 0; i < std::size(test_cases); ++i) { |
| AutocompleteInput input(ASCIIToUTF16(test_cases[i]), |
| metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| provider_->Start(input, false); |
| if (!provider_->done()) { |
| base::RunLoop loop; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| } |
| } |
| |
| TEST_F(HistoryURLProviderTest, DoesNotProvideMatchesOnFocus) { |
| AutocompleteInput input(u"foo", metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| input.set_focus_type(metrics::OmniboxFocusType::INTERACTION_FOCUS); |
| provider_->Start(input, false); |
| EXPECT_TRUE(provider_->matches().empty()); |
| } |
| |
| TEST_F(HistoryURLProviderTest, DoesNotInlinePunycodeMatches) { |
| // A URL that matches due to a match in the punycode URL is allowed to be the |
| // default match if the URL doesn't get rendered as international characters. |
| const UrlAndLegalDefault expected1_true[] = { |
| {"http://puny.xn--h2by8byc123p.in/", true}, |
| }; |
| RunTest(u"pun", std::string(), false, expected1_true); |
| RunTest(u"puny.", std::string(), false, expected1_true); |
| RunTest(u"puny.x", std::string(), false, expected1_true); |
| RunTest(u"puny.xn", std::string(), false, expected1_true); |
| RunTest(u"puny.xn--", std::string(), false, expected1_true); |
| RunTest(u"puny.xn--h2", std::string(), false, expected1_true); |
| RunTest(u"puny.xn--h2by8byc123p", std::string(), false, expected1_true); |
| RunTest(u"puny.xn--h2by8byc123p.", std::string(), false, expected1_true); |
| |
| // When the punycode part of the URL is rendered as international characters, |
| // this match should not be allowed to be the default match if the inline |
| // autocomplete text starts in the middle of the international characters. |
| const UrlAndLegalDefault expected2_true[] = { |
| {"http://two_puny.xn--1lq90ic7f1rc.cn/", true}, |
| }; |
| const UrlAndLegalDefault expected2_false[] = { |
| {"http://two_puny.xn--1lq90ic7f1rc.cn/", false}, |
| }; |
| RunTest(u"two", std::string(), false, expected2_true); |
| RunTest(u"two_puny.", std::string(), false, expected2_true); |
| RunTest(u"two_puny.x", std::string(), false, expected2_false); |
| RunTest(u"two_puny.xn", std::string(), false, expected2_false); |
| RunTest(u"two_puny.xn--", std::string(), false, expected2_false); |
| RunTest(u"two_puny.xn--1l", std::string(), false, expected2_false); |
| RunTest(u"two_puny.xn--1lq90ic7f1rc", std::string(), false, expected2_true); |
| RunTest(u"two_puny.xn--1lq90ic7f1rc.", std::string(), false, expected2_true); |
| } |
| |
| TEST_F(HistoryURLProviderTest, CullSearchResults) { |
| // Set up a default search engine. |
| TemplateURLData data; |
| data.SetShortName(u"TestEngine"); |
| data.SetKeyword(u"TestEngine"); |
| data.SetURL("http://testsearch.com/?q={searchTerms}"); |
| TemplateURLService* template_url_service = client_->GetTemplateURLService(); |
| TemplateURL* template_url = |
| template_url_service->Add(std::make_unique<TemplateURL>(data)); |
| template_url_service->SetUserSelectedDefaultSearchProvider(template_url); |
| template_url_service->Load(); |
| |
| // URLs we will be using, plus the visit counts they will initially get |
| // (the redirect set below will also increment the visit counts). We want |
| // the results to be in A,B,C order. Note also that our visit counts are |
| // all high enough so that domain synthesizing won't get triggered. |
| struct TestCase { |
| const char* url; |
| int count; |
| }; |
| auto test_cases = std::to_array<TestCase>({ |
| {"https://testsearch.com/", 30}, |
| {"https://testsearch.com/?q=foobar", 20}, |
| {"http://foobar.com/", 10}, |
| }); |
| for (size_t i = 0; i < std::size(test_cases); ++i) { |
| client_->GetHistoryService()->AddPageWithDetails( |
| GURL(test_cases[i].url), u"Title", test_cases[i].count, |
| test_cases[i].count, Time::Now(), false, history::SOURCE_BROWSED); |
| } |
| |
| // We should not see search URLs when typing a previously used query. |
| const UrlAndLegalDefault expected_when_searching_query[] = { |
| {test_cases[2].url, false}}; |
| RunTest(u"foobar", std::string(), true, expected_when_searching_query); |
| |
| // We should not see search URLs when typing the search engine name. |
| const UrlAndLegalDefault expected_when_searching_site[] = { |
| {test_cases[0].url, false}}; |
| RunTest(u"testsearch", std::string(), true, expected_when_searching_site); |
| } |
| |
| TEST_F(HistoryURLProviderTest, SuggestExactInput) { |
| const size_t npos = std::string::npos; |
| struct TestCase { |
| // Inputs: |
| const char* input; |
| bool trim_http; |
| // Expected Outputs: |
| const char* contents; |
| // Offsets of the ACMatchClassifications, terminated by npos. |
| std::array<size_t, 3> offsets; |
| // The index of the ACMatchClassification that should have the MATCH bit |
| // set, npos if no ACMatchClassification should have the MATCH bit set. |
| size_t match_classification_index; |
| }; |
| auto test_cases = std::to_array<TestCase>({ |
| // clang-format off |
| { "http://www.somesite.com", false, |
| "http://www.somesite.com", {0, npos, npos}, 0 }, |
| { "http://www.somesite.com/", false, |
| "http://www.somesite.com", {0, npos, npos}, 0 }, |
| { "http://www.somesite.com/", false, |
| "http://www.somesite.com", {0, npos, npos}, 0 }, |
| { "www.somesite.com", true, |
| "www.somesite.com", {0, npos, npos}, 0 }, |
| { "somesite.com", true, |
| "somesite.com", {0, npos, npos}, 0 }, |
| { "w", true, |
| "w", {0, npos, npos}, 0 }, |
| { "w.com", true, |
| "w.com", {0, npos, npos}, 0 }, |
| { "www.w.com", true, |
| "www.w.com", {0, npos, npos}, 0 }, |
| { "view-source:w", true, |
| "view-source:w", {0, npos, npos}, 0 }, |
| { "view-source:www.w.com/", true, |
| "view-source:www.w.com", {0, npos, npos}, 0 }, |
| { "view-source:http://www.w.com/", false, |
| "view-source:http://www.w.com", {0, npos, npos}, 0 }, |
| { "view-source:", true, |
| "view-source:", {0, npos, npos}, 0 }, |
| { "http://w.com", false, |
| "http://w.com", {0, npos, npos}, 0 }, |
| { "http://www.w.com", false, |
| "http://www.w.com", {0, npos, npos}, 0 }, |
| { "http://a///www.w.com", false, |
| "http://a///www.w.com", {0, npos, npos}, 0 }, |
| { "http://a@b.com", false, "http://b.com", {0, npos, npos}, 0 }, |
| { "a@b.com", true, "b.com", {0, npos, npos} }, |
| { "mailto://a@b.com", true, |
| "mailto://b.com", {0, npos, npos}, 0 }, |
| { "mailto://a@b.com", false, |
| "mailto://b.com", {0, npos, npos}, 0 }, |
| { "http://a%20b/x%20y", false, |
| "http://a%20b/x y", {0, npos, npos}, 0 }, |
| #if !BUILDFLAG(IS_IOS) && !BUILDFLAG(IS_ANDROID) |
| // file: URIs are treated like queries on iOS and need to be excluded from |
| // this test, which assumes that all the inputs have canonical URLs. |
| { "file:///x%20y/a%20b", true, |
| "file:///x y/a b", {0, npos, npos}, 0 }, |
| { "file://x%20y/a%20b", true, |
| "file://x%20y/a b", {0, npos, npos}, 0 }, |
| #endif // !BUILDFLAG(IS_IOS) && !BUILDFLAG(IS_ANDROID) |
| { "view-source:x%20y/a%20b", true, |
| "view-source:x%20y/a b", {0, npos, npos}, 0 }, |
| { "view-source:http://x%20y/a%20b", false, |
| "view-source:http://x%20y/a b", {0, npos, npos}, 0 }, |
| // clang-format on |
| }); |
| for (size_t i = 0; i < std::size(test_cases); ++i) { |
| SCOPED_TRACE(testing::Message() |
| << "Index " << i << " input: " << test_cases[i].input |
| << ", trim_http: " << test_cases[i].trim_http); |
| |
| AutocompleteInput input(ASCIIToUTF16(test_cases[i].input), |
| metrics::OmniboxEventProto::BLANK, |
| TestSchemeClassifier()); |
| input.set_current_url(GURL("about:blank")); |
| AutocompleteMatch match(VerbatimMatchForInput( |
| provider_.get(), client_.get(), input, input.canonicalized_url(), |
| test_cases[i].trim_http)); |
| EXPECT_EQ(ASCIIToUTF16(test_cases[i].contents), match.contents); |
| for (size_t match_index = 0; match_index < match.contents_class.size(); |
| ++match_index) { |
| UNSAFE_TODO(EXPECT_EQ(test_cases[i].offsets[match_index], |
| match.contents_class[match_index].offset)); |
| EXPECT_EQ(ACMatchClassification::URL | |
| (match_index == test_cases[i].match_classification_index |
| ? ACMatchClassification::MATCH |
| : 0), |
| match.contents_class[match_index].style); |
| } |
| UNSAFE_TODO( |
| EXPECT_EQ(npos, test_cases[i].offsets[match.contents_class.size()])); |
| } |
| } |
| |
| TEST_F(HistoryURLProviderTest, HUPScoringExperiment) { |
| HUPScoringParams max_2000_no_time_decay; |
| max_2000_no_time_decay.typed_count_buckets.buckets().push_back( |
| std::make_pair(0.0, 2000)); |
| HUPScoringParams max_1250_no_time_decay; |
| max_1250_no_time_decay.typed_count_buckets.buckets().push_back( |
| std::make_pair(0.0, 1250)); |
| HUPScoringParams max_1000_no_time_decay; |
| max_1000_no_time_decay.typed_count_buckets.buckets().push_back( |
| std::make_pair(0.0, 1000)); |
| |
| HUPScoringParams max_1100_with_time_decay_and_max_cap; |
| max_1100_with_time_decay_and_max_cap.typed_count_buckets.set_relevance_cap( |
| 1400); |
| max_1100_with_time_decay_and_max_cap.typed_count_buckets.set_half_life_days( |
| 16); |
| max_1100_with_time_decay_and_max_cap.typed_count_buckets.buckets().push_back( |
| std::make_pair(0.5, 1100)); |
| max_1100_with_time_decay_and_max_cap.typed_count_buckets.buckets().push_back( |
| std::make_pair(0.24, 200)); |
| max_1100_with_time_decay_and_max_cap.typed_count_buckets.buckets().push_back( |
| std::make_pair(0.0, 100)); |
| |
| HUPScoringParams max_1100_visit_typed_decays; |
| max_1100_visit_typed_decays.typed_count_buckets.set_half_life_days(16); |
| max_1100_visit_typed_decays.typed_count_buckets.buckets().push_back( |
| std::make_pair(0.5, 1100)); |
| max_1100_visit_typed_decays.typed_count_buckets.buckets().push_back( |
| std::make_pair(0.0, 100)); |
| max_1100_visit_typed_decays.visited_count_buckets.set_half_life_days(16); |
| max_1100_visit_typed_decays.visited_count_buckets.buckets().push_back( |
| std::make_pair(0.5, 550)); |
| max_1100_visit_typed_decays.visited_count_buckets.buckets().push_back( |
| std::make_pair(0.0, 50)); |
| |
| const int kProviderMaxMatches = 3; |
| struct TestCase { |
| const char* input; |
| HUPScoringParams scoring_params; |
| struct ExpectedMatch { |
| const char* url; |
| int control_relevance; |
| int experiment_relevance; |
| }; |
| std::array<ExpectedMatch, kProviderMaxMatches> matches; |
| }; |
| auto test_cases = std::to_array<TestCase>({ |
| // Max score 2000 -> no demotion. |
| {"7.com/1", |
| max_2000_no_time_decay, |
| {{{"7.com/1a", 1413, 1413}, {nullptr, 0, 0}, {nullptr, 0, 0}}}}, |
| |
| // Limit score to 1250/1000 and make sure that the top match is unchanged. |
| {"7.com/1", |
| max_1250_no_time_decay, |
| {{{"7.com/1a", 1413, 1413}, {nullptr, 0, 0}, {nullptr, 0, 0}}}}, |
| {"7.com/2", |
| max_1250_no_time_decay, |
| {{{"7.com/2a", 1413, 1413}, {"7.com/2b", 1412, 1250}, {nullptr, 0, 0}}}}, |
| {"7.com/4", |
| max_1000_no_time_decay, |
| {{{"7.com/4", 1203, 1203}, |
| {"7.com/4a", 1202, 1000}, |
| {"7.com/4b", 1201, 999}}}}, |
| |
| // Max relevance cap is 1400 and half-life is 16 days. |
| {"7.com/1", |
| max_1100_with_time_decay_and_max_cap, |
| {{{"7.com/1a", 1413, 1413}, {nullptr, 0, 0}, {nullptr, 0, 0}}}}, |
| {"7.com/4", |
| max_1100_with_time_decay_and_max_cap, |
| {{{"7.com/4", 1203, 1203}, |
| {"7.com/4a", 1202, 200}, |
| {"7.com/4b", 1201, 100}}}}, |
| |
| // Max relevance cap is 1400 and half-life is 16 days for both |
| // visit/typed. |
| {"7.com/5", |
| max_1100_visit_typed_decays, |
| {{{"7.com/5", 1203, 1203}, {"7.com/5a", 1202, 50}, {nullptr, 0, 0}}}}, |
| }); |
| for (size_t i = 0; i < std::size(test_cases); ++i) { |
| SCOPED_TRACE(test_cases[i].input); |
| std::array<UrlAndLegalDefault, kProviderMaxMatches> output; |
| size_t max_matches; |
| for (max_matches = 0; max_matches < kProviderMaxMatches; ++max_matches) { |
| if (UNSAFE_TODO(test_cases[i].matches[max_matches]).url == nullptr) { |
| break; |
| } |
| output[max_matches].url = |
| url_formatter::FixupURL( |
| UNSAFE_TODO(test_cases[i].matches[max_matches]).url, |
| std::string()) |
| .spec(); |
| output[max_matches].allowed_to_be_default_match = true; |
| } |
| provider_->scoring_params_ = test_cases[i].scoring_params; |
| |
| // Test the experimental scoring params. |
| ASSERT_NO_FATAL_FAILURE(RunTest(ASCIIToUTF16(test_cases[i].input), |
| std::string(), false, |
| base::span(output).first(max_matches))); |
| for (size_t j = 0; j < max_matches; ++j) { |
| UNSAFE_TODO(EXPECT_EQ(test_cases[i].matches[j].experiment_relevance, |
| matches_[j].relevance)); |
| } |
| } |
| } |
| |
| TEST_F(HistoryURLProviderTest, MatchURLFormatting) { |
| // Sanity check behavior under default flags. |
| ExpectFormattedFullMatch("abc", L"www.abc.def.com/path", 4, 3); |
| ExpectFormattedFullMatch("hij", L"hij.com/path", 0, 3); |
| |
| // Sanity check that scheme, subdomain, and path can all be trimmed or elided. |
| ExpectFormattedFullMatch("hij", L"hij.com/path", 0, 3); |
| |
| // Verify that the scheme is preserved if part of match. |
| ExpectFormattedFullMatch("https://www.hi", L"https://www.hij.com/path", 0, |
| 14); |
| |
| // Verify that the whole subdomain is preserved if part of match. |
| ExpectFormattedFullMatch("abc", L"www.abc.def.com/path", 4, 3); |
| ExpectFormattedFullMatch("www.hij", L"www.hij.com/path", 0, 7); |
| |
| // Verify that the path is preserved if part of the match. |
| ExpectFormattedFullMatch("hij.com/path", L"hij.com/path", 0, 12); |
| |
| // Verify preserving both the scheme and subdomain. |
| ExpectFormattedFullMatch("https://www.hi", L"https://www.hij.com/path", 0, |
| 14); |
| |
| // Verify preserving everything. |
| ExpectFormattedFullMatch("https://www.hij.com/p", L"https://www.hij.com/path", |
| 0, 21); |
| |
| // Verify that upper case input still works for subdomain matching. |
| ExpectFormattedFullMatch("WWW.hij", L"www.hij.com/path", 0, 7); |
| |
| // Verify that matching in the subdomain-only preserves the subdomain. |
| ExpectFormattedFullMatch("ww", L"www.hij.com/path", 0, 2); |
| ExpectFormattedFullMatch("https://ww", L"https://www.hij.com/path", 0, 10); |
| } |
| |
| std::unique_ptr<HistoryURLProviderParams> BuildHistoryURLProviderParams( |
| const std::string& input_text, |
| const std::string& url_text, |
| bool match_in_scheme) { |
| AutocompleteInput input(ASCIIToUTF16(input_text), |
| metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| history::HistoryMatch history_match; |
| history_match.url_info.set_url(GURL(url_text)); |
| history_match.match_in_scheme = match_in_scheme; |
| auto params = std::make_unique<HistoryURLProviderParams>( |
| input, input, true, AutocompleteMatch(), nullptr, nullptr, true, nullptr); |
| params->matches.push_back(history_match); |
| |
| return params; |
| } |
| |
| // Make sure "http://" scheme is generally trimmed. |
| TEST_F(HistoryURLProviderTest, DoTrimHttpScheme) { |
| auto params = |
| BuildHistoryURLProviderParams("face", "http://www.facebook.com", false); |
| |
| AutocompleteMatch match = provider_->HistoryMatchToACMatch(*params, 0, 0); |
| EXPECT_EQ(u"facebook.com", match.contents); |
| } |
| |
| // Make sure "http://" scheme is not trimmed if input has a scheme too. |
| TEST_F(HistoryURLProviderTest, DontTrimHttpSchemeIfInputHasScheme) { |
| auto params = BuildHistoryURLProviderParams("http://face", |
| "http://www.facebook.com", false); |
| |
| AutocompleteMatch match = provider_->HistoryMatchToACMatch(*params, 0, 0); |
| EXPECT_EQ(u"http://facebook.com", match.contents); |
| } |
| |
| // Make sure "http://" scheme is not trimmed if input matches in scheme. |
| TEST_F(HistoryURLProviderTest, DontTrimHttpSchemeIfInputMatchesInScheme) { |
| auto params = |
| BuildHistoryURLProviderParams("ht face", "http://www.facebook.com", true); |
| |
| AutocompleteMatch match = provider_->HistoryMatchToACMatch(*params, 0, 0); |
| EXPECT_EQ(u"http://facebook.com", match.contents); |
| } |
| |
| // Make sure "https://" scheme is not trimmed if the input has a scheme. |
| TEST_F(HistoryURLProviderTest, DontTrimHttpsSchemeIfInputMatchesInScheme) { |
| auto params = BuildHistoryURLProviderParams( |
| "https://face", "https://www.facebook.com", false); |
| |
| AutocompleteMatch match = provider_->HistoryMatchToACMatch(*params, 0, 0); |
| EXPECT_EQ(u"https://facebook.com", match.contents); |
| } |
| |
| // Make sure "https://" scheme is trimmed if nothing prevents it. |
| TEST_F(HistoryURLProviderTest, DoTrimHttpsScheme) { |
| auto params = |
| BuildHistoryURLProviderParams("face", "https://www.facebook.com", false); |
| |
| AutocompleteMatch match = provider_->HistoryMatchToACMatch(*params, 0, 0); |
| EXPECT_EQ(u"facebook.com", match.contents); |
| } |
| |
| // Make sure that user input is trimmed correctly for starter pack keyword mode. |
| // In this mode, suggestions should be provided for only the user input after |
| // the keyword, i.e. "@history google" should only match "google". |
| TEST_F(HistoryURLProviderTest, KeywordModeExtractUserInput) { |
| const auto test = [&](std::u16string input_text, |
| bool input_prefer_keyword_mode = false) { |
| AutocompleteInput input(input_text, metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| if (input_prefer_keyword_mode) { |
| input.set_prefer_keyword(true); |
| input.set_keyword_mode_entry_method( |
| metrics::OmniboxEventProto_KeywordModeEntryMethod_TAB); |
| } |
| |
| provider_->Stop(AutocompleteStopReason::kClobbered); |
| provider_->Start(input, false); |
| if (!provider_->done()) { |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| return provider_->matches(); |
| }; |
| |
| // Populate template URL with starter pack entries |
| std::vector<std::unique_ptr<TemplateURLData>> turls = |
| template_url_starter_pack_data::GetStarterPackEngines(); |
| for (auto& turl : turls) { |
| client_->GetTemplateURLService()->Add( |
| std::make_unique<TemplateURL>(std::move(*turl))); |
| } |
| |
| // Test result for user text "google", we should get back a result for google. |
| matches_ = test(u"google"); |
| ASSERT_GT(matches_.size(), 0u); |
| EXPECT_EQ(matches_[0].destination_url, GURL("http://www.google.com/")); |
| |
| // Test result for "@history", "@history.c", and "@history google" while NOT |
| // in keyword mode, we should not get results for history.com or google since |
| // we're searching for the whole input text including "@". |
| EXPECT_TRUE(test(u"@history").empty()); |
| EXPECT_TRUE(test(u"@history.c").empty()); |
| EXPECT_TRUE(test(u"@history google").empty()); |
| |
| // Test results for "@history.co"; we should see a URL what you type |
| // suggestion because that's a valid URL. |
| matches_ = test(u"@history.co"); |
| ASSERT_GT(matches_.size(), 0u); |
| EXPECT_EQ(matches_[0].destination_url, GURL("http://history.co/")); |
| |
| // Turn on keyword mode, test result again, we should get back the result for |
| // google.com since we're searching only for the user text after the keyword. |
| matches_ = test(u"@history google", true); |
| ASSERT_GT(matches_.size(), 0u); |
| EXPECT_EQ(matches_[0].destination_url, GURL("http://www.google.com/")); |
| EXPECT_TRUE(matches_[0].from_keyword); |
| // Ensure keyword and transition are set properly to keep user in keyword |
| // mode. |
| EXPECT_EQ(matches_[0].keyword, u"@history"); |
| EXPECT_TRUE(PageTransitionCoreTypeIs(matches_[0].transition, |
| ui::PAGE_TRANSITION_KEYWORD)); |
| } |
| |
| TEST_F(HistoryURLProviderTest, MaxMatches) { |
| // Keyword mode is off. We should only get provider_max_matches_ matches. |
| AutocompleteInput input(u"star", metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| provider_->Start(input, false); |
| if (!provider_->done()) { |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| |
| matches_ = provider_->matches(); |
| EXPECT_EQ(matches_.size(), provider_->provider_max_matches()); |
| |
| // Turn keyword mode on. we should be able to get more matches now. |
| input.set_keyword_mode_entry_method( |
| metrics::OmniboxEventProto_KeywordModeEntryMethod_TAB); |
| input.set_prefer_keyword(true); |
| provider_->Start(input, false); |
| if (!provider_->done()) { |
| base::RunLoop loop{base::RunLoop::Type::kNestableTasksAllowed}; |
| quit_closure_ = loop.QuitWhenIdleClosure(); |
| loop.Run(); |
| } |
| |
| matches_ = provider_->matches(); |
| EXPECT_EQ(matches_.size(), provider_->provider_max_matches_in_keyword_mode()); |
| } |
| |
| TEST_F(HistoryURLProviderTest, HistoryMatchToACMatchWithScoringSignals) { |
| const std::string input_text = "abc"; |
| AutocompleteInput input(ASCIIToUTF16(input_text), |
| metrics::OmniboxEventProto::OTHER, |
| TestSchemeClassifier()); |
| history::HistoryMatch history_match; |
| history_match.url_info.set_url(GURL("https://abc.com")); |
| history_match.url_info.set_typed_count(3); |
| history_match.url_info.set_visit_count(5); |
| history_match.match_in_scheme = false; |
| auto params = std::make_unique<HistoryURLProviderParams>( |
| input, input, true, AutocompleteMatch(), nullptr, nullptr, true, nullptr); |
| params->matches.push_back(history_match); |
| |
| AutocompleteMatch match = |
| provider_->HistoryMatchToACMatch(*params, 0, /*relevance=*/1, |
| /*populate_scoring_signals=*/true); |
| EXPECT_EQ(match.scoring_signals->typed_count(), 3); |
| EXPECT_EQ(match.scoring_signals->visit_count(), 5); |
| EXPECT_TRUE(match.scoring_signals->allowed_to_be_default_match()); |
| EXPECT_TRUE(match.scoring_signals->is_host_only()); |
| EXPECT_EQ(match.scoring_signals->length_of_url(), 16); |
| EXPECT_TRUE(match.scoring_signals->has_non_scheme_www_match()); |
| } |