| // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include <algorithm> |
| #include <fstream> |
| |
| #include "base/auto_reset.h" |
| #include "base/files/file_path.h" |
| #include "base/files/file_util.h" |
| #include "base/files/scoped_temp_dir.h" |
| #include "base/i18n/case_conversion.h" |
| #include "base/path_service.h" |
| #include "base/run_loop.h" |
| #include "base/strings/string16.h" |
| #include "base/strings/string_split.h" |
| #include "base/strings/string_util.h" |
| #include "base/strings/stringprintf.h" |
| #include "base/strings/utf_string_conversions.h" |
| #include "chrome/browser/bookmarks/bookmark_model_factory.h" |
| #include "chrome/browser/history/history_service_factory.h" |
| #include "chrome/common/chrome_paths.h" |
| #include "chrome/test/base/history_index_restore_observer.h" |
| #include "chrome/test/base/testing_profile.h" |
| #include "components/bookmarks/test/bookmark_test_helpers.h" |
| #include "components/history/core/browser/history_backend.h" |
| #include "components/history/core/browser/history_database.h" |
| #include "components/history/core/browser/history_service.h" |
| #include "components/omnibox/browser/in_memory_url_index.h" |
| #include "components/omnibox/browser/in_memory_url_index_types.h" |
| #include "components/omnibox/browser/url_index_private_data.h" |
| #include "content/public/browser/browser_thread.h" |
| #include "content/public/test/test_browser_thread_bundle.h" |
| #include "sql/transaction.h" |
| #include "testing/gtest/include/gtest/gtest.h" |
| |
| using base::ASCIIToUTF16; |
| |
| // The test version of the history url database table ('url') is contained in |
| // a database file created from a text file('url_history_provider_test.db.txt'). |
| // The only difference between this table and a live 'urls' table from a |
| // profile is that the last_visit_time column in the test table contains a |
| // number specifying the number of days relative to 'today' to which the |
| // absolute time should be set during the test setup stage. |
| // |
| // The format of the test database text file is of a SQLite .dump file. |
| // Note that only lines whose first character is an upper-case letter are |
| // processed when creating the test database. |
| |
| namespace { |
| const size_t kInvalid = base::string16::npos; |
| const size_t kMaxMatches = 3; |
| const char kTestLanguages[] = "en,ja,hi,zh"; |
| const char kClientWhitelistedScheme[] = "xyz"; |
| |
| // Helper function to set lower case |lower_string| and |lower_terms| (words |
| // list) based on supplied |search_string| and |cursor_position|. If |
| // |cursor_position| is set and useful (not at either end of the string), allow |
| // the |search_string| to be broken at |cursor_position|. We do this by |
| // pretending there's a space where the cursor is. |lower_terms| are obtained by |
| // splitting the |lower_string| on whitespace into tokens. |
| void StringToTerms(const char* search_string, |
| size_t cursor_position, |
| base::string16* lower_string, |
| String16Vector* lower_terms) { |
| *lower_string = base::i18n::ToLower(ASCIIToUTF16(search_string)); |
| if ((cursor_position != kInvalid) && |
| (cursor_position < lower_string->length()) && (cursor_position > 0)) { |
| lower_string->insert(cursor_position, base::ASCIIToUTF16(" ")); |
| } |
| |
| *lower_terms = base::SplitString(*lower_string, base::kWhitespaceUTF16, |
| base::KEEP_WHITESPACE, |
| base::SPLIT_WANT_NONEMPTY); |
| } |
| |
| } // namespace |
| |
| // ----------------------------------------------------------------------------- |
| |
| // Observer class so the unit tests can wait while the cache is being saved. |
| class CacheFileSaverObserver : public InMemoryURLIndex::SaveCacheObserver { |
| public: |
| explicit CacheFileSaverObserver(const base::Closure& task); |
| |
| bool succeeded() { return succeeded_; } |
| |
| private: |
| // SaveCacheObserver implementation. |
| void OnCacheSaveFinished(bool succeeded) override; |
| |
| base::Closure task_; |
| bool succeeded_; |
| |
| DISALLOW_COPY_AND_ASSIGN(CacheFileSaverObserver); |
| }; |
| |
| CacheFileSaverObserver::CacheFileSaverObserver(const base::Closure& task) |
| : task_(task), |
| succeeded_(false) { |
| } |
| |
| void CacheFileSaverObserver::OnCacheSaveFinished(bool succeeded) { |
| succeeded_ = succeeded; |
| task_.Run(); |
| } |
| |
| // ----------------------------------------------------------------------------- |
| |
| class InMemoryURLIndexTest : public testing::Test { |
| public: |
| InMemoryURLIndexTest(); |
| |
| protected: |
| // Test setup. |
| void SetUp() override; |
| void TearDown() override; |
| |
| // Allows the database containing the test data to be customized by |
| // subclasses. |
| virtual base::FilePath::StringType TestDBName() const; |
| |
| // Allows the test to control when the InMemoryURLIndex is initialized. |
| virtual bool InitializeInMemoryURLIndexInSetUp() const; |
| |
| // Initialize the InMemoryURLIndex for the tests. |
| void InitializeInMemoryURLIndex(); |
| |
| // Validates that the given |term| is contained in |cache| and that it is |
| // marked as in-use. |
| void CheckTerm(const URLIndexPrivateData::SearchTermCacheMap& cache, |
| base::string16 term) const; |
| |
| // Pass-through function to simplify our friendship with HistoryService. |
| sql::Connection& GetDB(); |
| |
| // Pass-through functions to simplify our friendship with InMemoryURLIndex. |
| URLIndexPrivateData* GetPrivateData() const; |
| base::CancelableTaskTracker* GetPrivateDataTracker() const; |
| void ClearPrivateData(); |
| void set_history_dir(const base::FilePath& dir_path); |
| bool GetCacheFilePath(base::FilePath* file_path) const; |
| void PostRestoreFromCacheFileTask(); |
| void PostSaveToCacheFileTask(); |
| const SchemeSet& scheme_whitelist(); |
| |
| |
| // Pass-through functions to simplify our friendship with URLIndexPrivateData. |
| bool UpdateURL(const history::URLRow& row); |
| bool DeleteURL(const GURL& url); |
| |
| // Data verification helper functions. |
| void ExpectPrivateDataNotEmpty(const URLIndexPrivateData& data); |
| void ExpectPrivateDataEmpty(const URLIndexPrivateData& data); |
| void ExpectPrivateDataEqual(const URLIndexPrivateData& expected, |
| const URLIndexPrivateData& actual); |
| |
| content::TestBrowserThreadBundle thread_bundle_; |
| scoped_ptr<InMemoryURLIndex> url_index_; |
| TestingProfile profile_; |
| history::HistoryService* history_service_; |
| history::HistoryDatabase* history_database_; |
| }; |
| |
| InMemoryURLIndexTest::InMemoryURLIndexTest() |
| : history_service_(nullptr), history_database_(nullptr) { |
| } |
| |
| sql::Connection& InMemoryURLIndexTest::GetDB() { |
| return history_database_->GetDB(); |
| } |
| |
| URLIndexPrivateData* InMemoryURLIndexTest::GetPrivateData() const { |
| DCHECK(url_index_->private_data()); |
| return url_index_->private_data(); |
| } |
| |
| base::CancelableTaskTracker* InMemoryURLIndexTest::GetPrivateDataTracker() |
| const { |
| DCHECK(url_index_->private_data_tracker()); |
| return url_index_->private_data_tracker(); |
| } |
| |
| void InMemoryURLIndexTest::ClearPrivateData() { |
| return url_index_->ClearPrivateData(); |
| } |
| |
| void InMemoryURLIndexTest::set_history_dir(const base::FilePath& dir_path) { |
| return url_index_->set_history_dir(dir_path); |
| } |
| |
| bool InMemoryURLIndexTest::GetCacheFilePath(base::FilePath* file_path) const { |
| DCHECK(file_path); |
| return url_index_->GetCacheFilePath(file_path); |
| } |
| |
| void InMemoryURLIndexTest::PostRestoreFromCacheFileTask() { |
| url_index_->PostRestoreFromCacheFileTask(); |
| } |
| |
| void InMemoryURLIndexTest::PostSaveToCacheFileTask() { |
| url_index_->PostSaveToCacheFileTask(); |
| } |
| |
| const SchemeSet& InMemoryURLIndexTest::scheme_whitelist() { |
| return url_index_->scheme_whitelist(); |
| } |
| |
| bool InMemoryURLIndexTest::UpdateURL(const history::URLRow& row) { |
| return GetPrivateData()->UpdateURL(history_service_, |
| row, |
| url_index_->languages_, |
| url_index_->scheme_whitelist_, |
| GetPrivateDataTracker()); |
| } |
| |
| bool InMemoryURLIndexTest::DeleteURL(const GURL& url) { |
| return GetPrivateData()->DeleteURL(url); |
| } |
| |
| void InMemoryURLIndexTest::SetUp() { |
| // We cannot access the database until the backend has been loaded. |
| ASSERT_TRUE(profile_.CreateHistoryService(true, false)); |
| profile_.CreateBookmarkModel(true); |
| bookmarks::test::WaitForBookmarkModelToLoad( |
| BookmarkModelFactory::GetForProfile(&profile_)); |
| profile_.BlockUntilHistoryProcessesPendingRequests(); |
| profile_.BlockUntilHistoryIndexIsRefreshed(); |
| history_service_ = HistoryServiceFactory::GetForProfile( |
| &profile_, ServiceAccessType::EXPLICIT_ACCESS); |
| ASSERT_TRUE(history_service_); |
| history::HistoryBackend* backend = history_service_->history_backend_.get(); |
| history_database_ = backend->db(); |
| |
| // Create and populate a working copy of the URL history database. |
| base::FilePath history_proto_path; |
| PathService::Get(chrome::DIR_TEST_DATA, &history_proto_path); |
| history_proto_path = history_proto_path.Append( |
| FILE_PATH_LITERAL("History")); |
| history_proto_path = history_proto_path.Append(TestDBName()); |
| EXPECT_TRUE(base::PathExists(history_proto_path)); |
| |
| std::ifstream proto_file(history_proto_path.value().c_str()); |
| static const size_t kCommandBufferMaxSize = 2048; |
| char sql_cmd_line[kCommandBufferMaxSize]; |
| |
| sql::Connection& db(GetDB()); |
| ASSERT_TRUE(db.is_open()); |
| { |
| sql::Transaction transaction(&db); |
| transaction.Begin(); |
| while (!proto_file.eof()) { |
| proto_file.getline(sql_cmd_line, kCommandBufferMaxSize); |
| if (!proto_file.eof()) { |
| // We only process lines which begin with a upper-case letter. |
| // TODO(mrossetti): Can iswupper() be used here? |
| if (sql_cmd_line[0] >= 'A' && sql_cmd_line[0] <= 'Z') { |
| std::string sql_cmd(sql_cmd_line); |
| sql::Statement sql_stmt(db.GetUniqueStatement(sql_cmd_line)); |
| EXPECT_TRUE(sql_stmt.Run()); |
| } |
| } |
| } |
| transaction.Commit(); |
| } |
| |
| // Update the last_visit_time table column in the "urls" table |
| // such that it represents a time relative to 'now'. |
| sql::Statement statement(db.GetUniqueStatement( |
| "SELECT" HISTORY_URL_ROW_FIELDS "FROM urls;")); |
| ASSERT_TRUE(statement.is_valid()); |
| base::Time time_right_now = base::Time::NowFromSystemTime(); |
| base::TimeDelta day_delta = base::TimeDelta::FromDays(1); |
| { |
| sql::Transaction transaction(&db); |
| transaction.Begin(); |
| while (statement.Step()) { |
| history::URLRow row; |
| history_database_->FillURLRow(statement, &row); |
| base::Time last_visit = time_right_now; |
| for (int64 i = row.last_visit().ToInternalValue(); i > 0; --i) |
| last_visit -= day_delta; |
| row.set_last_visit(last_visit); |
| history_database_->UpdateURLRow(row.id(), row); |
| } |
| transaction.Commit(); |
| } |
| |
| // Update the visit_time table column in the "visits" table |
| // such that it represents a time relative to 'now'. |
| statement.Assign(db.GetUniqueStatement( |
| "SELECT" HISTORY_VISIT_ROW_FIELDS "FROM visits;")); |
| ASSERT_TRUE(statement.is_valid()); |
| { |
| sql::Transaction transaction(&db); |
| transaction.Begin(); |
| while (statement.Step()) { |
| history::VisitRow row; |
| history_database_->FillVisitRow(statement, &row); |
| base::Time last_visit = time_right_now; |
| for (int64 i = row.visit_time.ToInternalValue(); i > 0; --i) |
| last_visit -= day_delta; |
| row.visit_time = last_visit; |
| history_database_->UpdateVisitRow(row); |
| } |
| transaction.Commit(); |
| } |
| |
| if (InitializeInMemoryURLIndexInSetUp()) |
| InitializeInMemoryURLIndex(); |
| } |
| |
| void InMemoryURLIndexTest::TearDown() { |
| // Ensure that the InMemoryURLIndex no longer observes HistoryService before |
| // it is destroyed in order to prevent HistoryService calling dead observer. |
| if (url_index_) |
| url_index_->Shutdown(); |
| } |
| |
| base::FilePath::StringType InMemoryURLIndexTest::TestDBName() const { |
| return FILE_PATH_LITERAL("url_history_provider_test.db.txt"); |
| } |
| |
| bool InMemoryURLIndexTest::InitializeInMemoryURLIndexInSetUp() const { |
| return true; |
| } |
| |
| void InMemoryURLIndexTest::InitializeInMemoryURLIndex() { |
| DCHECK(!url_index_); |
| |
| SchemeSet client_schemes_to_whitelist; |
| client_schemes_to_whitelist.insert(kClientWhitelistedScheme); |
| url_index_.reset(new InMemoryURLIndex( |
| nullptr, history_service_, nullptr, |
| content::BrowserThread::GetBlockingPool(), |
| base::FilePath(), kTestLanguages, client_schemes_to_whitelist)); |
| url_index_->Init(); |
| url_index_->RebuildFromHistory(history_database_); |
| } |
| |
| void InMemoryURLIndexTest::CheckTerm( |
| const URLIndexPrivateData::SearchTermCacheMap& cache, |
| base::string16 term) const { |
| URLIndexPrivateData::SearchTermCacheMap::const_iterator cache_iter( |
| cache.find(term)); |
| ASSERT_TRUE(cache.end() != cache_iter) |
| << "Cache does not contain '" << term << "' but should."; |
| URLIndexPrivateData::SearchTermCacheItem cache_item = cache_iter->second; |
| EXPECT_TRUE(cache_item.used_) |
| << "Cache item '" << term << "' should be marked as being in use."; |
| } |
| |
| void InMemoryURLIndexTest::ExpectPrivateDataNotEmpty( |
| const URLIndexPrivateData& data) { |
| EXPECT_FALSE(data.word_list_.empty()); |
| // available_words_ will be empty since we have freshly built the |
| // data set for these tests. |
| EXPECT_TRUE(data.available_words_.empty()); |
| EXPECT_FALSE(data.word_map_.empty()); |
| EXPECT_FALSE(data.char_word_map_.empty()); |
| EXPECT_FALSE(data.word_id_history_map_.empty()); |
| EXPECT_FALSE(data.history_id_word_map_.empty()); |
| EXPECT_FALSE(data.history_info_map_.empty()); |
| } |
| |
| void InMemoryURLIndexTest::ExpectPrivateDataEmpty( |
| const URLIndexPrivateData& data) { |
| EXPECT_TRUE(data.word_list_.empty()); |
| EXPECT_TRUE(data.available_words_.empty()); |
| EXPECT_TRUE(data.word_map_.empty()); |
| EXPECT_TRUE(data.char_word_map_.empty()); |
| EXPECT_TRUE(data.word_id_history_map_.empty()); |
| EXPECT_TRUE(data.history_id_word_map_.empty()); |
| EXPECT_TRUE(data.history_info_map_.empty()); |
| } |
| |
| // Helper function which compares two maps for equivalence. The maps' values |
| // are associative containers and their contents are compared as well. |
| template<typename T> |
| void ExpectMapOfContainersIdentical(const T& expected, const T& actual) { |
| ASSERT_EQ(expected.size(), actual.size()); |
| for (typename T::const_iterator expected_iter = expected.begin(); |
| expected_iter != expected.end(); ++expected_iter) { |
| typename T::const_iterator actual_iter = actual.find(expected_iter->first); |
| ASSERT_TRUE(actual.end() != actual_iter); |
| typename T::mapped_type const& expected_values(expected_iter->second); |
| typename T::mapped_type const& actual_values(actual_iter->second); |
| ASSERT_EQ(expected_values.size(), actual_values.size()); |
| for (typename T::mapped_type::const_iterator set_iter = |
| expected_values.begin(); set_iter != expected_values.end(); ++set_iter) |
| EXPECT_EQ(actual_values.count(*set_iter), |
| expected_values.count(*set_iter)); |
| } |
| } |
| |
| void InMemoryURLIndexTest::ExpectPrivateDataEqual( |
| const URLIndexPrivateData& expected, |
| const URLIndexPrivateData& actual) { |
| EXPECT_EQ(expected.word_list_.size(), actual.word_list_.size()); |
| EXPECT_EQ(expected.word_map_.size(), actual.word_map_.size()); |
| EXPECT_EQ(expected.char_word_map_.size(), actual.char_word_map_.size()); |
| EXPECT_EQ(expected.word_id_history_map_.size(), |
| actual.word_id_history_map_.size()); |
| EXPECT_EQ(expected.history_id_word_map_.size(), |
| actual.history_id_word_map_.size()); |
| EXPECT_EQ(expected.history_info_map_.size(), actual.history_info_map_.size()); |
| EXPECT_EQ(expected.word_starts_map_.size(), actual.word_starts_map_.size()); |
| // WordList must be index-by-index equal. |
| size_t count = expected.word_list_.size(); |
| for (size_t i = 0; i < count; ++i) |
| EXPECT_EQ(expected.word_list_[i], actual.word_list_[i]); |
| |
| ExpectMapOfContainersIdentical(expected.char_word_map_, |
| actual.char_word_map_); |
| ExpectMapOfContainersIdentical(expected.word_id_history_map_, |
| actual.word_id_history_map_); |
| ExpectMapOfContainersIdentical(expected.history_id_word_map_, |
| actual.history_id_word_map_); |
| |
| for (HistoryInfoMap::const_iterator expected_info = |
| expected.history_info_map_.begin(); |
| expected_info != expected.history_info_map_.end(); ++expected_info) { |
| HistoryInfoMap::const_iterator actual_info = |
| actual.history_info_map_.find(expected_info->first); |
| // NOTE(yfriedman): ASSERT_NE can't be used due to incompatibility between |
| // gtest and STLPort in the Android build. See |
| // http://code.google.com/p/googletest/issues/detail?id=359 |
| ASSERT_TRUE(actual_info != actual.history_info_map_.end()); |
| const history::URLRow& expected_row(expected_info->second.url_row); |
| const history::URLRow& actual_row(actual_info->second.url_row); |
| EXPECT_EQ(expected_row.visit_count(), actual_row.visit_count()); |
| EXPECT_EQ(expected_row.typed_count(), actual_row.typed_count()); |
| EXPECT_EQ(expected_row.last_visit(), actual_row.last_visit()); |
| EXPECT_EQ(expected_row.url(), actual_row.url()); |
| const VisitInfoVector& expected_visits(expected_info->second.visits); |
| const VisitInfoVector& actual_visits(actual_info->second.visits); |
| EXPECT_EQ(expected_visits.size(), actual_visits.size()); |
| for (size_t i = 0; |
| i < std::min(expected_visits.size(), actual_visits.size()); ++i) { |
| EXPECT_EQ(expected_visits[i].first, actual_visits[i].first); |
| EXPECT_EQ(expected_visits[i].second, actual_visits[i].second); |
| } |
| } |
| |
| for (WordStartsMap::const_iterator expected_starts = |
| expected.word_starts_map_.begin(); |
| expected_starts != expected.word_starts_map_.end(); |
| ++expected_starts) { |
| WordStartsMap::const_iterator actual_starts = |
| actual.word_starts_map_.find(expected_starts->first); |
| // NOTE(yfriedman): ASSERT_NE can't be used due to incompatibility between |
| // gtest and STLPort in the Android build. See |
| // http://code.google.com/p/googletest/issues/detail?id=359 |
| ASSERT_TRUE(actual_starts != actual.word_starts_map_.end()); |
| const RowWordStarts& expected_word_starts(expected_starts->second); |
| const RowWordStarts& actual_word_starts(actual_starts->second); |
| EXPECT_EQ(expected_word_starts.url_word_starts_.size(), |
| actual_word_starts.url_word_starts_.size()); |
| EXPECT_TRUE(std::equal(expected_word_starts.url_word_starts_.begin(), |
| expected_word_starts.url_word_starts_.end(), |
| actual_word_starts.url_word_starts_.begin())); |
| EXPECT_EQ(expected_word_starts.title_word_starts_.size(), |
| actual_word_starts.title_word_starts_.size()); |
| EXPECT_TRUE(std::equal(expected_word_starts.title_word_starts_.begin(), |
| expected_word_starts.title_word_starts_.end(), |
| actual_word_starts.title_word_starts_.begin())); |
| } |
| } |
| |
| //------------------------------------------------------------------------------ |
| |
| class LimitedInMemoryURLIndexTest : public InMemoryURLIndexTest { |
| protected: |
| base::FilePath::StringType TestDBName() const override; |
| bool InitializeInMemoryURLIndexInSetUp() const override; |
| }; |
| |
| base::FilePath::StringType LimitedInMemoryURLIndexTest::TestDBName() const { |
| return FILE_PATH_LITERAL("url_history_provider_test_limited.db.txt"); |
| } |
| |
| bool LimitedInMemoryURLIndexTest::InitializeInMemoryURLIndexInSetUp() const { |
| return false; |
| } |
| |
| TEST_F(LimitedInMemoryURLIndexTest, Initialization) { |
| // Verify that the database contains the expected number of items, which |
| // is the pre-filtered count, i.e. all of the items. |
| sql::Statement statement(GetDB().GetUniqueStatement("SELECT * FROM urls;")); |
| ASSERT_TRUE(statement.is_valid()); |
| uint64 row_count = 0; |
| while (statement.Step()) ++row_count; |
| EXPECT_EQ(1U, row_count); |
| |
| InitializeInMemoryURLIndex(); |
| URLIndexPrivateData& private_data(*GetPrivateData()); |
| |
| // history_info_map_ should have the same number of items as were filtered. |
| EXPECT_EQ(1U, private_data.history_info_map_.size()); |
| EXPECT_EQ(35U, private_data.char_word_map_.size()); |
| EXPECT_EQ(17U, private_data.word_map_.size()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, Retrieval) { |
| // See if a very specific term gives a single result. |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| |
| // Verify that we got back the result we expected. |
| EXPECT_EQ(5, matches[0].url_info.id()); |
| EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec()); |
| EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title()); |
| |
| // Make sure a trailing space still results in the expected result. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("DrudgeReport "), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(5, matches[0].url_info.id()); |
| EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec()); |
| EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title()); |
| |
| // Search which should result in multiple results. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("drudge"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(2U, matches.size()); |
| // The results should be in descending score order. |
| EXPECT_GE(matches[0].raw_score, matches[1].raw_score); |
| |
| // Search which should result in nearly perfect result. |
| matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("Nearly Perfect Result"), base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| // The results should have a very high score. |
| EXPECT_GT(matches[0].raw_score, 900); |
| EXPECT_EQ(32, matches[0].url_info.id()); |
| EXPECT_EQ("https://nearlyperfectresult.com/", |
| matches[0].url_info.url().spec()); // Note: URL gets lowercased. |
| EXPECT_EQ(ASCIIToUTF16("Practically Perfect Search Result"), |
| matches[0].url_info.title()); |
| |
| // Search which should result in very poor result. |
| // No results since it will be suppressed by default scoring. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("qui c"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(0U, matches.size()); |
| |
| // Search which will match at the end of an URL with encoded characters. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("Mice"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(30, matches[0].url_info.id()); |
| |
| // Check that URLs are not escaped an escape time. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("1% wikipedia"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(35, matches[0].url_info.id()); |
| EXPECT_EQ("http://en.wikipedia.org/wiki/1%25_rule_(Internet_culture)", |
| matches[0].url_info.url().spec()); |
| |
| // Verify that a single term can appear multiple times in the URL. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("fubar"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(34, matches[0].url_info.id()); |
| EXPECT_EQ("http://fubarfubarandfubar.com/", matches[0].url_info.url().spec()); |
| EXPECT_EQ(ASCIIToUTF16("Situation Normal -- FUBARED"), |
| matches[0].url_info.title()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, CursorPositionRetrieval) { |
| // See if a very specific term with no cursor gives an empty result. |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("DrudReport"), base::string16::npos, kMaxMatches); |
| ASSERT_EQ(0U, matches.size()); |
| |
| // The same test with the cursor at the end should give an empty result. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("DrudReport"), 10u, |
| kMaxMatches); |
| ASSERT_EQ(0U, matches.size()); |
| |
| // If the cursor is between Drud and Report, we should find the desired |
| // result. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("DrudReport"), 4u, |
| kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec()); |
| EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title()); |
| |
| // Now check multi-word inputs. No cursor should fail to find a |
| // result on this input. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("MORTGAGERATE DROPS"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(0U, matches.size()); |
| |
| // Ditto with cursor at end. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("MORTGAGERATE DROPS"), |
| 18u, kMaxMatches); |
| ASSERT_EQ(0U, matches.size()); |
| |
| // If the cursor is between MORTAGE And RATE, we should find the |
| // desired result. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("MORTGAGERATE DROPS"), |
| 8u, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ("http://www.reuters.com/article/idUSN0839880620100708", |
| matches[0].url_info.url().spec()); |
| EXPECT_EQ(ASCIIToUTF16( |
| "UPDATE 1-US 30-yr mortgage rate drops to new record low | Reuters"), |
| matches[0].url_info.title()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, URLPrefixMatching) { |
| // "drudgere" - found |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("drudgere"), base::string16::npos, kMaxMatches); |
| EXPECT_EQ(1U, matches.size()); |
| |
| // "www.atdmt" - not found |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("www.atdmt"), |
| base::string16::npos, kMaxMatches); |
| EXPECT_EQ(0U, matches.size()); |
| |
| // "atdmt" - found |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("atdmt"), |
| base::string16::npos, kMaxMatches); |
| EXPECT_EQ(1U, matches.size()); |
| |
| // "view.atdmt" - found |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("view.atdmt"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| |
| // "view.atdmt" - found |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("view.atdmt"), |
| base::string16::npos, kMaxMatches); |
| EXPECT_EQ(1U, matches.size()); |
| |
| // "cnn.com" - found |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("cnn.com"), |
| base::string16::npos, kMaxMatches); |
| EXPECT_EQ(2U, matches.size()); |
| |
| // "www.cnn.com" - found |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("www.cnn.com"), |
| base::string16::npos, kMaxMatches); |
| EXPECT_EQ(1U, matches.size()); |
| |
| // "ww.cnn.com" - found because we suppress mid-term matches. |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("ww.cnn.com"), |
| base::string16::npos, kMaxMatches); |
| EXPECT_EQ(0U, matches.size()); |
| |
| // "www.cnn.com" - found |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("www.cnn.com"), |
| base::string16::npos, kMaxMatches); |
| EXPECT_EQ(1U, matches.size()); |
| |
| // "tp://www.cnn.com" - not found because we don't allow tp as a mid-term |
| // match |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("tp://www.cnn.com"), |
| base::string16::npos, kMaxMatches); |
| EXPECT_EQ(0U, matches.size()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, ProperStringMatching) { |
| // Search for the following with the expected results: |
| // "atdmt view" - found |
| // "atdmt.view" - not found |
| // "view.atdmt" - found |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("atdmt view"), base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("atdmt.view"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(0U, matches.size()); |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("view.atdmt"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, HugeResultSet) { |
| // Create a huge set of qualifying history items. |
| for (history::URLID row_id = 5000; row_id < 6000; ++row_id) { |
| history::URLRow new_row(GURL("http://www.brokeandaloneinmanitoba.com/"), |
| row_id); |
| new_row.set_last_visit(base::Time::Now()); |
| EXPECT_TRUE(UpdateURL(new_row)); |
| } |
| |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("b"), base::string16::npos, kMaxMatches); |
| URLIndexPrivateData& private_data(*GetPrivateData()); |
| ASSERT_EQ(kMaxMatches, matches.size()); |
| // There are 7 matches already in the database. |
| ASSERT_EQ(1008U, private_data.pre_filter_item_count_); |
| ASSERT_EQ(500U, private_data.post_filter_item_count_); |
| ASSERT_EQ(kMaxMatches, private_data.post_scoring_item_count_); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, TitleSearch) { |
| // Signal if someone has changed the test DB. |
| EXPECT_EQ(29U, GetPrivateData()->history_info_map_.size()); |
| |
| // Ensure title is being searched. |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("MORTGAGE RATE DROPS"), base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| |
| // Verify that we got back the result we expected. |
| EXPECT_EQ(1, matches[0].url_info.id()); |
| EXPECT_EQ("http://www.reuters.com/article/idUSN0839880620100708", |
| matches[0].url_info.url().spec()); |
| EXPECT_EQ(ASCIIToUTF16( |
| "UPDATE 1-US 30-yr mortgage rate drops to new record low | Reuters"), |
| matches[0].url_info.title()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, TitleChange) { |
| // Verify current title terms retrieves desired item. |
| base::string16 original_terms = |
| ASCIIToUTF16("lebronomics could high taxes influence"); |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| original_terms, base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| |
| // Verify that we got back the result we expected. |
| const history::URLID expected_id = 3; |
| EXPECT_EQ(expected_id, matches[0].url_info.id()); |
| EXPECT_EQ("http://www.businessandmedia.org/articles/2010/20100708120415.aspx", |
| matches[0].url_info.url().spec()); |
| EXPECT_EQ(ASCIIToUTF16( |
| "LeBronomics: Could High Taxes Influence James' Team Decision?"), |
| matches[0].url_info.title()); |
| history::URLRow old_row(matches[0].url_info); |
| |
| // Verify new title terms retrieves nothing. |
| base::string16 new_terms = ASCIIToUTF16("does eat oats little lambs ivy"); |
| matches = url_index_->HistoryItemsForTerms(new_terms, base::string16::npos, |
| kMaxMatches); |
| ASSERT_EQ(0U, matches.size()); |
| |
| // Update the row. |
| old_row.set_title(ASCIIToUTF16("Does eat oats and little lambs eat ivy")); |
| EXPECT_TRUE(UpdateURL(old_row)); |
| |
| // Verify we get the row using the new terms but not the original terms. |
| matches = url_index_->HistoryItemsForTerms(new_terms, base::string16::npos, |
| kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(expected_id, matches[0].url_info.id()); |
| matches = url_index_->HistoryItemsForTerms(original_terms, |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(0U, matches.size()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, NonUniqueTermCharacterSets) { |
| // The presence of duplicate characters should succeed. Exercise by cycling |
| // through a string with several duplicate characters. |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("ABRA"), base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(28, matches[0].url_info.id()); |
| EXPECT_EQ("http://www.ddj.com/windows/184416623", |
| matches[0].url_info.url().spec()); |
| |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("ABRACAD"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(28, matches[0].url_info.id()); |
| |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("ABRACADABRA"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(28, matches[0].url_info.id()); |
| |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("ABRACADABR"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(28, matches[0].url_info.id()); |
| |
| matches = url_index_->HistoryItemsForTerms(ASCIIToUTF16("ABRACA"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| EXPECT_EQ(28, matches[0].url_info.id()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, TypedCharacterCaching) { |
| // Verify that match results for previously typed characters are retained |
| // (in the term_char_word_set_cache_) and reused, if possible, in future |
| // autocompletes. |
| |
| URLIndexPrivateData::SearchTermCacheMap& cache( |
| GetPrivateData()->search_term_cache_); |
| |
| // The cache should be empty at this point. |
| EXPECT_EQ(0U, cache.size()); |
| |
| // Now simulate typing search terms into the omnibox and check the state of |
| // the cache as each item is 'typed'. |
| |
| // Simulate typing "r" giving "r" in the simulated omnibox. The results for |
| // 'r' will be not cached because it is only 1 character long. |
| url_index_->HistoryItemsForTerms(ASCIIToUTF16("r"), base::string16::npos, |
| kMaxMatches); |
| EXPECT_EQ(0U, cache.size()); |
| |
| // Simulate typing "re" giving "r re" in the simulated omnibox. |
| // 're' should be cached at this point but not 'r' as it is a single |
| // character. |
| url_index_->HistoryItemsForTerms(ASCIIToUTF16("r re"), base::string16::npos, |
| kMaxMatches); |
| ASSERT_EQ(1U, cache.size()); |
| CheckTerm(cache, ASCIIToUTF16("re")); |
| |
| // Simulate typing "reco" giving "r re reco" in the simulated omnibox. |
| // 're' and 'reco' should be cached at this point but not 'r' as it is a |
| // single character. |
| url_index_->HistoryItemsForTerms(ASCIIToUTF16("r re reco"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(2U, cache.size()); |
| CheckTerm(cache, ASCIIToUTF16("re")); |
| CheckTerm(cache, ASCIIToUTF16("reco")); |
| |
| // Simulate typing "mort". |
| // Since we now have only one search term, the cached results for 're' and |
| // 'reco' should be purged, giving us only 1 item in the cache (for 'mort'). |
| url_index_->HistoryItemsForTerms(ASCIIToUTF16("mort"), base::string16::npos, |
| kMaxMatches); |
| ASSERT_EQ(1U, cache.size()); |
| CheckTerm(cache, ASCIIToUTF16("mort")); |
| |
| // Simulate typing "reco" giving "mort reco" in the simulated omnibox. |
| url_index_->HistoryItemsForTerms(ASCIIToUTF16("mort reco"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(2U, cache.size()); |
| CheckTerm(cache, ASCIIToUTF16("mort")); |
| CheckTerm(cache, ASCIIToUTF16("reco")); |
| |
| // Simulate a <DELETE> by removing the 'reco' and adding back the 'rec'. |
| url_index_->HistoryItemsForTerms(ASCIIToUTF16("mort rec"), |
| base::string16::npos, kMaxMatches); |
| ASSERT_EQ(2U, cache.size()); |
| CheckTerm(cache, ASCIIToUTF16("mort")); |
| CheckTerm(cache, ASCIIToUTF16("rec")); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, AddNewRows) { |
| // Verify that the row we're going to add does not already exist. |
| history::URLID new_row_id = 87654321; |
| // Newly created history::URLRows get a last_visit time of 'right now' so it |
| // should |
| // qualify as a quick result candidate. |
| EXPECT_TRUE(url_index_->HistoryItemsForTerms(ASCIIToUTF16("brokeandalone"), |
| base::string16::npos, |
| kMaxMatches).empty()); |
| |
| // Add a new row. |
| history::URLRow new_row(GURL("http://www.brokeandaloneinmanitoba.com/"), |
| new_row_id++); |
| new_row.set_last_visit(base::Time::Now()); |
| EXPECT_TRUE(UpdateURL(new_row)); |
| |
| // Verify that we can retrieve it. |
| EXPECT_EQ(1U, url_index_->HistoryItemsForTerms(ASCIIToUTF16("brokeandalone"), |
| base::string16::npos, |
| kMaxMatches).size()); |
| |
| // Add it again just to be sure that is harmless and that it does not update |
| // the index. |
| EXPECT_FALSE(UpdateURL(new_row)); |
| EXPECT_EQ(1U, url_index_->HistoryItemsForTerms(ASCIIToUTF16("brokeandalone"), |
| base::string16::npos, |
| kMaxMatches).size()); |
| |
| // Make up an URL that does not qualify and try to add it. |
| history::URLRow unqualified_row( |
| GURL("http://www.brokeandaloneinmanitoba.com/"), new_row_id++); |
| EXPECT_FALSE(UpdateURL(new_row)); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, DeleteRows) { |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| |
| // Delete the URL then search again. |
| EXPECT_TRUE(DeleteURL(matches[0].url_info.url())); |
| EXPECT_TRUE(url_index_->HistoryItemsForTerms(ASCIIToUTF16("DrudgeReport"), |
| base::string16::npos, |
| kMaxMatches).empty()); |
| |
| // Make up an URL that does not exist in the database and delete it. |
| GURL url("http://www.hokeypokey.com/putyourrightfootin.html"); |
| EXPECT_FALSE(DeleteURL(url)); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, ExpireRow) { |
| ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms( |
| ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches); |
| ASSERT_EQ(1U, matches.size()); |
| |
| // Determine the row id for the result, remember that id, broadcast a |
| // delete notification, then ensure that the row has been deleted. |
| history::URLRows deleted_rows; |
| deleted_rows.push_back(matches[0].url_info); |
| url_index_->OnURLsDeleted(nullptr, false, false, deleted_rows, |
| std::set<GURL>()); |
| EXPECT_TRUE(url_index_->HistoryItemsForTerms(ASCIIToUTF16("DrudgeReport"), |
| base::string16::npos, |
| kMaxMatches).empty()); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, WhitelistedURLs) { |
| std::string client_whitelisted_url = |
| base::StringPrintf("%s://foo", kClientWhitelistedScheme); |
| struct TestData { |
| const std::string url_spec; |
| const bool expected_is_whitelisted; |
| } data[] = { |
| // URLs with whitelisted schemes. |
| { "about:histograms", true }, |
| { "file://localhost/Users/joeschmoe/sekrets", true }, |
| { "ftp://public.mycompany.com/myfile.txt", true }, |
| { "http://www.google.com/translate", true }, |
| { "https://www.gmail.com/", true }, |
| { "mailto:support@google.com", true }, |
| { client_whitelisted_url, true }, |
| // URLs with unacceptable schemes. |
| { "aaa://www.dummyhost.com;frammy", false }, |
| { "aaas://www.dummyhost.com;frammy", false }, |
| { "acap://suzie@somebody.com", false }, |
| { "cap://cal.example.com/Company/Holidays", false }, |
| { "cid:foo4*foo1@bar.net", false }, |
| { "crid://example.com/foobar", false }, |
| { "data:image/png;base64,iVBORw0KGgoAAAANSUhE=", false }, |
| { "dict://dict.org/d:shortcake:", false }, |
| { "dns://192.168.1.1/ftp.example.org?type=A", false }, |
| { "fax:+358.555.1234567", false }, |
| { "geo:13.4125,103.8667", false }, |
| { "go:Mercedes%20Benz", false }, |
| { "gopher://farnsworth.ca:666/gopher", false }, |
| { "h323:farmer-john;sixpence", false }, |
| { "iax:johnQ@example.com/12022561414", false }, |
| { "icap://icap.net/service?mode=translate&lang=french", false }, |
| { "im:fred@example.com", false }, |
| { "imap://michael@minbari.org/users.*", false }, |
| { "info:ddc/22/eng//004.678", false }, |
| { "ipp://example.com/printer/fox", false }, |
| { "iris:dreg1//example.com/local/myhosts", false }, |
| { "iris.beep:dreg1//example.com/local/myhosts", false }, |
| { "iris.lws:dreg1//example.com/local/myhosts", false }, |
| { "iris.xpc:dreg1//example.com/local/myhosts", false }, |
| { "iris.xpcs:dreg1//example.com/local/myhosts", false }, |
| { "ldap://ldap.itd.umich.edu/o=University%20of%20Michigan,c=US", false }, |
| { "mid:foo4%25foo1@bar.net", false }, |
| { "modem:+3585551234567;type=v32b?7e1;type=v110", false }, |
| { "msrp://atlanta.example.com:7654/jshA7weztas;tcp", false }, |
| { "msrps://atlanta.example.com:7654/jshA7weztas;tcp", false }, |
| { "news:colorectal.info.banned", false }, |
| { "nfs://server/d/e/f", false }, |
| { "nntp://www.example.com:6543/info.comp.lies/1234", false }, |
| { "pop://rg;AUTH=+APOP@mail.mycompany.com:8110", false }, |
| { "pres:fred@example.com", false }, |
| { "prospero://host.dom//pros/name", false }, |
| { "rsync://syler@lost.com/Source", false }, |
| { "rtsp://media.example.com:554/twister/audiotrack", false }, |
| { "service:acap://some.where.net;authentication=KERBEROSV4", false }, |
| { "shttp://www.terces.com/secret", false }, |
| { "sieve://example.com//script", false }, |
| { "sip:+1-212-555-1212:1234@gateway.com;user=phone", false }, |
| { "sips:+1-212-555-1212:1234@gateway.com;user=phone", false }, |
| { "sms:+15105551212?body=hello%20there", false }, |
| { "snmp://tester5@example.com:8161/bridge1;800002b804616263", false }, |
| { "soap.beep://stockquoteserver.example.com/StockQuote", false }, |
| { "soap.beeps://stockquoteserver.example.com/StockQuote", false }, |
| { "tag:blogger.com,1999:blog-555", false }, |
| { "tel:+358-555-1234567;postd=pp22", false }, |
| { "telnet://mayor_margie:one2rule4All@www.mycity.com:6789/", false }, |
| { "tftp://example.com/mystartupfile", false }, |
| { "tip://123.123.123.123/?urn:xopen:xid", false }, |
| { "tv:nbc.com", false }, |
| { "urn:foo:A123,456", false }, |
| { "vemmi://zeus.mctel.fr/demo", false }, |
| { "wais://www.mydomain.net:8765/mydatabase", false }, |
| { "xmpp:node@example.com", false }, |
| { "xmpp://guest@example.com", false }, |
| }; |
| |
| const SchemeSet& whitelist(scheme_whitelist()); |
| for (size_t i = 0; i < arraysize(data); ++i) { |
| GURL url(data[i].url_spec); |
| EXPECT_EQ(data[i].expected_is_whitelisted, |
| URLIndexPrivateData::URLSchemeIsWhitelisted(url, whitelist)); |
| } |
| } |
| |
| TEST_F(InMemoryURLIndexTest, ReadVisitsFromHistory) { |
| const HistoryInfoMap& history_info_map = GetPrivateData()->history_info_map_; |
| |
| // Check (for URL with id 1) that the number of visits and their |
| // transition types are what we expect. We don't bother checking |
| // the timestamps because it's too much trouble. (The timestamps go |
| // through a transformation in InMemoryURLIndexTest::SetUp(). We |
| // assume that if the count and transitions show up with the right |
| // information, we're getting the right information from the history |
| // database file.) |
| HistoryInfoMap::const_iterator entry = history_info_map.find(1); |
| ASSERT_TRUE(entry != history_info_map.end()); |
| { |
| const VisitInfoVector& visits = entry->second.visits; |
| ASSERT_EQ(3u, visits.size()); |
| EXPECT_EQ(static_cast<ui::PageTransition>(0u), visits[0].second); |
| EXPECT_EQ(static_cast<ui::PageTransition>(1u), visits[1].second); |
| EXPECT_EQ(static_cast<ui::PageTransition>(0u), visits[2].second); |
| } |
| |
| // Ditto but for URL with id 35. |
| entry = history_info_map.find(35); |
| ASSERT_TRUE(entry != history_info_map.end()); |
| { |
| const VisitInfoVector& visits = entry->second.visits; |
| ASSERT_EQ(2u, visits.size()); |
| EXPECT_EQ(static_cast<ui::PageTransition>(1u), visits[0].second); |
| EXPECT_EQ(static_cast<ui::PageTransition>(1u), visits[1].second); |
| } |
| |
| // The URL with id 32 has many visits listed in the database, but we |
| // should only read the most recent 10 (which are all transition type 0). |
| entry = history_info_map.find(32); |
| ASSERT_TRUE(entry != history_info_map.end()); |
| { |
| const VisitInfoVector& visits = entry->second.visits; |
| EXPECT_EQ(10u, visits.size()); |
| for (size_t i = 0; i < visits.size(); ++i) |
| EXPECT_EQ(static_cast<ui::PageTransition>(0u), visits[i].second); |
| } |
| } |
| |
| TEST_F(InMemoryURLIndexTest, CacheSaveRestore) { |
| base::ScopedTempDir temp_directory; |
| ASSERT_TRUE(temp_directory.CreateUniqueTempDir()); |
| set_history_dir(temp_directory.path()); |
| |
| URLIndexPrivateData& private_data(*GetPrivateData()); |
| |
| // Ensure that there is really something there to be saved. |
| EXPECT_FALSE(private_data.word_list_.empty()); |
| // available_words_ will already be empty since we have freshly built the |
| // data set for this test. |
| EXPECT_TRUE(private_data.available_words_.empty()); |
| EXPECT_FALSE(private_data.word_map_.empty()); |
| EXPECT_FALSE(private_data.char_word_map_.empty()); |
| EXPECT_FALSE(private_data.word_id_history_map_.empty()); |
| EXPECT_FALSE(private_data.history_id_word_map_.empty()); |
| EXPECT_FALSE(private_data.history_info_map_.empty()); |
| EXPECT_FALSE(private_data.word_starts_map_.empty()); |
| |
| // Make sure the data we have was built from history. (Version 0 |
| // means rebuilt from history.) |
| EXPECT_EQ(0, private_data.restored_cache_version_); |
| |
| // Capture the current private data for later comparison to restored data. |
| scoped_refptr<URLIndexPrivateData> old_data(private_data.Duplicate()); |
| const base::Time rebuild_time = private_data.last_time_rebuilt_from_history_; |
| |
| { |
| // Save then restore our private data. |
| base::RunLoop run_loop; |
| CacheFileSaverObserver save_observer(run_loop.QuitClosure()); |
| url_index_->set_save_cache_observer(&save_observer); |
| PostSaveToCacheFileTask(); |
| run_loop.Run(); |
| EXPECT_TRUE(save_observer.succeeded()); |
| } |
| |
| // Clear and then prove it's clear before restoring. |
| ClearPrivateData(); |
| EXPECT_TRUE(private_data.word_list_.empty()); |
| EXPECT_TRUE(private_data.available_words_.empty()); |
| EXPECT_TRUE(private_data.word_map_.empty()); |
| EXPECT_TRUE(private_data.char_word_map_.empty()); |
| EXPECT_TRUE(private_data.word_id_history_map_.empty()); |
| EXPECT_TRUE(private_data.history_id_word_map_.empty()); |
| EXPECT_TRUE(private_data.history_info_map_.empty()); |
| EXPECT_TRUE(private_data.word_starts_map_.empty()); |
| |
| { |
| base::RunLoop run_loop; |
| HistoryIndexRestoreObserver restore_observer(run_loop.QuitClosure()); |
| url_index_->set_restore_cache_observer(&restore_observer); |
| PostRestoreFromCacheFileTask(); |
| run_loop.Run(); |
| EXPECT_TRUE(restore_observer.succeeded()); |
| } |
| |
| URLIndexPrivateData& new_data(*GetPrivateData()); |
| |
| // Make sure the data we have was reloaded from cache. (Version 0 |
| // means rebuilt from history; anything else means restored from |
| // a cache version.) Also, the rebuild time should not have changed. |
| EXPECT_GT(new_data.restored_cache_version_, 0); |
| EXPECT_EQ(rebuild_time, new_data.last_time_rebuilt_from_history_); |
| |
| // Compare the captured and restored for equality. |
| ExpectPrivateDataEqual(*old_data.get(), new_data); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, RebuildFromHistoryIfCacheOld) { |
| base::ScopedTempDir temp_directory; |
| ASSERT_TRUE(temp_directory.CreateUniqueTempDir()); |
| set_history_dir(temp_directory.path()); |
| |
| URLIndexPrivateData& private_data(*GetPrivateData()); |
| |
| // Ensure that there is really something there to be saved. |
| EXPECT_FALSE(private_data.word_list_.empty()); |
| // available_words_ will already be empty since we have freshly built the |
| // data set for this test. |
| EXPECT_TRUE(private_data.available_words_.empty()); |
| EXPECT_FALSE(private_data.word_map_.empty()); |
| EXPECT_FALSE(private_data.char_word_map_.empty()); |
| EXPECT_FALSE(private_data.word_id_history_map_.empty()); |
| EXPECT_FALSE(private_data.history_id_word_map_.empty()); |
| EXPECT_FALSE(private_data.history_info_map_.empty()); |
| EXPECT_FALSE(private_data.word_starts_map_.empty()); |
| |
| // Make sure the data we have was built from history. (Version 0 |
| // means rebuilt from history.) |
| EXPECT_EQ(0, private_data.restored_cache_version_); |
| |
| // Overwrite the build time so that we'll think the data is too old |
| // and rebuild the cache from history. |
| const base::Time fake_rebuild_time = |
| private_data.last_time_rebuilt_from_history_ - |
| base::TimeDelta::FromDays(30); |
| private_data.last_time_rebuilt_from_history_ = fake_rebuild_time; |
| |
| // Capture the current private data for later comparison to restored data. |
| scoped_refptr<URLIndexPrivateData> old_data(private_data.Duplicate()); |
| |
| { |
| // Save then restore our private data. |
| base::RunLoop run_loop; |
| CacheFileSaverObserver save_observer(run_loop.QuitClosure()); |
| url_index_->set_save_cache_observer(&save_observer); |
| PostSaveToCacheFileTask(); |
| run_loop.Run(); |
| EXPECT_TRUE(save_observer.succeeded()); |
| } |
| |
| // Clear and then prove it's clear before restoring. |
| ClearPrivateData(); |
| EXPECT_TRUE(private_data.word_list_.empty()); |
| EXPECT_TRUE(private_data.available_words_.empty()); |
| EXPECT_TRUE(private_data.word_map_.empty()); |
| EXPECT_TRUE(private_data.char_word_map_.empty()); |
| EXPECT_TRUE(private_data.word_id_history_map_.empty()); |
| EXPECT_TRUE(private_data.history_id_word_map_.empty()); |
| EXPECT_TRUE(private_data.history_info_map_.empty()); |
| EXPECT_TRUE(private_data.word_starts_map_.empty()); |
| |
| { |
| base::RunLoop run_loop; |
| HistoryIndexRestoreObserver restore_observer(run_loop.QuitClosure()); |
| url_index_->set_restore_cache_observer(&restore_observer); |
| PostRestoreFromCacheFileTask(); |
| run_loop.Run(); |
| EXPECT_TRUE(restore_observer.succeeded()); |
| } |
| |
| URLIndexPrivateData& new_data(*GetPrivateData()); |
| |
| // Make sure the data we have was rebuilt from history. (Version 0 |
| // means rebuilt from history; anything else means restored from |
| // a cache version.) |
| EXPECT_EQ(0, new_data.restored_cache_version_); |
| EXPECT_NE(fake_rebuild_time, new_data.last_time_rebuilt_from_history_); |
| |
| // Compare the captured and restored for equality. |
| ExpectPrivateDataEqual(*old_data.get(), new_data); |
| } |
| |
| TEST_F(InMemoryURLIndexTest, AddHistoryMatch) { |
| const struct { |
| const char* search_string; |
| size_t cursor_position; |
| const size_t expected_word_starts_offsets_size; |
| const size_t expected_word_starts_offsets[3]; |
| } test_cases[] = { |
| /* No punctuations, only cursor position change. */ |
| { "ABCD", kInvalid, 1, {0, kInvalid, kInvalid} }, |
| { "abcd", 0, 1, {0, kInvalid, kInvalid} }, |
| { "AbcD", 1, 2, {0, 0, kInvalid} }, |
| { "abcd", 4, 1, {0, kInvalid, kInvalid} }, |
| |
| /* Starting with punctuation. */ |
| { ".abcd", kInvalid, 1, {1, kInvalid, kInvalid} }, |
| { ".abcd", 0, 1, {1, kInvalid, kInvalid} }, |
| { "!abcd", 1, 2, {1, 0, kInvalid} }, |
| { "::abcd", 1, 2, {1, 1, kInvalid} }, |
| { ":abcd", 5, 1, {1, kInvalid, kInvalid} }, |
| |
| /* Ending with punctuation. */ |
| { "abcd://", kInvalid, 1, {0, kInvalid, kInvalid} }, |
| { "ABCD://", 0, 1, {0, kInvalid, kInvalid} }, |
| { "abcd://", 1, 2, {0, 0, kInvalid} }, |
| { "abcd://", 4, 2, {0, 3, kInvalid} }, |
| { "abcd://", 7, 1, {0, kInvalid, kInvalid} }, |
| |
| /* Punctuation in the middle. */ |
| { "ab.cd", kInvalid, 1, {0, kInvalid, kInvalid} }, |
| { "ab.cd", 0, 1, {0, kInvalid, kInvalid} }, |
| { "ab!cd", 1, 2, {0, 0, kInvalid} }, |
| { "AB.cd", 2, 2, {0, 1, kInvalid} }, |
| { "AB.cd", 3, 2, {0, 0, kInvalid} }, |
| { "ab:cd", 5, 1, {0, kInvalid, kInvalid} }, |
| |
| /* Hyphenation */ |
| { "Ab-cd", kInvalid, 1, {0, kInvalid, kInvalid} }, |
| { "ab-cd", 0, 1, {0, kInvalid, kInvalid} }, |
| { "-abcd", 0, 1, {1, kInvalid, kInvalid} }, |
| { "-abcd", 1, 2, {1, 0, kInvalid} }, |
| { "abcd-", 2, 2, {0, 0, kInvalid} }, |
| { "abcd-", 4, 2, {0, 1, kInvalid} }, |
| { "ab-cd", 5, 1, {0, kInvalid, kInvalid} }, |
| |
| /* Whitespace */ |
| { "Ab cd", kInvalid, 2, {0, 0, kInvalid} }, |
| { "ab cd", 0, 2, {0, 0, kInvalid} }, |
| { " abcd", 0, 1, {0, kInvalid, kInvalid} }, |
| { " abcd", 1, 1, {0, kInvalid, kInvalid} }, |
| { "abcd ", 2, 2, {0, 0, kInvalid} }, |
| { "abcd :", 4, 2, {0, 1, kInvalid} }, |
| { "abcd :", 5, 2, {0, 1, kInvalid} }, |
| { "abcd :", 2, 3, {0, 0, 1} } |
| }; |
| |
| for (size_t i = 0; i < arraysize(test_cases); ++i) { |
| SCOPED_TRACE(testing::Message() |
| << "search_string = " << test_cases[i].search_string |
| << ", cursor_position = " << test_cases[i].cursor_position); |
| |
| base::string16 lower_string; |
| String16Vector lower_terms; |
| StringToTerms(test_cases[i].search_string, test_cases[i].cursor_position, |
| &lower_string, &lower_terms); |
| URLIndexPrivateData::AddHistoryMatch match(nullptr, nullptr, |
| *GetPrivateData(), |
| kTestLanguages, lower_string, |
| lower_terms, base::Time::Now()); |
| |
| // Verify against expectations. |
| EXPECT_EQ(test_cases[i].expected_word_starts_offsets_size, |
| match.lower_terms_to_word_starts_offsets_.size()); |
| for (size_t j = 0; j < test_cases[i].expected_word_starts_offsets_size; |
| ++j) { |
| EXPECT_EQ(test_cases[i].expected_word_starts_offsets[j], |
| match.lower_terms_to_word_starts_offsets_[j]); |
| } |
| } |
| } |
| |
| class InMemoryURLIndexCacheTest : public testing::Test { |
| public: |
| InMemoryURLIndexCacheTest() {} |
| |
| protected: |
| void SetUp() override; |
| void TearDown() override; |
| |
| // Pass-through functions to simplify our friendship with InMemoryURLIndex. |
| void set_history_dir(const base::FilePath& dir_path); |
| bool GetCacheFilePath(base::FilePath* file_path) const; |
| |
| content::TestBrowserThreadBundle thread_bundle_; |
| base::ScopedTempDir temp_dir_; |
| scoped_ptr<InMemoryURLIndex> url_index_; |
| }; |
| |
| void InMemoryURLIndexCacheTest::SetUp() { |
| ASSERT_TRUE(temp_dir_.CreateUniqueTempDir()); |
| base::FilePath path(temp_dir_.path()); |
| url_index_.reset(new InMemoryURLIndex( |
| nullptr, nullptr, nullptr, content::BrowserThread::GetBlockingPool(), |
| path, kTestLanguages, SchemeSet())); |
| } |
| |
| void InMemoryURLIndexCacheTest::TearDown() { |
| if (url_index_) |
| url_index_->Shutdown(); |
| } |
| |
| void InMemoryURLIndexCacheTest::set_history_dir( |
| const base::FilePath& dir_path) { |
| return url_index_->set_history_dir(dir_path); |
| } |
| |
| bool InMemoryURLIndexCacheTest::GetCacheFilePath( |
| base::FilePath* file_path) const { |
| DCHECK(file_path); |
| return url_index_->GetCacheFilePath(file_path); |
| } |
| |
| TEST_F(InMemoryURLIndexCacheTest, CacheFilePath) { |
| base::FilePath expectedPath = |
| temp_dir_.path().Append(FILE_PATH_LITERAL("History Provider Cache")); |
| std::vector<base::FilePath::StringType> expected_parts; |
| expectedPath.GetComponents(&expected_parts); |
| base::FilePath full_file_path; |
| ASSERT_TRUE(GetCacheFilePath(&full_file_path)); |
| std::vector<base::FilePath::StringType> actual_parts; |
| full_file_path.GetComponents(&actual_parts); |
| ASSERT_EQ(expected_parts.size(), actual_parts.size()); |
| size_t count = expected_parts.size(); |
| for (size_t i = 0; i < count; ++i) |
| EXPECT_EQ(expected_parts[i], actual_parts[i]); |
| // Must clear the history_dir_ to satisfy the dtor's DCHECK. |
| set_history_dir(base::FilePath()); |
| } |