Home | History | Annotate | Download | only in history
      1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style license that can be
      3 // found in the LICENSE file.
      4 
      5 #include <algorithm>
      6 #include <fstream>
      7 
      8 #include "base/auto_reset.h"
      9 #include "base/file_util.h"
     10 #include "base/files/file_path.h"
     11 #include "base/files/scoped_temp_dir.h"
     12 #include "base/message_loop/message_loop.h"
     13 #include "base/path_service.h"
     14 #include "base/strings/string16.h"
     15 #include "base/strings/string_util.h"
     16 #include "base/strings/utf_string_conversions.h"
     17 #include "chrome/browser/bookmarks/bookmark_model_factory.h"
     18 #include "chrome/browser/chrome_notification_types.h"
     19 #include "chrome/browser/history/history_backend.h"
     20 #include "chrome/browser/history/history_database.h"
     21 #include "chrome/browser/history/history_notifications.h"
     22 #include "chrome/browser/history/history_service.h"
     23 #include "chrome/browser/history/history_service_factory.h"
     24 #include "chrome/browser/history/in_memory_url_index.h"
     25 #include "chrome/browser/history/in_memory_url_index_types.h"
     26 #include "chrome/browser/history/url_index_private_data.h"
     27 #include "chrome/common/chrome_paths.h"
     28 #include "chrome/test/base/history_index_restore_observer.h"
     29 #include "chrome/test/base/testing_profile.h"
     30 #include "components/bookmarks/test/bookmark_test_helpers.h"
     31 #include "components/history/core/browser/history_client.h"
     32 #include "content/public/browser/notification_details.h"
     33 #include "content/public/browser/notification_source.h"
     34 #include "content/public/test/test_browser_thread.h"
     35 #include "sql/transaction.h"
     36 #include "testing/gtest/include/gtest/gtest.h"
     37 
     38 using base::ASCIIToUTF16;
     39 using content::BrowserThread;
     40 
     41 namespace {
     42 const size_t kMaxMatches = 3;
     43 }  // namespace
     44 
     45 // The test version of the history url database table ('url') is contained in
     46 // a database file created from a text file('url_history_provider_test.db.txt').
     47 // The only difference between this table and a live 'urls' table from a
     48 // profile is that the last_visit_time column in the test table contains a
     49 // number specifying the number of days relative to 'today' to which the
     50 // absolute time should be set during the test setup stage.
     51 //
     52 // The format of the test database text file is of a SQLite .dump file.
     53 // Note that only lines whose first character is an upper-case letter are
     54 // processed when creating the test database.
     55 
     56 namespace history {
     57 
     58 // -----------------------------------------------------------------------------
     59 
     60 // Observer class so the unit tests can wait while the cache is being saved.
     61 class CacheFileSaverObserver : public InMemoryURLIndex::SaveCacheObserver {
     62  public:
     63   explicit CacheFileSaverObserver(base::MessageLoop* loop);
     64   virtual void OnCacheSaveFinished(bool succeeded) OVERRIDE;
     65 
     66   base::MessageLoop* loop_;
     67   bool succeeded_;
     68   DISALLOW_COPY_AND_ASSIGN(CacheFileSaverObserver);
     69 };
     70 
     71 CacheFileSaverObserver::CacheFileSaverObserver(base::MessageLoop* loop)
     72     : loop_(loop),
     73       succeeded_(false) {
     74   DCHECK(loop);
     75 }
     76 
     77 void CacheFileSaverObserver::OnCacheSaveFinished(bool succeeded) {
     78   succeeded_ = succeeded;
     79   loop_->Quit();
     80 }
     81 
     82 // -----------------------------------------------------------------------------
     83 
     84 class InMemoryURLIndexTest : public testing::Test {
     85  public:
     86   InMemoryURLIndexTest();
     87 
     88  protected:
     89   // Test setup.
     90   virtual void SetUp();
     91 
     92   // Allows the database containing the test data to be customized by
     93   // subclasses.
     94   virtual base::FilePath::StringType TestDBName() const;
     95 
     96   // Validates that the given |term| is contained in |cache| and that it is
     97   // marked as in-use.
     98   void CheckTerm(const URLIndexPrivateData::SearchTermCacheMap& cache,
     99                  base::string16 term) const;
    100 
    101   // Pass-through function to simplify our friendship with HistoryService.
    102   sql::Connection& GetDB();
    103 
    104   // Pass-through functions to simplify our friendship with InMemoryURLIndex.
    105   URLIndexPrivateData* GetPrivateData() const;
    106   void ClearPrivateData();
    107   void set_history_dir(const base::FilePath& dir_path);
    108   bool GetCacheFilePath(base::FilePath* file_path) const;
    109   void PostRestoreFromCacheFileTask();
    110   void PostSaveToCacheFileTask();
    111   void Observe(int notification_type,
    112                const content::NotificationSource& source,
    113                const content::NotificationDetails& details);
    114   const std::set<std::string>& scheme_whitelist();
    115 
    116 
    117   // Pass-through functions to simplify our friendship with URLIndexPrivateData.
    118   bool UpdateURL(const URLRow& row);
    119   bool DeleteURL(const GURL& url);
    120 
    121   // Data verification helper functions.
    122   void ExpectPrivateDataNotEmpty(const URLIndexPrivateData& data);
    123   void ExpectPrivateDataEmpty(const URLIndexPrivateData& data);
    124   void ExpectPrivateDataEqual(const URLIndexPrivateData& expected,
    125                               const URLIndexPrivateData& actual);
    126 
    127   base::MessageLoopForUI message_loop_;
    128   content::TestBrowserThread ui_thread_;
    129   content::TestBrowserThread file_thread_;
    130   TestingProfile profile_;
    131   HistoryService* history_service_;
    132 
    133   scoped_ptr<InMemoryURLIndex> url_index_;
    134   HistoryDatabase* history_database_;
    135 };
    136 
    137 InMemoryURLIndexTest::InMemoryURLIndexTest()
    138     : ui_thread_(content::BrowserThread::UI, &message_loop_),
    139       file_thread_(content::BrowserThread::FILE, &message_loop_) {
    140 }
    141 
    142 sql::Connection& InMemoryURLIndexTest::GetDB() {
    143   return history_database_->GetDB();
    144 }
    145 
    146 URLIndexPrivateData* InMemoryURLIndexTest::GetPrivateData() const {
    147   DCHECK(url_index_->private_data());
    148   return url_index_->private_data();
    149 }
    150 
    151 void InMemoryURLIndexTest::ClearPrivateData() {
    152   return url_index_->ClearPrivateData();
    153 }
    154 
    155 void InMemoryURLIndexTest::set_history_dir(const base::FilePath& dir_path) {
    156   return url_index_->set_history_dir(dir_path);
    157 }
    158 
    159 bool InMemoryURLIndexTest::GetCacheFilePath(base::FilePath* file_path) const {
    160   DCHECK(file_path);
    161   return url_index_->GetCacheFilePath(file_path);
    162 }
    163 
    164 void InMemoryURLIndexTest::PostRestoreFromCacheFileTask() {
    165   url_index_->PostRestoreFromCacheFileTask();
    166 }
    167 
    168 void InMemoryURLIndexTest::PostSaveToCacheFileTask() {
    169   url_index_->PostSaveToCacheFileTask();
    170 }
    171 
    172 void InMemoryURLIndexTest::Observe(
    173     int notification_type,
    174     const content::NotificationSource& source,
    175     const content::NotificationDetails& details) {
    176   url_index_->Observe(notification_type, source, details);
    177 }
    178 
    179 const std::set<std::string>& InMemoryURLIndexTest::scheme_whitelist() {
    180   return url_index_->scheme_whitelist();
    181 }
    182 
    183 bool InMemoryURLIndexTest::UpdateURL(const URLRow& row) {
    184   return GetPrivateData()->UpdateURL(
    185       history_service_, row, url_index_->languages_,
    186       url_index_->scheme_whitelist_);
    187 }
    188 
    189 bool InMemoryURLIndexTest::DeleteURL(const GURL& url) {
    190   return GetPrivateData()->DeleteURL(url);
    191 }
    192 
    193 void InMemoryURLIndexTest::SetUp() {
    194   // We cannot access the database until the backend has been loaded.
    195   ASSERT_TRUE(profile_.CreateHistoryService(true, false));
    196   profile_.CreateBookmarkModel(true);
    197   test::WaitForBookmarkModelToLoad(
    198       BookmarkModelFactory::GetForProfile(&profile_));
    199   profile_.BlockUntilHistoryProcessesPendingRequests();
    200   profile_.BlockUntilHistoryIndexIsRefreshed();
    201   history_service_ = HistoryServiceFactory::GetForProfile(
    202       &profile_, Profile::EXPLICIT_ACCESS);
    203   ASSERT_TRUE(history_service_);
    204   HistoryBackend* backend = history_service_->history_backend_.get();
    205   history_database_ = backend->db();
    206 
    207   // Create and populate a working copy of the URL history database.
    208   base::FilePath history_proto_path;
    209   PathService::Get(chrome::DIR_TEST_DATA, &history_proto_path);
    210   history_proto_path = history_proto_path.Append(
    211       FILE_PATH_LITERAL("History"));
    212   history_proto_path = history_proto_path.Append(TestDBName());
    213   EXPECT_TRUE(base::PathExists(history_proto_path));
    214 
    215   std::ifstream proto_file(history_proto_path.value().c_str());
    216   static const size_t kCommandBufferMaxSize = 2048;
    217   char sql_cmd_line[kCommandBufferMaxSize];
    218 
    219   sql::Connection& db(GetDB());
    220   ASSERT_TRUE(db.is_open());
    221   {
    222     sql::Transaction transaction(&db);
    223     transaction.Begin();
    224     while (!proto_file.eof()) {
    225       proto_file.getline(sql_cmd_line, kCommandBufferMaxSize);
    226       if (!proto_file.eof()) {
    227         // We only process lines which begin with a upper-case letter.
    228         // TODO(mrossetti): Can iswupper() be used here?
    229         if (sql_cmd_line[0] >= 'A' && sql_cmd_line[0] <= 'Z') {
    230           std::string sql_cmd(sql_cmd_line);
    231           sql::Statement sql_stmt(db.GetUniqueStatement(sql_cmd_line));
    232           EXPECT_TRUE(sql_stmt.Run());
    233         }
    234       }
    235     }
    236     transaction.Commit();
    237   }
    238 
    239   // Update the last_visit_time table column in the "urls" table
    240   // such that it represents a time relative to 'now'.
    241   sql::Statement statement(db.GetUniqueStatement(
    242       "SELECT" HISTORY_URL_ROW_FIELDS "FROM urls;"));
    243   ASSERT_TRUE(statement.is_valid());
    244   base::Time time_right_now = base::Time::NowFromSystemTime();
    245   base::TimeDelta day_delta = base::TimeDelta::FromDays(1);
    246   {
    247     sql::Transaction transaction(&db);
    248     transaction.Begin();
    249     while (statement.Step()) {
    250       URLRow row;
    251       history_database_->FillURLRow(statement, &row);
    252       base::Time last_visit = time_right_now;
    253       for (int64 i = row.last_visit().ToInternalValue(); i > 0; --i)
    254         last_visit -= day_delta;
    255       row.set_last_visit(last_visit);
    256       history_database_->UpdateURLRow(row.id(), row);
    257     }
    258     transaction.Commit();
    259   }
    260 
    261   // Update the visit_time table column in the "visits" table
    262   // such that it represents a time relative to 'now'.
    263   statement.Assign(db.GetUniqueStatement(
    264       "SELECT" HISTORY_VISIT_ROW_FIELDS "FROM visits;"));
    265   ASSERT_TRUE(statement.is_valid());
    266   {
    267     sql::Transaction transaction(&db);
    268     transaction.Begin();
    269     while (statement.Step()) {
    270       VisitRow row;
    271       history_database_->FillVisitRow(statement, &row);
    272       base::Time last_visit = time_right_now;
    273       for (int64 i = row.visit_time.ToInternalValue(); i > 0; --i)
    274         last_visit -= day_delta;
    275       row.visit_time = last_visit;
    276       history_database_->UpdateVisitRow(row);
    277     }
    278     transaction.Commit();
    279   }
    280 
    281   url_index_.reset(new InMemoryURLIndex(
    282       &profile_, base::FilePath(), "en,ja,hi,zh",
    283       history_service_->history_client()));
    284   url_index_->Init();
    285   url_index_->RebuildFromHistory(history_database_);
    286 }
    287 
    288 base::FilePath::StringType InMemoryURLIndexTest::TestDBName() const {
    289     return FILE_PATH_LITERAL("url_history_provider_test.db.txt");
    290 }
    291 
    292 void InMemoryURLIndexTest::CheckTerm(
    293     const URLIndexPrivateData::SearchTermCacheMap& cache,
    294     base::string16 term) const {
    295   URLIndexPrivateData::SearchTermCacheMap::const_iterator cache_iter(
    296       cache.find(term));
    297   ASSERT_TRUE(cache.end() != cache_iter)
    298       << "Cache does not contain '" << term << "' but should.";
    299   URLIndexPrivateData::SearchTermCacheItem cache_item = cache_iter->second;
    300   EXPECT_TRUE(cache_item.used_)
    301       << "Cache item '" << term << "' should be marked as being in use.";
    302 }
    303 
    304 void InMemoryURLIndexTest::ExpectPrivateDataNotEmpty(
    305     const URLIndexPrivateData& data) {
    306   EXPECT_FALSE(data.word_list_.empty());
    307   // available_words_ will be empty since we have freshly built the
    308   // data set for these tests.
    309   EXPECT_TRUE(data.available_words_.empty());
    310   EXPECT_FALSE(data.word_map_.empty());
    311   EXPECT_FALSE(data.char_word_map_.empty());
    312   EXPECT_FALSE(data.word_id_history_map_.empty());
    313   EXPECT_FALSE(data.history_id_word_map_.empty());
    314   EXPECT_FALSE(data.history_info_map_.empty());
    315 }
    316 
    317 void InMemoryURLIndexTest::ExpectPrivateDataEmpty(
    318     const URLIndexPrivateData& data) {
    319   EXPECT_TRUE(data.word_list_.empty());
    320   EXPECT_TRUE(data.available_words_.empty());
    321   EXPECT_TRUE(data.word_map_.empty());
    322   EXPECT_TRUE(data.char_word_map_.empty());
    323   EXPECT_TRUE(data.word_id_history_map_.empty());
    324   EXPECT_TRUE(data.history_id_word_map_.empty());
    325   EXPECT_TRUE(data.history_info_map_.empty());
    326 }
    327 
    328 // Helper function which compares two maps for equivalence. The maps' values
    329 // are associative containers and their contents are compared as well.
    330 template<typename T>
    331 void ExpectMapOfContainersIdentical(const T& expected, const T& actual) {
    332   ASSERT_EQ(expected.size(), actual.size());
    333   for (typename T::const_iterator expected_iter = expected.begin();
    334        expected_iter != expected.end(); ++expected_iter) {
    335     typename T::const_iterator actual_iter = actual.find(expected_iter->first);
    336     ASSERT_TRUE(actual.end() != actual_iter);
    337     typename T::mapped_type const& expected_values(expected_iter->second);
    338     typename T::mapped_type const& actual_values(actual_iter->second);
    339     ASSERT_EQ(expected_values.size(), actual_values.size());
    340     for (typename T::mapped_type::const_iterator set_iter =
    341          expected_values.begin(); set_iter != expected_values.end(); ++set_iter)
    342       EXPECT_EQ(actual_values.count(*set_iter),
    343                 expected_values.count(*set_iter));
    344   }
    345 }
    346 
    347 void InMemoryURLIndexTest::ExpectPrivateDataEqual(
    348     const URLIndexPrivateData& expected,
    349     const URLIndexPrivateData& actual) {
    350   EXPECT_EQ(expected.word_list_.size(), actual.word_list_.size());
    351   EXPECT_EQ(expected.word_map_.size(), actual.word_map_.size());
    352   EXPECT_EQ(expected.char_word_map_.size(), actual.char_word_map_.size());
    353   EXPECT_EQ(expected.word_id_history_map_.size(),
    354             actual.word_id_history_map_.size());
    355   EXPECT_EQ(expected.history_id_word_map_.size(),
    356             actual.history_id_word_map_.size());
    357   EXPECT_EQ(expected.history_info_map_.size(), actual.history_info_map_.size());
    358   EXPECT_EQ(expected.word_starts_map_.size(), actual.word_starts_map_.size());
    359   // WordList must be index-by-index equal.
    360   size_t count = expected.word_list_.size();
    361   for (size_t i = 0; i < count; ++i)
    362     EXPECT_EQ(expected.word_list_[i], actual.word_list_[i]);
    363 
    364   ExpectMapOfContainersIdentical(expected.char_word_map_,
    365                                  actual.char_word_map_);
    366   ExpectMapOfContainersIdentical(expected.word_id_history_map_,
    367                                  actual.word_id_history_map_);
    368   ExpectMapOfContainersIdentical(expected.history_id_word_map_,
    369                                  actual.history_id_word_map_);
    370 
    371   for (HistoryInfoMap::const_iterator expected_info =
    372       expected.history_info_map_.begin();
    373       expected_info != expected.history_info_map_.end(); ++expected_info) {
    374     HistoryInfoMap::const_iterator actual_info =
    375         actual.history_info_map_.find(expected_info->first);
    376     // NOTE(yfriedman): ASSERT_NE can't be used due to incompatibility between
    377     // gtest and STLPort in the Android build. See
    378     // http://code.google.com/p/googletest/issues/detail?id=359
    379     ASSERT_TRUE(actual_info != actual.history_info_map_.end());
    380     const URLRow& expected_row(expected_info->second.url_row);
    381     const URLRow& actual_row(actual_info->second.url_row);
    382     EXPECT_EQ(expected_row.visit_count(), actual_row.visit_count());
    383     EXPECT_EQ(expected_row.typed_count(), actual_row.typed_count());
    384     EXPECT_EQ(expected_row.last_visit(), actual_row.last_visit());
    385     EXPECT_EQ(expected_row.url(), actual_row.url());
    386     const VisitInfoVector& expected_visits(expected_info->second.visits);
    387     const VisitInfoVector& actual_visits(actual_info->second.visits);
    388     EXPECT_EQ(expected_visits.size(), actual_visits.size());
    389     for (size_t i = 0;
    390          i < std::min(expected_visits.size(), actual_visits.size()); ++i) {
    391       EXPECT_EQ(expected_visits[i].first, actual_visits[i].first);
    392       EXPECT_EQ(expected_visits[i].second, actual_visits[i].second);
    393     }
    394   }
    395 
    396   for (WordStartsMap::const_iterator expected_starts =
    397       expected.word_starts_map_.begin();
    398       expected_starts != expected.word_starts_map_.end();
    399       ++expected_starts) {
    400     WordStartsMap::const_iterator actual_starts =
    401         actual.word_starts_map_.find(expected_starts->first);
    402     // NOTE(yfriedman): ASSERT_NE can't be used due to incompatibility between
    403     // gtest and STLPort in the Android build. See
    404     // http://code.google.com/p/googletest/issues/detail?id=359
    405     ASSERT_TRUE(actual_starts != actual.word_starts_map_.end());
    406     const RowWordStarts& expected_word_starts(expected_starts->second);
    407     const RowWordStarts& actual_word_starts(actual_starts->second);
    408     EXPECT_EQ(expected_word_starts.url_word_starts_.size(),
    409               actual_word_starts.url_word_starts_.size());
    410     EXPECT_TRUE(std::equal(expected_word_starts.url_word_starts_.begin(),
    411                            expected_word_starts.url_word_starts_.end(),
    412                            actual_word_starts.url_word_starts_.begin()));
    413     EXPECT_EQ(expected_word_starts.title_word_starts_.size(),
    414               actual_word_starts.title_word_starts_.size());
    415     EXPECT_TRUE(std::equal(expected_word_starts.title_word_starts_.begin(),
    416                            expected_word_starts.title_word_starts_.end(),
    417                            actual_word_starts.title_word_starts_.begin()));
    418   }
    419 }
    420 
    421 //------------------------------------------------------------------------------
    422 
    423 class LimitedInMemoryURLIndexTest : public InMemoryURLIndexTest {
    424  protected:
    425   virtual base::FilePath::StringType TestDBName() const OVERRIDE;
    426 };
    427 
    428 base::FilePath::StringType LimitedInMemoryURLIndexTest::TestDBName() const {
    429   return FILE_PATH_LITERAL("url_history_provider_test_limited.db.txt");
    430 }
    431 
    432 TEST_F(LimitedInMemoryURLIndexTest, Initialization) {
    433   // Verify that the database contains the expected number of items, which
    434   // is the pre-filtered count, i.e. all of the items.
    435   sql::Statement statement(GetDB().GetUniqueStatement("SELECT * FROM urls;"));
    436   ASSERT_TRUE(statement.is_valid());
    437   uint64 row_count = 0;
    438   while (statement.Step()) ++row_count;
    439   EXPECT_EQ(1U, row_count);
    440   url_index_.reset(new InMemoryURLIndex(
    441       &profile_, base::FilePath(), "en,ja,hi,zh",
    442       history_service_->history_client()));
    443   url_index_->Init();
    444   url_index_->RebuildFromHistory(history_database_);
    445   URLIndexPrivateData& private_data(*GetPrivateData());
    446 
    447   // history_info_map_ should have the same number of items as were filtered.
    448   EXPECT_EQ(1U, private_data.history_info_map_.size());
    449   EXPECT_EQ(35U, private_data.char_word_map_.size());
    450   EXPECT_EQ(17U, private_data.word_map_.size());
    451 }
    452 
    453 #if defined(OS_WIN)
    454 // Flaky on windows trybots: http://crbug.com/351500
    455 #define MAYBE_Retrieval DISABLED_Retrieval
    456 #else
    457 #define MAYBE_Retrieval Retrieval
    458 #endif
    459 TEST_F(InMemoryURLIndexTest, MAYBE_Retrieval) {
    460   // See if a very specific term gives a single result.
    461   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    462       ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches);
    463   ASSERT_EQ(1U, matches.size());
    464 
    465   // Verify that we got back the result we expected.
    466   EXPECT_EQ(5, matches[0].url_info.id());
    467   EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec());
    468   EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title());
    469   EXPECT_TRUE(matches[0].can_inline());
    470 
    471   // Make sure a trailing space prevents inline-ability but still results
    472   // in the expected result.
    473   matches = url_index_->HistoryItemsForTerms(
    474       ASCIIToUTF16("DrudgeReport "), base::string16::npos, kMaxMatches);
    475   ASSERT_EQ(1U, matches.size());
    476   EXPECT_EQ(5, matches[0].url_info.id());
    477   EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec());
    478   EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title());
    479   EXPECT_FALSE(matches[0].can_inline());
    480 
    481   // Search which should result in multiple results.
    482   matches = url_index_->HistoryItemsForTerms(
    483       ASCIIToUTF16("drudge"), base::string16::npos, kMaxMatches);
    484   ASSERT_EQ(2U, matches.size());
    485   // The results should be in descending score order.
    486   EXPECT_GE(matches[0].raw_score(), matches[1].raw_score());
    487 
    488   // Search which should result in nearly perfect result.
    489   matches = url_index_->HistoryItemsForTerms(
    490       ASCIIToUTF16("Nearly Perfect Result"), base::string16::npos, kMaxMatches);
    491   ASSERT_EQ(1U, matches.size());
    492   // The results should have a very high score.
    493   EXPECT_GT(matches[0].raw_score(), 900);
    494   EXPECT_EQ(32, matches[0].url_info.id());
    495   EXPECT_EQ("https://nearlyperfectresult.com/",
    496             matches[0].url_info.url().spec());  // Note: URL gets lowercased.
    497   EXPECT_EQ(ASCIIToUTF16("Practically Perfect Search Result"),
    498             matches[0].url_info.title());
    499   EXPECT_FALSE(matches[0].can_inline());
    500 
    501   // Search which should result in very poor result.
    502   matches = url_index_->HistoryItemsForTerms(
    503       ASCIIToUTF16("qui c"), base::string16::npos, kMaxMatches);
    504   ASSERT_EQ(1U, matches.size());
    505   // The results should have a poor score.
    506   EXPECT_LT(matches[0].raw_score(), 500);
    507   EXPECT_EQ(33, matches[0].url_info.id());
    508   EXPECT_EQ("http://quiteuselesssearchresultxyz.com/",
    509             matches[0].url_info.url().spec());  // Note: URL gets lowercased.
    510   EXPECT_EQ(ASCIIToUTF16("Practically Useless Search Result"),
    511             matches[0].url_info.title());
    512   EXPECT_FALSE(matches[0].can_inline());
    513 
    514   // Search which will match at the end of an URL with encoded characters.
    515   matches = url_index_->HistoryItemsForTerms(
    516       ASCIIToUTF16("Mice"), base::string16::npos, kMaxMatches);
    517   ASSERT_EQ(1U, matches.size());
    518   EXPECT_EQ(30, matches[0].url_info.id());
    519   EXPECT_FALSE(matches[0].can_inline());
    520 
    521   // Check that URLs are not escaped an escape time.
    522   matches = url_index_->HistoryItemsForTerms(
    523        ASCIIToUTF16("1% wikipedia"), base::string16::npos, kMaxMatches);
    524   ASSERT_EQ(1U, matches.size());
    525   EXPECT_EQ(35, matches[0].url_info.id());
    526   EXPECT_EQ("http://en.wikipedia.org/wiki/1%25_rule_(Internet_culture)",
    527             matches[0].url_info.url().spec());
    528 
    529   // Verify that a single term can appear multiple times in the URL and as long
    530   // as one starts the URL it is still inlined.
    531   matches = url_index_->HistoryItemsForTerms(
    532       ASCIIToUTF16("fubar"), base::string16::npos, kMaxMatches);
    533   ASSERT_EQ(1U, matches.size());
    534   EXPECT_EQ(34, matches[0].url_info.id());
    535   EXPECT_EQ("http://fubarfubarandfubar.com/", matches[0].url_info.url().spec());
    536   EXPECT_EQ(ASCIIToUTF16("Situation Normal -- FUBARED"),
    537             matches[0].url_info.title());
    538   EXPECT_TRUE(matches[0].can_inline());
    539 }
    540 
    541 TEST_F(InMemoryURLIndexTest, CursorPositionRetrieval) {
    542   // See if a very specific term with no cursor gives an empty result.
    543   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    544       ASCIIToUTF16("DrudReport"), base::string16::npos, kMaxMatches);
    545   ASSERT_EQ(0U, matches.size());
    546 
    547   // The same test with the cursor at the end should give an empty result.
    548   matches = url_index_->HistoryItemsForTerms(
    549       ASCIIToUTF16("DrudReport"), 10u, kMaxMatches);
    550   ASSERT_EQ(0U, matches.size());
    551 
    552   // If the cursor is between Drud and Report, we should find the desired
    553   // result.
    554   matches = url_index_->HistoryItemsForTerms(
    555       ASCIIToUTF16("DrudReport"), 4u, kMaxMatches);
    556   ASSERT_EQ(1U, matches.size());
    557   EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec());
    558   EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title());
    559 
    560   // Now check multi-word inputs.  No cursor should fail to find a
    561   // result on this input.
    562   matches = url_index_->HistoryItemsForTerms(
    563       ASCIIToUTF16("MORTGAGERATE DROPS"), base::string16::npos, kMaxMatches);
    564   ASSERT_EQ(0U, matches.size());
    565 
    566   // Ditto with cursor at end.
    567   matches = url_index_->HistoryItemsForTerms(
    568       ASCIIToUTF16("MORTGAGERATE DROPS"), 18u, kMaxMatches);
    569   ASSERT_EQ(0U, matches.size());
    570 
    571   // If the cursor is between MORTAGE And RATE, we should find the
    572   // desired result.
    573   matches = url_index_->HistoryItemsForTerms(
    574       ASCIIToUTF16("MORTGAGERATE DROPS"), 8u, kMaxMatches);
    575   ASSERT_EQ(1U, matches.size());
    576   EXPECT_EQ("http://www.reuters.com/article/idUSN0839880620100708",
    577             matches[0].url_info.url().spec());
    578   EXPECT_EQ(ASCIIToUTF16(
    579       "UPDATE 1-US 30-yr mortgage rate drops to new record low | Reuters"),
    580             matches[0].url_info.title());
    581 }
    582 
    583 TEST_F(InMemoryURLIndexTest, URLPrefixMatching) {
    584   // "drudgere" - found, can inline
    585   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    586       ASCIIToUTF16("drudgere"), base::string16::npos, kMaxMatches);
    587   ASSERT_EQ(1U, matches.size());
    588   EXPECT_TRUE(matches[0].can_inline());
    589 
    590   // "drudgere" - found, can inline
    591   matches = url_index_->HistoryItemsForTerms(
    592       ASCIIToUTF16("drudgere"), base::string16::npos, kMaxMatches);
    593   ASSERT_EQ(1U, matches.size());
    594   EXPECT_TRUE(matches[0].can_inline());
    595 
    596   // "www.atdmt" - not found
    597   matches = url_index_->HistoryItemsForTerms(
    598       ASCIIToUTF16("www.atdmt"), base::string16::npos, kMaxMatches);
    599   EXPECT_EQ(0U, matches.size());
    600 
    601   // "atdmt" - found, cannot inline
    602   matches = url_index_->HistoryItemsForTerms(
    603       ASCIIToUTF16("atdmt"), base::string16::npos, kMaxMatches);
    604   ASSERT_EQ(1U, matches.size());
    605   EXPECT_FALSE(matches[0].can_inline());
    606 
    607   // "view.atdmt" - found, can inline
    608   matches = url_index_->HistoryItemsForTerms(
    609       ASCIIToUTF16("view.atdmt"), base::string16::npos, kMaxMatches);
    610   ASSERT_EQ(1U, matches.size());
    611   EXPECT_TRUE(matches[0].can_inline());
    612 
    613   // "view.atdmt" - found, can inline
    614   matches = url_index_->HistoryItemsForTerms(
    615       ASCIIToUTF16("view.atdmt"), base::string16::npos, kMaxMatches);
    616   ASSERT_EQ(1U, matches.size());
    617   EXPECT_TRUE(matches[0].can_inline());
    618 
    619   // "cnn.com" - found, can inline
    620   matches = url_index_->HistoryItemsForTerms(
    621       ASCIIToUTF16("cnn.com"), base::string16::npos, kMaxMatches);
    622   ASSERT_EQ(2U, matches.size());
    623   // One match should be inline-able, the other not.
    624   EXPECT_TRUE(matches[0].can_inline() != matches[1].can_inline());
    625 
    626   // "www.cnn.com" - found, can inline
    627   matches = url_index_->HistoryItemsForTerms(
    628       ASCIIToUTF16("www.cnn.com"), base::string16::npos, kMaxMatches);
    629   ASSERT_EQ(1U, matches.size());
    630   EXPECT_TRUE(matches[0].can_inline());
    631 
    632   // "ww.cnn.com" - found because we allow mid-term matches in hostnames
    633   matches = url_index_->HistoryItemsForTerms(
    634       ASCIIToUTF16("ww.cnn.com"), base::string16::npos, kMaxMatches);
    635   ASSERT_EQ(1U, matches.size());
    636 
    637   // "www.cnn.com" - found, can inline
    638   matches = url_index_->HistoryItemsForTerms(
    639       ASCIIToUTF16("www.cnn.com"), base::string16::npos, kMaxMatches);
    640   ASSERT_EQ(1U, matches.size());
    641   EXPECT_TRUE(matches[0].can_inline());
    642 
    643   // "tp://www.cnn.com" - not found because we don't allow tp as a mid-term
    644   // match
    645   matches = url_index_->HistoryItemsForTerms(
    646       ASCIIToUTF16("tp://www.cnn.com"), base::string16::npos, kMaxMatches);
    647   ASSERT_EQ(0U, matches.size());
    648 }
    649 
    650 TEST_F(InMemoryURLIndexTest, ProperStringMatching) {
    651   // Search for the following with the expected results:
    652   // "atdmt view" - found
    653   // "atdmt.view" - not found
    654   // "view.atdmt" - found
    655   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    656       ASCIIToUTF16("atdmt view"), base::string16::npos, kMaxMatches);
    657   ASSERT_EQ(1U, matches.size());
    658   matches = url_index_->HistoryItemsForTerms(
    659        ASCIIToUTF16("atdmt.view"), base::string16::npos, kMaxMatches);
    660   ASSERT_EQ(0U, matches.size());
    661   matches = url_index_->HistoryItemsForTerms(
    662       ASCIIToUTF16("view.atdmt"), base::string16::npos, kMaxMatches);
    663   ASSERT_EQ(1U, matches.size());
    664 }
    665 
    666 TEST_F(InMemoryURLIndexTest, HugeResultSet) {
    667   // Create a huge set of qualifying history items.
    668   for (URLID row_id = 5000; row_id < 6000; ++row_id) {
    669     URLRow new_row(GURL("http://www.brokeandaloneinmanitoba.com/"), row_id);
    670     new_row.set_last_visit(base::Time::Now());
    671     EXPECT_TRUE(UpdateURL(new_row));
    672   }
    673 
    674   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    675       ASCIIToUTF16("b"), base::string16::npos, kMaxMatches);
    676   URLIndexPrivateData& private_data(*GetPrivateData());
    677   ASSERT_EQ(kMaxMatches, matches.size());
    678   // There are 7 matches already in the database.
    679   ASSERT_EQ(1008U, private_data.pre_filter_item_count_);
    680   ASSERT_EQ(500U, private_data.post_filter_item_count_);
    681   ASSERT_EQ(kMaxMatches, private_data.post_scoring_item_count_);
    682 }
    683 
    684 #if defined(OS_WIN)
    685 // Flaky on windows trybots: http://crbug.com/351500
    686 #define MAYBE_TitleSearch DISABLED_TitleSearch
    687 #else
    688 #define MAYBE_TitleSearch TitleSearch
    689 #endif
    690 TEST_F(InMemoryURLIndexTest, MAYBE_TitleSearch) {
    691   // Signal if someone has changed the test DB.
    692   EXPECT_EQ(29U, GetPrivateData()->history_info_map_.size());
    693 
    694   // Ensure title is being searched.
    695   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    696       ASCIIToUTF16("MORTGAGE RATE DROPS"), base::string16::npos, kMaxMatches);
    697   ASSERT_EQ(1U, matches.size());
    698 
    699   // Verify that we got back the result we expected.
    700   EXPECT_EQ(1, matches[0].url_info.id());
    701   EXPECT_EQ("http://www.reuters.com/article/idUSN0839880620100708",
    702             matches[0].url_info.url().spec());
    703   EXPECT_EQ(ASCIIToUTF16(
    704       "UPDATE 1-US 30-yr mortgage rate drops to new record low | Reuters"),
    705       matches[0].url_info.title());
    706 }
    707 
    708 TEST_F(InMemoryURLIndexTest, TitleChange) {
    709   // Verify current title terms retrieves desired item.
    710   base::string16 original_terms =
    711       ASCIIToUTF16("lebronomics could high taxes influence");
    712   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    713       original_terms, base::string16::npos, kMaxMatches);
    714   ASSERT_EQ(1U, matches.size());
    715 
    716   // Verify that we got back the result we expected.
    717   const URLID expected_id = 3;
    718   EXPECT_EQ(expected_id, matches[0].url_info.id());
    719   EXPECT_EQ("http://www.businessandmedia.org/articles/2010/20100708120415.aspx",
    720             matches[0].url_info.url().spec());
    721   EXPECT_EQ(ASCIIToUTF16(
    722       "LeBronomics: Could High Taxes Influence James' Team Decision?"),
    723       matches[0].url_info.title());
    724   URLRow old_row(matches[0].url_info);
    725 
    726   // Verify new title terms retrieves nothing.
    727   base::string16 new_terms = ASCIIToUTF16("does eat oats little lambs ivy");
    728   matches = url_index_->HistoryItemsForTerms(
    729       new_terms, base::string16::npos, kMaxMatches);
    730   ASSERT_EQ(0U, matches.size());
    731 
    732   // Update the row.
    733   old_row.set_title(ASCIIToUTF16("Does eat oats and little lambs eat ivy"));
    734   EXPECT_TRUE(UpdateURL(old_row));
    735 
    736   // Verify we get the row using the new terms but not the original terms.
    737   matches = url_index_->HistoryItemsForTerms(
    738       new_terms, base::string16::npos, kMaxMatches);
    739   ASSERT_EQ(1U, matches.size());
    740   EXPECT_EQ(expected_id, matches[0].url_info.id());
    741   matches = url_index_->HistoryItemsForTerms(
    742       original_terms, base::string16::npos, kMaxMatches);
    743   ASSERT_EQ(0U, matches.size());
    744 }
    745 
    746 TEST_F(InMemoryURLIndexTest, NonUniqueTermCharacterSets) {
    747   // The presence of duplicate characters should succeed. Exercise by cycling
    748   // through a string with several duplicate characters.
    749   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    750       ASCIIToUTF16("ABRA"), base::string16::npos, kMaxMatches);
    751   ASSERT_EQ(1U, matches.size());
    752   EXPECT_EQ(28, matches[0].url_info.id());
    753   EXPECT_EQ("http://www.ddj.com/windows/184416623",
    754             matches[0].url_info.url().spec());
    755 
    756   matches = url_index_->HistoryItemsForTerms(
    757       ASCIIToUTF16("ABRACAD"), base::string16::npos, kMaxMatches);
    758   ASSERT_EQ(1U, matches.size());
    759   EXPECT_EQ(28, matches[0].url_info.id());
    760 
    761   matches = url_index_->HistoryItemsForTerms(
    762       ASCIIToUTF16("ABRACADABRA"), base::string16::npos, kMaxMatches);
    763   ASSERT_EQ(1U, matches.size());
    764   EXPECT_EQ(28, matches[0].url_info.id());
    765 
    766   matches = url_index_->HistoryItemsForTerms(
    767       ASCIIToUTF16("ABRACADABR"), base::string16::npos, kMaxMatches);
    768   ASSERT_EQ(1U, matches.size());
    769   EXPECT_EQ(28, matches[0].url_info.id());
    770 
    771   matches = url_index_->HistoryItemsForTerms(
    772       ASCIIToUTF16("ABRACA"), base::string16::npos, kMaxMatches);
    773   ASSERT_EQ(1U, matches.size());
    774   EXPECT_EQ(28, matches[0].url_info.id());
    775 }
    776 
    777 TEST_F(InMemoryURLIndexTest, TypedCharacterCaching) {
    778   // Verify that match results for previously typed characters are retained
    779   // (in the term_char_word_set_cache_) and reused, if possible, in future
    780   // autocompletes.
    781 
    782   URLIndexPrivateData::SearchTermCacheMap& cache(
    783       GetPrivateData()->search_term_cache_);
    784 
    785   // The cache should be empty at this point.
    786   EXPECT_EQ(0U, cache.size());
    787 
    788   // Now simulate typing search terms into the omnibox and check the state of
    789   // the cache as each item is 'typed'.
    790 
    791   // Simulate typing "r" giving "r" in the simulated omnibox. The results for
    792   // 'r' will be not cached because it is only 1 character long.
    793   url_index_->HistoryItemsForTerms(
    794       ASCIIToUTF16("r"), base::string16::npos, kMaxMatches);
    795   EXPECT_EQ(0U, cache.size());
    796 
    797   // Simulate typing "re" giving "r re" in the simulated omnibox.
    798   // 're' should be cached at this point but not 'r' as it is a single
    799   // character.
    800   url_index_->HistoryItemsForTerms(
    801       ASCIIToUTF16("r re"), base::string16::npos, kMaxMatches);
    802   ASSERT_EQ(1U, cache.size());
    803   CheckTerm(cache, ASCIIToUTF16("re"));
    804 
    805   // Simulate typing "reco" giving "r re reco" in the simulated omnibox.
    806   // 're' and 'reco' should be cached at this point but not 'r' as it is a
    807   // single character.
    808   url_index_->HistoryItemsForTerms(
    809       ASCIIToUTF16("r re reco"), base::string16::npos, kMaxMatches);
    810   ASSERT_EQ(2U, cache.size());
    811   CheckTerm(cache, ASCIIToUTF16("re"));
    812   CheckTerm(cache, ASCIIToUTF16("reco"));
    813 
    814   // Simulate typing "mort".
    815   // Since we now have only one search term, the cached results for 're' and
    816   // 'reco' should be purged, giving us only 1 item in the cache (for 'mort').
    817   url_index_->HistoryItemsForTerms(
    818       ASCIIToUTF16("mort"), base::string16::npos, kMaxMatches);
    819   ASSERT_EQ(1U, cache.size());
    820   CheckTerm(cache, ASCIIToUTF16("mort"));
    821 
    822   // Simulate typing "reco" giving "mort reco" in the simulated omnibox.
    823   url_index_->HistoryItemsForTerms(
    824       ASCIIToUTF16("mort reco"), base::string16::npos, kMaxMatches);
    825   ASSERT_EQ(2U, cache.size());
    826   CheckTerm(cache, ASCIIToUTF16("mort"));
    827   CheckTerm(cache, ASCIIToUTF16("reco"));
    828 
    829   // Simulate a <DELETE> by removing the 'reco' and adding back the 'rec'.
    830   url_index_->HistoryItemsForTerms(
    831       ASCIIToUTF16("mort rec"), base::string16::npos, kMaxMatches);
    832   ASSERT_EQ(2U, cache.size());
    833   CheckTerm(cache, ASCIIToUTF16("mort"));
    834   CheckTerm(cache, ASCIIToUTF16("rec"));
    835 }
    836 
    837 TEST_F(InMemoryURLIndexTest, AddNewRows) {
    838   // Verify that the row we're going to add does not already exist.
    839   URLID new_row_id = 87654321;
    840   // Newly created URLRows get a last_visit time of 'right now' so it should
    841   // qualify as a quick result candidate.
    842   EXPECT_TRUE(url_index_->HistoryItemsForTerms(
    843       ASCIIToUTF16("brokeandalone"), base::string16::npos, kMaxMatches)
    844           .empty());
    845 
    846   // Add a new row.
    847   URLRow new_row(GURL("http://www.brokeandaloneinmanitoba.com/"), new_row_id++);
    848   new_row.set_last_visit(base::Time::Now());
    849   EXPECT_TRUE(UpdateURL(new_row));
    850 
    851   // Verify that we can retrieve it.
    852   EXPECT_EQ(1U, url_index_->HistoryItemsForTerms(
    853       ASCIIToUTF16("brokeandalone"), base::string16::npos, kMaxMatches).size());
    854 
    855   // Add it again just to be sure that is harmless and that it does not update
    856   // the index.
    857   EXPECT_FALSE(UpdateURL(new_row));
    858   EXPECT_EQ(1U, url_index_->HistoryItemsForTerms(
    859       ASCIIToUTF16("brokeandalone"), base::string16::npos, kMaxMatches).size());
    860 
    861   // Make up an URL that does not qualify and try to add it.
    862   URLRow unqualified_row(GURL("http://www.brokeandaloneinmanitoba.com/"),
    863                          new_row_id++);
    864   EXPECT_FALSE(UpdateURL(new_row));
    865 }
    866 
    867 TEST_F(InMemoryURLIndexTest, DeleteRows) {
    868   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    869       ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches);
    870   ASSERT_EQ(1U, matches.size());
    871 
    872   // Delete the URL then search again.
    873   EXPECT_TRUE(DeleteURL(matches[0].url_info.url()));
    874   EXPECT_TRUE(url_index_->HistoryItemsForTerms(
    875       ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches).empty());
    876 
    877   // Make up an URL that does not exist in the database and delete it.
    878   GURL url("http://www.hokeypokey.com/putyourrightfootin.html");
    879   EXPECT_FALSE(DeleteURL(url));
    880 }
    881 
    882 TEST_F(InMemoryURLIndexTest, ExpireRow) {
    883   ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
    884       ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches);
    885   ASSERT_EQ(1U, matches.size());
    886 
    887   // Determine the row id for the result, remember that id, broadcast a
    888   // delete notification, then ensure that the row has been deleted.
    889   URLsDeletedDetails deleted_details;
    890   deleted_details.all_history = false;
    891   deleted_details.rows.push_back(matches[0].url_info);
    892   Observe(chrome::NOTIFICATION_HISTORY_URLS_DELETED,
    893           content::Source<InMemoryURLIndexTest>(this),
    894           content::Details<history::HistoryDetails>(&deleted_details));
    895   EXPECT_TRUE(url_index_->HistoryItemsForTerms(
    896       ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches).empty());
    897 }
    898 
    899 TEST_F(InMemoryURLIndexTest, WhitelistedURLs) {
    900   struct TestData {
    901     const std::string url_spec;
    902     const bool expected_is_whitelisted;
    903   } data[] = {
    904     // URLs with whitelisted schemes.
    905     { "about:histograms", true },
    906     { "chrome://settings", true },
    907     { "file://localhost/Users/joeschmoe/sekrets", true },
    908     { "ftp://public.mycompany.com/myfile.txt", true },
    909     { "http://www.google.com/translate", true },
    910     { "https://www.gmail.com/", true },
    911     { "mailto:support (at) google.com", true },
    912     // URLs with unacceptable schemes.
    913     { "aaa://www.dummyhost.com;frammy", false },
    914     { "aaas://www.dummyhost.com;frammy", false },
    915     { "acap://suzie (at) somebody.com", false },
    916     { "cap://cal.example.com/Company/Holidays", false },
    917     { "cid:foo4*foo1 (at) bar.net", false },
    918     { "crid://example.com/foobar", false },
    919     { "", false },
    920     { "dict://dict.org/d:shortcake:", false },
    921     { "dns://192.168.1.1/ftp.example.org?type=A", false },
    922     { "fax:+358.555.1234567", false },
    923     { "geo:13.4125,103.8667", false },
    924     { "go:Mercedes%20Benz", false },
    925     { "gopher://farnsworth.ca:666/gopher", false },
    926     { "h323:farmer-john;sixpence", false },
    927     { "iax:johnQ (at) example.com/12022561414", false },
    928     { "icap://icap.net/service?mode=translate&lang=french", false },
    929     { "im:fred (at) example.com", false },
    930     { "imap://michael (at) minbari.org/users.*", false },
    931     { "info:ddc/22/eng//004.678", false },
    932     { "ipp://example.com/printer/fox", false },
    933     { "iris:dreg1//example.com/local/myhosts", false },
    934     { "iris.beep:dreg1//example.com/local/myhosts", false },
    935     { "iris.lws:dreg1//example.com/local/myhosts", false },
    936     { "iris.xpc:dreg1//example.com/local/myhosts", false },
    937     { "iris.xpcs:dreg1//example.com/local/myhosts", false },
    938     { "ldap://ldap.itd.umich.edu/o=University%20of%20Michigan,c=US", false },
    939     { "mid:foo4%25foo1 (at) bar.net", false },
    940     { "modem:+3585551234567;type=v32b?7e1;type=v110", false },
    941     { "msrp://atlanta.example.com:7654/jshA7weztas;tcp", false },
    942     { "msrps://atlanta.example.com:7654/jshA7weztas;tcp", false },
    943     { "news:colorectal.info.banned", false },
    944     { "nfs://server/d/e/f", false },
    945     { "nntp://www.example.com:6543/info.comp.lies/1234", false },
    946     { "pop://rg;AUTH=+APOP (at) mail.mycompany.com:8110", false },
    947     { "pres:fred (at) example.com", false },
    948     { "prospero://host.dom//pros/name", false },
    949     { "rsync://syler (at) lost.com/Source", false },
    950     { "rtsp://media.example.com:554/twister/audiotrack", false },
    951     { "service:acap://some.where.net;authentication=KERBEROSV4", false },
    952     { "shttp://www.terces.com/secret", false },
    953     { "sieve://example.com//script", false },
    954     { "sip:+1-212-555-1212:1234 (at) gateway.com;user=phone", false },
    955     { "sips:+1-212-555-1212:1234 (at) gateway.com;user=phone", false },
    956     { "sms:+15105551212?body=hello%20there", false },
    957     { "snmp://tester5 (at) example.com:8161/bridge1;800002b804616263", false },
    958     { "soap.beep://stockquoteserver.example.com/StockQuote", false },
    959     { "soap.beeps://stockquoteserver.example.com/StockQuote", false },
    960     { "tag:blogger.com,1999:blog-555", false },
    961     { "tel:+358-555-1234567;postd=pp22", false },
    962     { "telnet://mayor_margie:one2rule4All (at) www.mycity.com:6789/", false },
    963     { "tftp://example.com/mystartupfile", false },
    964     { "tip://123.123.123.123/?urn:xopen:xid", false },
    965     { "tv:nbc.com", false },
    966     { "urn:foo:A123,456", false },
    967     { "vemmi://zeus.mctel.fr/demo", false },
    968     { "wais://www.mydomain.net:8765/mydatabase", false },
    969     { "xmpp:node (at) example.com", false },
    970     { "xmpp://guest (at) example.com", false },
    971   };
    972 
    973   URLIndexPrivateData& private_data(*GetPrivateData());
    974   const std::set<std::string>& whitelist(scheme_whitelist());
    975   for (size_t i = 0; i < ARRAYSIZE_UNSAFE(data); ++i) {
    976     GURL url(data[i].url_spec);
    977     EXPECT_EQ(data[i].expected_is_whitelisted,
    978               private_data.URLSchemeIsWhitelisted(url, whitelist));
    979   }
    980 }
    981 
    982 TEST_F(InMemoryURLIndexTest, ReadVisitsFromHistory) {
    983   const HistoryInfoMap& history_info_map = GetPrivateData()->history_info_map_;
    984 
    985   // Check (for URL with id 1) that the number of visits and their
    986   // transition types are what we expect.  We don't bother checking
    987   // the timestamps because it's too much trouble.  (The timestamps go
    988   // through a transformation in InMemoryURLIndexTest::SetUp().  We
    989   // assume that if the count and transitions show up with the right
    990   // information, we're getting the right information from the history
    991   // database file.)
    992   HistoryInfoMap::const_iterator entry = history_info_map.find(1);
    993   ASSERT_TRUE(entry != history_info_map.end());
    994   {
    995     const VisitInfoVector& visits = entry->second.visits;
    996     EXPECT_EQ(3u, visits.size());
    997     EXPECT_EQ(0u, visits[0].second);
    998     EXPECT_EQ(1u, visits[1].second);
    999     EXPECT_EQ(0u, visits[2].second);
   1000   }
   1001 
   1002   // Ditto but for URL with id 35.
   1003   entry = history_info_map.find(35);
   1004   ASSERT_TRUE(entry != history_info_map.end());
   1005   {
   1006     const VisitInfoVector& visits = entry->second.visits;
   1007     EXPECT_EQ(2u, visits.size());
   1008     EXPECT_EQ(1u, visits[0].second);
   1009     EXPECT_EQ(1u, visits[1].second);
   1010   }
   1011 
   1012   // The URL with id 32 has many visits listed in the database, but we
   1013   // should only read the most recent 10 (which are all transition type 0).
   1014   entry = history_info_map.find(32);
   1015   ASSERT_TRUE(entry != history_info_map.end());
   1016   {
   1017     const VisitInfoVector& visits = entry->second.visits;
   1018     EXPECT_EQ(10u, visits.size());
   1019     for (size_t i = 0; i < visits.size(); ++i)
   1020       EXPECT_EQ(0u, visits[i].second);
   1021   }
   1022 }
   1023 
   1024 TEST_F(InMemoryURLIndexTest, CacheSaveRestore) {
   1025   base::ScopedTempDir temp_directory;
   1026   ASSERT_TRUE(temp_directory.CreateUniqueTempDir());
   1027   set_history_dir(temp_directory.path());
   1028 
   1029   URLIndexPrivateData& private_data(*GetPrivateData());
   1030 
   1031   // Ensure that there is really something there to be saved.
   1032   EXPECT_FALSE(private_data.word_list_.empty());
   1033   // available_words_ will already be empty since we have freshly built the
   1034   // data set for this test.
   1035   EXPECT_TRUE(private_data.available_words_.empty());
   1036   EXPECT_FALSE(private_data.word_map_.empty());
   1037   EXPECT_FALSE(private_data.char_word_map_.empty());
   1038   EXPECT_FALSE(private_data.word_id_history_map_.empty());
   1039   EXPECT_FALSE(private_data.history_id_word_map_.empty());
   1040   EXPECT_FALSE(private_data.history_info_map_.empty());
   1041   EXPECT_FALSE(private_data.word_starts_map_.empty());
   1042 
   1043   // Make sure the data we have was built from history.  (Version 0
   1044   // means rebuilt from history.)
   1045   EXPECT_EQ(0, private_data.restored_cache_version_);
   1046 
   1047   // Capture the current private data for later comparison to restored data.
   1048   scoped_refptr<URLIndexPrivateData> old_data(private_data.Duplicate());
   1049   const base::Time rebuild_time = private_data.last_time_rebuilt_from_history_;
   1050 
   1051   // Save then restore our private data.
   1052   CacheFileSaverObserver save_observer(&message_loop_);
   1053   url_index_->set_save_cache_observer(&save_observer);
   1054   PostSaveToCacheFileTask();
   1055   message_loop_.Run();
   1056   EXPECT_TRUE(save_observer.succeeded_);
   1057 
   1058   // Clear and then prove it's clear before restoring.
   1059   ClearPrivateData();
   1060   EXPECT_TRUE(private_data.word_list_.empty());
   1061   EXPECT_TRUE(private_data.available_words_.empty());
   1062   EXPECT_TRUE(private_data.word_map_.empty());
   1063   EXPECT_TRUE(private_data.char_word_map_.empty());
   1064   EXPECT_TRUE(private_data.word_id_history_map_.empty());
   1065   EXPECT_TRUE(private_data.history_id_word_map_.empty());
   1066   EXPECT_TRUE(private_data.history_info_map_.empty());
   1067   EXPECT_TRUE(private_data.word_starts_map_.empty());
   1068 
   1069   HistoryIndexRestoreObserver restore_observer(
   1070       base::Bind(&base::MessageLoop::Quit, base::Unretained(&message_loop_)));
   1071   url_index_->set_restore_cache_observer(&restore_observer);
   1072   PostRestoreFromCacheFileTask();
   1073   message_loop_.Run();
   1074   EXPECT_TRUE(restore_observer.succeeded());
   1075 
   1076   URLIndexPrivateData& new_data(*GetPrivateData());
   1077 
   1078   // Make sure the data we have was reloaded from cache.  (Version 0
   1079   // means rebuilt from history; anything else means restored from
   1080   // a cache version.)  Also, the rebuild time should not have changed.
   1081   EXPECT_GT(new_data.restored_cache_version_, 0);
   1082   EXPECT_EQ(rebuild_time, new_data.last_time_rebuilt_from_history_);
   1083 
   1084   // Compare the captured and restored for equality.
   1085   ExpectPrivateDataEqual(*old_data.get(), new_data);
   1086 }
   1087 
   1088 TEST_F(InMemoryURLIndexTest, RebuildFromHistoryIfCacheOld) {
   1089   base::ScopedTempDir temp_directory;
   1090   ASSERT_TRUE(temp_directory.CreateUniqueTempDir());
   1091   set_history_dir(temp_directory.path());
   1092 
   1093   URLIndexPrivateData& private_data(*GetPrivateData());
   1094 
   1095   // Ensure that there is really something there to be saved.
   1096   EXPECT_FALSE(private_data.word_list_.empty());
   1097   // available_words_ will already be empty since we have freshly built the
   1098   // data set for this test.
   1099   EXPECT_TRUE(private_data.available_words_.empty());
   1100   EXPECT_FALSE(private_data.word_map_.empty());
   1101   EXPECT_FALSE(private_data.char_word_map_.empty());
   1102   EXPECT_FALSE(private_data.word_id_history_map_.empty());
   1103   EXPECT_FALSE(private_data.history_id_word_map_.empty());
   1104   EXPECT_FALSE(private_data.history_info_map_.empty());
   1105   EXPECT_FALSE(private_data.word_starts_map_.empty());
   1106 
   1107   // Make sure the data we have was built from history.  (Version 0
   1108   // means rebuilt from history.)
   1109   EXPECT_EQ(0, private_data.restored_cache_version_);
   1110 
   1111   // Overwrite the build time so that we'll think the data is too old
   1112   // and rebuild the cache from history.
   1113   const base::Time fake_rebuild_time =
   1114       private_data.last_time_rebuilt_from_history_ -
   1115       base::TimeDelta::FromDays(30);
   1116   private_data.last_time_rebuilt_from_history_ = fake_rebuild_time;
   1117 
   1118   // Capture the current private data for later comparison to restored data.
   1119   scoped_refptr<URLIndexPrivateData> old_data(private_data.Duplicate());
   1120 
   1121   // Save then restore our private data.
   1122   CacheFileSaverObserver save_observer(&message_loop_);
   1123   url_index_->set_save_cache_observer(&save_observer);
   1124   PostSaveToCacheFileTask();
   1125   message_loop_.Run();
   1126   EXPECT_TRUE(save_observer.succeeded_);
   1127 
   1128   // Clear and then prove it's clear before restoring.
   1129   ClearPrivateData();
   1130   EXPECT_TRUE(private_data.word_list_.empty());
   1131   EXPECT_TRUE(private_data.available_words_.empty());
   1132   EXPECT_TRUE(private_data.word_map_.empty());
   1133   EXPECT_TRUE(private_data.char_word_map_.empty());
   1134   EXPECT_TRUE(private_data.word_id_history_map_.empty());
   1135   EXPECT_TRUE(private_data.history_id_word_map_.empty());
   1136   EXPECT_TRUE(private_data.history_info_map_.empty());
   1137   EXPECT_TRUE(private_data.word_starts_map_.empty());
   1138 
   1139   HistoryIndexRestoreObserver restore_observer(
   1140       base::Bind(&base::MessageLoop::Quit, base::Unretained(&message_loop_)));
   1141   url_index_->set_restore_cache_observer(&restore_observer);
   1142   PostRestoreFromCacheFileTask();
   1143   message_loop_.Run();
   1144   EXPECT_TRUE(restore_observer.succeeded());
   1145 
   1146   URLIndexPrivateData& new_data(*GetPrivateData());
   1147 
   1148   // Make sure the data we have was rebuilt from history.  (Version 0
   1149   // means rebuilt from history; anything else means restored from
   1150   // a cache version.)
   1151   EXPECT_EQ(0, new_data.restored_cache_version_);
   1152   EXPECT_NE(fake_rebuild_time, new_data.last_time_rebuilt_from_history_);
   1153 
   1154   // Compare the captured and restored for equality.
   1155   ExpectPrivateDataEqual(*old_data.get(), new_data);
   1156 }
   1157 
   1158 class InMemoryURLIndexCacheTest : public testing::Test {
   1159  public:
   1160   InMemoryURLIndexCacheTest() {}
   1161 
   1162  protected:
   1163   virtual void SetUp() OVERRIDE;
   1164 
   1165   // Pass-through functions to simplify our friendship with InMemoryURLIndex.
   1166   void set_history_dir(const base::FilePath& dir_path);
   1167   bool GetCacheFilePath(base::FilePath* file_path) const;
   1168 
   1169   base::ScopedTempDir temp_dir_;
   1170   scoped_ptr<InMemoryURLIndex> url_index_;
   1171 };
   1172 
   1173 void InMemoryURLIndexCacheTest::SetUp() {
   1174   ASSERT_TRUE(temp_dir_.CreateUniqueTempDir());
   1175   HistoryClient history_client;
   1176   base::FilePath path(temp_dir_.path());
   1177   url_index_.reset(new InMemoryURLIndex(
   1178       NULL, path, "en,ja,hi,zh", &history_client));
   1179 }
   1180 
   1181 void InMemoryURLIndexCacheTest::set_history_dir(
   1182     const base::FilePath& dir_path) {
   1183   return url_index_->set_history_dir(dir_path);
   1184 }
   1185 
   1186 bool InMemoryURLIndexCacheTest::GetCacheFilePath(
   1187     base::FilePath* file_path) const {
   1188   DCHECK(file_path);
   1189   return url_index_->GetCacheFilePath(file_path);
   1190 }
   1191 
   1192 TEST_F(InMemoryURLIndexCacheTest, CacheFilePath) {
   1193   base::FilePath expectedPath =
   1194       temp_dir_.path().Append(FILE_PATH_LITERAL("History Provider Cache"));
   1195   std::vector<base::FilePath::StringType> expected_parts;
   1196   expectedPath.GetComponents(&expected_parts);
   1197   base::FilePath full_file_path;
   1198   ASSERT_TRUE(GetCacheFilePath(&full_file_path));
   1199   std::vector<base::FilePath::StringType> actual_parts;
   1200   full_file_path.GetComponents(&actual_parts);
   1201   ASSERT_EQ(expected_parts.size(), actual_parts.size());
   1202   size_t count = expected_parts.size();
   1203   for (size_t i = 0; i < count; ++i)
   1204     EXPECT_EQ(expected_parts[i], actual_parts[i]);
   1205   // Must clear the history_dir_ to satisfy the dtor's DCHECK.
   1206   set_history_dir(base::FilePath());
   1207 }
   1208 
   1209 }  // namespace history
   1210