1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
8 #include "base/auto_reset.h"
9 #include "base/file_util.h"
10 #include "base/files/file_path.h"
11 #include "base/files/scoped_temp_dir.h"
12 #include "base/message_loop/message_loop.h"
13 #include "base/path_service.h"
14 #include "base/strings/string16.h"
15 #include "base/strings/string_util.h"
16 #include "base/strings/utf_string_conversions.h"
17 #include "chrome/browser/bookmarks/bookmark_model_factory.h"
18 #include "chrome/browser/chrome_notification_types.h"
19 #include "chrome/browser/history/history_backend.h"
20 #include "chrome/browser/history/history_database.h"
21 #include "chrome/browser/history/history_notifications.h"
22 #include "chrome/browser/history/history_service.h"
23 #include "chrome/browser/history/history_service_factory.h"
24 #include "chrome/browser/history/in_memory_url_index.h"
25 #include "chrome/browser/history/in_memory_url_index_types.h"
26 #include "chrome/browser/history/url_index_private_data.h"
27 #include "chrome/common/chrome_paths.h"
28 #include "chrome/test/base/history_index_restore_observer.h"
29 #include "chrome/test/base/testing_profile.h"
30 #include "components/bookmarks/test/bookmark_test_helpers.h"
31 #include "components/history/core/browser/history_client.h"
32 #include "content/public/browser/notification_details.h"
33 #include "content/public/browser/notification_source.h"
34 #include "content/public/test/test_browser_thread.h"
35 #include "sql/transaction.h"
36 #include "testing/gtest/include/gtest/gtest.h"
38 using base::ASCIIToUTF16;
39 using content::BrowserThread;
42 const size_t kMaxMatches = 3;
45 // The test version of the history url database table ('url') is contained in
46 // a database file created from a text file('url_history_provider_test.db.txt').
47 // The only difference between this table and a live 'urls' table from a
48 // profile is that the last_visit_time column in the test table contains a
49 // number specifying the number of days relative to 'today' to which the
50 // absolute time should be set during the test setup stage.
52 // The format of the test database text file is of a SQLite .dump file.
53 // Note that only lines whose first character is an upper-case letter are
54 // processed when creating the test database.
58 // -----------------------------------------------------------------------------
60 // Observer class so the unit tests can wait while the cache is being saved.
61 class CacheFileSaverObserver : public InMemoryURLIndex::SaveCacheObserver {
63 explicit CacheFileSaverObserver(base::MessageLoop* loop);
64 virtual void OnCacheSaveFinished(bool succeeded) OVERRIDE;
66 base::MessageLoop* loop_;
68 DISALLOW_COPY_AND_ASSIGN(CacheFileSaverObserver);
71 CacheFileSaverObserver::CacheFileSaverObserver(base::MessageLoop* loop)
77 void CacheFileSaverObserver::OnCacheSaveFinished(bool succeeded) {
78 succeeded_ = succeeded;
82 // -----------------------------------------------------------------------------
84 class InMemoryURLIndexTest : public testing::Test {
86 InMemoryURLIndexTest();
92 // Allows the database containing the test data to be customized by
94 virtual base::FilePath::StringType TestDBName() const;
96 // Validates that the given |term| is contained in |cache| and that it is
98 void CheckTerm(const URLIndexPrivateData::SearchTermCacheMap& cache,
99 base::string16 term) const;
101 // Pass-through function to simplify our friendship with HistoryService.
102 sql::Connection& GetDB();
104 // Pass-through functions to simplify our friendship with InMemoryURLIndex.
105 URLIndexPrivateData* GetPrivateData() const;
106 void ClearPrivateData();
107 void set_history_dir(const base::FilePath& dir_path);
108 bool GetCacheFilePath(base::FilePath* file_path) const;
109 void PostRestoreFromCacheFileTask();
110 void PostSaveToCacheFileTask();
111 void Observe(int notification_type,
112 const content::NotificationSource& source,
113 const content::NotificationDetails& details);
114 const std::set<std::string>& scheme_whitelist();
117 // Pass-through functions to simplify our friendship with URLIndexPrivateData.
118 bool UpdateURL(const URLRow& row);
119 bool DeleteURL(const GURL& url);
121 // Data verification helper functions.
122 void ExpectPrivateDataNotEmpty(const URLIndexPrivateData& data);
123 void ExpectPrivateDataEmpty(const URLIndexPrivateData& data);
124 void ExpectPrivateDataEqual(const URLIndexPrivateData& expected,
125 const URLIndexPrivateData& actual);
127 base::MessageLoopForUI message_loop_;
128 content::TestBrowserThread ui_thread_;
129 content::TestBrowserThread file_thread_;
130 TestingProfile profile_;
131 HistoryService* history_service_;
133 scoped_ptr<InMemoryURLIndex> url_index_;
134 HistoryDatabase* history_database_;
137 InMemoryURLIndexTest::InMemoryURLIndexTest()
138 : ui_thread_(content::BrowserThread::UI, &message_loop_),
139 file_thread_(content::BrowserThread::FILE, &message_loop_) {
142 sql::Connection& InMemoryURLIndexTest::GetDB() {
143 return history_database_->GetDB();
146 URLIndexPrivateData* InMemoryURLIndexTest::GetPrivateData() const {
147 DCHECK(url_index_->private_data());
148 return url_index_->private_data();
151 void InMemoryURLIndexTest::ClearPrivateData() {
152 return url_index_->ClearPrivateData();
155 void InMemoryURLIndexTest::set_history_dir(const base::FilePath& dir_path) {
156 return url_index_->set_history_dir(dir_path);
159 bool InMemoryURLIndexTest::GetCacheFilePath(base::FilePath* file_path) const {
161 return url_index_->GetCacheFilePath(file_path);
164 void InMemoryURLIndexTest::PostRestoreFromCacheFileTask() {
165 url_index_->PostRestoreFromCacheFileTask();
168 void InMemoryURLIndexTest::PostSaveToCacheFileTask() {
169 url_index_->PostSaveToCacheFileTask();
172 void InMemoryURLIndexTest::Observe(
173 int notification_type,
174 const content::NotificationSource& source,
175 const content::NotificationDetails& details) {
176 url_index_->Observe(notification_type, source, details);
179 const std::set<std::string>& InMemoryURLIndexTest::scheme_whitelist() {
180 return url_index_->scheme_whitelist();
183 bool InMemoryURLIndexTest::UpdateURL(const URLRow& row) {
184 return GetPrivateData()->UpdateURL(
185 history_service_, row, url_index_->languages_,
186 url_index_->scheme_whitelist_);
189 bool InMemoryURLIndexTest::DeleteURL(const GURL& url) {
190 return GetPrivateData()->DeleteURL(url);
193 void InMemoryURLIndexTest::SetUp() {
194 // We cannot access the database until the backend has been loaded.
195 ASSERT_TRUE(profile_.CreateHistoryService(true, false));
196 profile_.CreateBookmarkModel(true);
197 test::WaitForBookmarkModelToLoad(
198 BookmarkModelFactory::GetForProfile(&profile_));
199 profile_.BlockUntilHistoryProcessesPendingRequests();
200 profile_.BlockUntilHistoryIndexIsRefreshed();
201 history_service_ = HistoryServiceFactory::GetForProfile(
202 &profile_, Profile::EXPLICIT_ACCESS);
203 ASSERT_TRUE(history_service_);
204 HistoryBackend* backend = history_service_->history_backend_.get();
205 history_database_ = backend->db();
207 // Create and populate a working copy of the URL history database.
208 base::FilePath history_proto_path;
209 PathService::Get(chrome::DIR_TEST_DATA, &history_proto_path);
210 history_proto_path = history_proto_path.Append(
211 FILE_PATH_LITERAL("History"));
212 history_proto_path = history_proto_path.Append(TestDBName());
213 EXPECT_TRUE(base::PathExists(history_proto_path));
215 std::ifstream proto_file(history_proto_path.value().c_str());
216 static const size_t kCommandBufferMaxSize = 2048;
217 char sql_cmd_line[kCommandBufferMaxSize];
219 sql::Connection& db(GetDB());
220 ASSERT_TRUE(db.is_open());
222 sql::Transaction transaction(&db);
224 while (!proto_file.eof()) {
225 proto_file.getline(sql_cmd_line, kCommandBufferMaxSize);
226 if (!proto_file.eof()) {
227 // We only process lines which begin with a upper-case letter.
228 // TODO(mrossetti): Can iswupper() be used here?
229 if (sql_cmd_line[0] >= 'A' && sql_cmd_line[0] <= 'Z') {
230 std::string sql_cmd(sql_cmd_line);
231 sql::Statement sql_stmt(db.GetUniqueStatement(sql_cmd_line));
232 EXPECT_TRUE(sql_stmt.Run());
236 transaction.Commit();
239 // Update the last_visit_time table column in the "urls" table
240 // such that it represents a time relative to 'now'.
241 sql::Statement statement(db.GetUniqueStatement(
242 "SELECT" HISTORY_URL_ROW_FIELDS "FROM urls;"));
243 ASSERT_TRUE(statement.is_valid());
244 base::Time time_right_now = base::Time::NowFromSystemTime();
245 base::TimeDelta day_delta = base::TimeDelta::FromDays(1);
247 sql::Transaction transaction(&db);
249 while (statement.Step()) {
251 history_database_->FillURLRow(statement, &row);
252 base::Time last_visit = time_right_now;
253 for (int64 i = row.last_visit().ToInternalValue(); i > 0; --i)
254 last_visit -= day_delta;
255 row.set_last_visit(last_visit);
256 history_database_->UpdateURLRow(row.id(), row);
258 transaction.Commit();
261 // Update the visit_time table column in the "visits" table
262 // such that it represents a time relative to 'now'.
263 statement.Assign(db.GetUniqueStatement(
264 "SELECT" HISTORY_VISIT_ROW_FIELDS "FROM visits;"));
265 ASSERT_TRUE(statement.is_valid());
267 sql::Transaction transaction(&db);
269 while (statement.Step()) {
271 history_database_->FillVisitRow(statement, &row);
272 base::Time last_visit = time_right_now;
273 for (int64 i = row.visit_time.ToInternalValue(); i > 0; --i)
274 last_visit -= day_delta;
275 row.visit_time = last_visit;
276 history_database_->UpdateVisitRow(row);
278 transaction.Commit();
281 url_index_.reset(new InMemoryURLIndex(
282 &profile_, base::FilePath(), "en,ja,hi,zh",
283 history_service_->history_client()));
285 url_index_->RebuildFromHistory(history_database_);
288 base::FilePath::StringType InMemoryURLIndexTest::TestDBName() const {
289 return FILE_PATH_LITERAL("url_history_provider_test.db.txt");
292 void InMemoryURLIndexTest::CheckTerm(
293 const URLIndexPrivateData::SearchTermCacheMap& cache,
294 base::string16 term) const {
295 URLIndexPrivateData::SearchTermCacheMap::const_iterator cache_iter(
297 ASSERT_TRUE(cache.end() != cache_iter)
298 << "Cache does not contain '" << term << "' but should.";
299 URLIndexPrivateData::SearchTermCacheItem cache_item = cache_iter->second;
300 EXPECT_TRUE(cache_item.used_)
301 << "Cache item '" << term << "' should be marked as being in use.";
304 void InMemoryURLIndexTest::ExpectPrivateDataNotEmpty(
305 const URLIndexPrivateData& data) {
306 EXPECT_FALSE(data.word_list_.empty());
307 // available_words_ will be empty since we have freshly built the
308 // data set for these tests.
309 EXPECT_TRUE(data.available_words_.empty());
310 EXPECT_FALSE(data.word_map_.empty());
311 EXPECT_FALSE(data.char_word_map_.empty());
312 EXPECT_FALSE(data.word_id_history_map_.empty());
313 EXPECT_FALSE(data.history_id_word_map_.empty());
314 EXPECT_FALSE(data.history_info_map_.empty());
317 void InMemoryURLIndexTest::ExpectPrivateDataEmpty(
318 const URLIndexPrivateData& data) {
319 EXPECT_TRUE(data.word_list_.empty());
320 EXPECT_TRUE(data.available_words_.empty());
321 EXPECT_TRUE(data.word_map_.empty());
322 EXPECT_TRUE(data.char_word_map_.empty());
323 EXPECT_TRUE(data.word_id_history_map_.empty());
324 EXPECT_TRUE(data.history_id_word_map_.empty());
325 EXPECT_TRUE(data.history_info_map_.empty());
328 // Helper function which compares two maps for equivalence. The maps' values
329 // are associative containers and their contents are compared as well.
331 void ExpectMapOfContainersIdentical(const T& expected, const T& actual) {
332 ASSERT_EQ(expected.size(), actual.size());
333 for (typename T::const_iterator expected_iter = expected.begin();
334 expected_iter != expected.end(); ++expected_iter) {
335 typename T::const_iterator actual_iter = actual.find(expected_iter->first);
336 ASSERT_TRUE(actual.end() != actual_iter);
337 typename T::mapped_type const& expected_values(expected_iter->second);
338 typename T::mapped_type const& actual_values(actual_iter->second);
339 ASSERT_EQ(expected_values.size(), actual_values.size());
340 for (typename T::mapped_type::const_iterator set_iter =
341 expected_values.begin(); set_iter != expected_values.end(); ++set_iter)
342 EXPECT_EQ(actual_values.count(*set_iter),
343 expected_values.count(*set_iter));
347 void InMemoryURLIndexTest::ExpectPrivateDataEqual(
348 const URLIndexPrivateData& expected,
349 const URLIndexPrivateData& actual) {
350 EXPECT_EQ(expected.word_list_.size(), actual.word_list_.size());
351 EXPECT_EQ(expected.word_map_.size(), actual.word_map_.size());
352 EXPECT_EQ(expected.char_word_map_.size(), actual.char_word_map_.size());
353 EXPECT_EQ(expected.word_id_history_map_.size(),
354 actual.word_id_history_map_.size());
355 EXPECT_EQ(expected.history_id_word_map_.size(),
356 actual.history_id_word_map_.size());
357 EXPECT_EQ(expected.history_info_map_.size(), actual.history_info_map_.size());
358 EXPECT_EQ(expected.word_starts_map_.size(), actual.word_starts_map_.size());
359 // WordList must be index-by-index equal.
360 size_t count = expected.word_list_.size();
361 for (size_t i = 0; i < count; ++i)
362 EXPECT_EQ(expected.word_list_[i], actual.word_list_[i]);
364 ExpectMapOfContainersIdentical(expected.char_word_map_,
365 actual.char_word_map_);
366 ExpectMapOfContainersIdentical(expected.word_id_history_map_,
367 actual.word_id_history_map_);
368 ExpectMapOfContainersIdentical(expected.history_id_word_map_,
369 actual.history_id_word_map_);
371 for (HistoryInfoMap::const_iterator expected_info =
372 expected.history_info_map_.begin();
373 expected_info != expected.history_info_map_.end(); ++expected_info) {
374 HistoryInfoMap::const_iterator actual_info =
375 actual.history_info_map_.find(expected_info->first);
376 // NOTE(yfriedman): ASSERT_NE can't be used due to incompatibility between
377 // gtest and STLPort in the Android build. See
378 // http://code.google.com/p/googletest/issues/detail?id=359
379 ASSERT_TRUE(actual_info != actual.history_info_map_.end());
380 const URLRow& expected_row(expected_info->second.url_row);
381 const URLRow& actual_row(actual_info->second.url_row);
382 EXPECT_EQ(expected_row.visit_count(), actual_row.visit_count());
383 EXPECT_EQ(expected_row.typed_count(), actual_row.typed_count());
384 EXPECT_EQ(expected_row.last_visit(), actual_row.last_visit());
385 EXPECT_EQ(expected_row.url(), actual_row.url());
386 const VisitInfoVector& expected_visits(expected_info->second.visits);
387 const VisitInfoVector& actual_visits(actual_info->second.visits);
388 EXPECT_EQ(expected_visits.size(), actual_visits.size());
390 i < std::min(expected_visits.size(), actual_visits.size()); ++i) {
391 EXPECT_EQ(expected_visits[i].first, actual_visits[i].first);
392 EXPECT_EQ(expected_visits[i].second, actual_visits[i].second);
396 for (WordStartsMap::const_iterator expected_starts =
397 expected.word_starts_map_.begin();
398 expected_starts != expected.word_starts_map_.end();
400 WordStartsMap::const_iterator actual_starts =
401 actual.word_starts_map_.find(expected_starts->first);
402 // NOTE(yfriedman): ASSERT_NE can't be used due to incompatibility between
403 // gtest and STLPort in the Android build. See
404 // http://code.google.com/p/googletest/issues/detail?id=359
405 ASSERT_TRUE(actual_starts != actual.word_starts_map_.end());
406 const RowWordStarts& expected_word_starts(expected_starts->second);
407 const RowWordStarts& actual_word_starts(actual_starts->second);
408 EXPECT_EQ(expected_word_starts.url_word_starts_.size(),
409 actual_word_starts.url_word_starts_.size());
410 EXPECT_TRUE(std::equal(expected_word_starts.url_word_starts_.begin(),
411 expected_word_starts.url_word_starts_.end(),
412 actual_word_starts.url_word_starts_.begin()));
413 EXPECT_EQ(expected_word_starts.title_word_starts_.size(),
414 actual_word_starts.title_word_starts_.size());
415 EXPECT_TRUE(std::equal(expected_word_starts.title_word_starts_.begin(),
416 expected_word_starts.title_word_starts_.end(),
417 actual_word_starts.title_word_starts_.begin()));
421 //------------------------------------------------------------------------------
423 class LimitedInMemoryURLIndexTest : public InMemoryURLIndexTest {
425 virtual base::FilePath::StringType TestDBName() const OVERRIDE;
428 base::FilePath::StringType LimitedInMemoryURLIndexTest::TestDBName() const {
429 return FILE_PATH_LITERAL("url_history_provider_test_limited.db.txt");
432 TEST_F(LimitedInMemoryURLIndexTest, Initialization) {
433 // Verify that the database contains the expected number of items, which
434 // is the pre-filtered count, i.e. all of the items.
435 sql::Statement statement(GetDB().GetUniqueStatement("SELECT * FROM urls;"));
436 ASSERT_TRUE(statement.is_valid());
437 uint64 row_count = 0;
438 while (statement.Step()) ++row_count;
439 EXPECT_EQ(1U, row_count);
440 url_index_.reset(new InMemoryURLIndex(
441 &profile_, base::FilePath(), "en,ja,hi,zh",
442 history_service_->history_client()));
444 url_index_->RebuildFromHistory(history_database_);
445 URLIndexPrivateData& private_data(*GetPrivateData());
447 // history_info_map_ should have the same number of items as were filtered.
448 EXPECT_EQ(1U, private_data.history_info_map_.size());
449 EXPECT_EQ(35U, private_data.char_word_map_.size());
450 EXPECT_EQ(17U, private_data.word_map_.size());
454 // Flaky on windows trybots: http://crbug.com/351500
455 #define MAYBE_Retrieval DISABLED_Retrieval
457 #define MAYBE_Retrieval Retrieval
459 TEST_F(InMemoryURLIndexTest, MAYBE_Retrieval) {
460 // See if a very specific term gives a single result.
461 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
462 ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches);
463 ASSERT_EQ(1U, matches.size());
465 // Verify that we got back the result we expected.
466 EXPECT_EQ(5, matches[0].url_info.id());
467 EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec());
468 EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title());
469 EXPECT_TRUE(matches[0].can_inline());
471 // Make sure a trailing space prevents inline-ability but still results
472 // in the expected result.
473 matches = url_index_->HistoryItemsForTerms(
474 ASCIIToUTF16("DrudgeReport "), base::string16::npos, kMaxMatches);
475 ASSERT_EQ(1U, matches.size());
476 EXPECT_EQ(5, matches[0].url_info.id());
477 EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec());
478 EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title());
479 EXPECT_FALSE(matches[0].can_inline());
481 // Search which should result in multiple results.
482 matches = url_index_->HistoryItemsForTerms(
483 ASCIIToUTF16("drudge"), base::string16::npos, kMaxMatches);
484 ASSERT_EQ(2U, matches.size());
485 // The results should be in descending score order.
486 EXPECT_GE(matches[0].raw_score(), matches[1].raw_score());
488 // Search which should result in nearly perfect result.
489 matches = url_index_->HistoryItemsForTerms(
490 ASCIIToUTF16("Nearly Perfect Result"), base::string16::npos, kMaxMatches);
491 ASSERT_EQ(1U, matches.size());
492 // The results should have a very high score.
493 EXPECT_GT(matches[0].raw_score(), 900);
494 EXPECT_EQ(32, matches[0].url_info.id());
495 EXPECT_EQ("https://nearlyperfectresult.com/",
496 matches[0].url_info.url().spec()); // Note: URL gets lowercased.
497 EXPECT_EQ(ASCIIToUTF16("Practically Perfect Search Result"),
498 matches[0].url_info.title());
499 EXPECT_FALSE(matches[0].can_inline());
501 // Search which should result in very poor result.
502 matches = url_index_->HistoryItemsForTerms(
503 ASCIIToUTF16("qui c"), base::string16::npos, kMaxMatches);
504 ASSERT_EQ(1U, matches.size());
505 // The results should have a poor score.
506 EXPECT_LT(matches[0].raw_score(), 500);
507 EXPECT_EQ(33, matches[0].url_info.id());
508 EXPECT_EQ("http://quiteuselesssearchresultxyz.com/",
509 matches[0].url_info.url().spec()); // Note: URL gets lowercased.
510 EXPECT_EQ(ASCIIToUTF16("Practically Useless Search Result"),
511 matches[0].url_info.title());
512 EXPECT_FALSE(matches[0].can_inline());
514 // Search which will match at the end of an URL with encoded characters.
515 matches = url_index_->HistoryItemsForTerms(
516 ASCIIToUTF16("Mice"), base::string16::npos, kMaxMatches);
517 ASSERT_EQ(1U, matches.size());
518 EXPECT_EQ(30, matches[0].url_info.id());
519 EXPECT_FALSE(matches[0].can_inline());
521 // Check that URLs are not escaped an escape time.
522 matches = url_index_->HistoryItemsForTerms(
523 ASCIIToUTF16("1% wikipedia"), base::string16::npos, kMaxMatches);
524 ASSERT_EQ(1U, matches.size());
525 EXPECT_EQ(35, matches[0].url_info.id());
526 EXPECT_EQ("http://en.wikipedia.org/wiki/1%25_rule_(Internet_culture)",
527 matches[0].url_info.url().spec());
529 // Verify that a single term can appear multiple times in the URL and as long
530 // as one starts the URL it is still inlined.
531 matches = url_index_->HistoryItemsForTerms(
532 ASCIIToUTF16("fubar"), base::string16::npos, kMaxMatches);
533 ASSERT_EQ(1U, matches.size());
534 EXPECT_EQ(34, matches[0].url_info.id());
535 EXPECT_EQ("http://fubarfubarandfubar.com/", matches[0].url_info.url().spec());
536 EXPECT_EQ(ASCIIToUTF16("Situation Normal -- FUBARED"),
537 matches[0].url_info.title());
538 EXPECT_TRUE(matches[0].can_inline());
541 TEST_F(InMemoryURLIndexTest, CursorPositionRetrieval) {
542 // See if a very specific term with no cursor gives an empty result.
543 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
544 ASCIIToUTF16("DrudReport"), base::string16::npos, kMaxMatches);
545 ASSERT_EQ(0U, matches.size());
547 // The same test with the cursor at the end should give an empty result.
548 matches = url_index_->HistoryItemsForTerms(
549 ASCIIToUTF16("DrudReport"), 10u, kMaxMatches);
550 ASSERT_EQ(0U, matches.size());
552 // If the cursor is between Drud and Report, we should find the desired
554 matches = url_index_->HistoryItemsForTerms(
555 ASCIIToUTF16("DrudReport"), 4u, kMaxMatches);
556 ASSERT_EQ(1U, matches.size());
557 EXPECT_EQ("http://drudgereport.com/", matches[0].url_info.url().spec());
558 EXPECT_EQ(ASCIIToUTF16("DRUDGE REPORT 2010"), matches[0].url_info.title());
560 // Now check multi-word inputs. No cursor should fail to find a
561 // result on this input.
562 matches = url_index_->HistoryItemsForTerms(
563 ASCIIToUTF16("MORTGAGERATE DROPS"), base::string16::npos, kMaxMatches);
564 ASSERT_EQ(0U, matches.size());
566 // Ditto with cursor at end.
567 matches = url_index_->HistoryItemsForTerms(
568 ASCIIToUTF16("MORTGAGERATE DROPS"), 18u, kMaxMatches);
569 ASSERT_EQ(0U, matches.size());
571 // If the cursor is between MORTAGE And RATE, we should find the
573 matches = url_index_->HistoryItemsForTerms(
574 ASCIIToUTF16("MORTGAGERATE DROPS"), 8u, kMaxMatches);
575 ASSERT_EQ(1U, matches.size());
576 EXPECT_EQ("http://www.reuters.com/article/idUSN0839880620100708",
577 matches[0].url_info.url().spec());
578 EXPECT_EQ(ASCIIToUTF16(
579 "UPDATE 1-US 30-yr mortgage rate drops to new record low | Reuters"),
580 matches[0].url_info.title());
583 TEST_F(InMemoryURLIndexTest, URLPrefixMatching) {
584 // "drudgere" - found, can inline
585 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
586 ASCIIToUTF16("drudgere"), base::string16::npos, kMaxMatches);
587 ASSERT_EQ(1U, matches.size());
588 EXPECT_TRUE(matches[0].can_inline());
590 // "drudgere" - found, can inline
591 matches = url_index_->HistoryItemsForTerms(
592 ASCIIToUTF16("drudgere"), base::string16::npos, kMaxMatches);
593 ASSERT_EQ(1U, matches.size());
594 EXPECT_TRUE(matches[0].can_inline());
596 // "www.atdmt" - not found
597 matches = url_index_->HistoryItemsForTerms(
598 ASCIIToUTF16("www.atdmt"), base::string16::npos, kMaxMatches);
599 EXPECT_EQ(0U, matches.size());
601 // "atdmt" - found, cannot inline
602 matches = url_index_->HistoryItemsForTerms(
603 ASCIIToUTF16("atdmt"), base::string16::npos, kMaxMatches);
604 ASSERT_EQ(1U, matches.size());
605 EXPECT_FALSE(matches[0].can_inline());
607 // "view.atdmt" - found, can inline
608 matches = url_index_->HistoryItemsForTerms(
609 ASCIIToUTF16("view.atdmt"), base::string16::npos, kMaxMatches);
610 ASSERT_EQ(1U, matches.size());
611 EXPECT_TRUE(matches[0].can_inline());
613 // "view.atdmt" - found, can inline
614 matches = url_index_->HistoryItemsForTerms(
615 ASCIIToUTF16("view.atdmt"), base::string16::npos, kMaxMatches);
616 ASSERT_EQ(1U, matches.size());
617 EXPECT_TRUE(matches[0].can_inline());
619 // "cnn.com" - found, can inline
620 matches = url_index_->HistoryItemsForTerms(
621 ASCIIToUTF16("cnn.com"), base::string16::npos, kMaxMatches);
622 ASSERT_EQ(2U, matches.size());
623 // One match should be inline-able, the other not.
624 EXPECT_TRUE(matches[0].can_inline() != matches[1].can_inline());
626 // "www.cnn.com" - found, can inline
627 matches = url_index_->HistoryItemsForTerms(
628 ASCIIToUTF16("www.cnn.com"), base::string16::npos, kMaxMatches);
629 ASSERT_EQ(1U, matches.size());
630 EXPECT_TRUE(matches[0].can_inline());
632 // "ww.cnn.com" - found because we allow mid-term matches in hostnames
633 matches = url_index_->HistoryItemsForTerms(
634 ASCIIToUTF16("ww.cnn.com"), base::string16::npos, kMaxMatches);
635 ASSERT_EQ(1U, matches.size());
637 // "www.cnn.com" - found, can inline
638 matches = url_index_->HistoryItemsForTerms(
639 ASCIIToUTF16("www.cnn.com"), base::string16::npos, kMaxMatches);
640 ASSERT_EQ(1U, matches.size());
641 EXPECT_TRUE(matches[0].can_inline());
643 // "tp://www.cnn.com" - not found because we don't allow tp as a mid-term
645 matches = url_index_->HistoryItemsForTerms(
646 ASCIIToUTF16("tp://www.cnn.com"), base::string16::npos, kMaxMatches);
647 ASSERT_EQ(0U, matches.size());
650 TEST_F(InMemoryURLIndexTest, ProperStringMatching) {
651 // Search for the following with the expected results:
652 // "atdmt view" - found
653 // "atdmt.view" - not found
654 // "view.atdmt" - found
655 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
656 ASCIIToUTF16("atdmt view"), base::string16::npos, kMaxMatches);
657 ASSERT_EQ(1U, matches.size());
658 matches = url_index_->HistoryItemsForTerms(
659 ASCIIToUTF16("atdmt.view"), base::string16::npos, kMaxMatches);
660 ASSERT_EQ(0U, matches.size());
661 matches = url_index_->HistoryItemsForTerms(
662 ASCIIToUTF16("view.atdmt"), base::string16::npos, kMaxMatches);
663 ASSERT_EQ(1U, matches.size());
666 TEST_F(InMemoryURLIndexTest, HugeResultSet) {
667 // Create a huge set of qualifying history items.
668 for (URLID row_id = 5000; row_id < 6000; ++row_id) {
669 URLRow new_row(GURL("http://www.brokeandaloneinmanitoba.com/"), row_id);
670 new_row.set_last_visit(base::Time::Now());
671 EXPECT_TRUE(UpdateURL(new_row));
674 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
675 ASCIIToUTF16("b"), base::string16::npos, kMaxMatches);
676 URLIndexPrivateData& private_data(*GetPrivateData());
677 ASSERT_EQ(kMaxMatches, matches.size());
678 // There are 7 matches already in the database.
679 ASSERT_EQ(1008U, private_data.pre_filter_item_count_);
680 ASSERT_EQ(500U, private_data.post_filter_item_count_);
681 ASSERT_EQ(kMaxMatches, private_data.post_scoring_item_count_);
685 // Flaky on windows trybots: http://crbug.com/351500
686 #define MAYBE_TitleSearch DISABLED_TitleSearch
688 #define MAYBE_TitleSearch TitleSearch
690 TEST_F(InMemoryURLIndexTest, MAYBE_TitleSearch) {
691 // Signal if someone has changed the test DB.
692 EXPECT_EQ(29U, GetPrivateData()->history_info_map_.size());
694 // Ensure title is being searched.
695 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
696 ASCIIToUTF16("MORTGAGE RATE DROPS"), base::string16::npos, kMaxMatches);
697 ASSERT_EQ(1U, matches.size());
699 // Verify that we got back the result we expected.
700 EXPECT_EQ(1, matches[0].url_info.id());
701 EXPECT_EQ("http://www.reuters.com/article/idUSN0839880620100708",
702 matches[0].url_info.url().spec());
703 EXPECT_EQ(ASCIIToUTF16(
704 "UPDATE 1-US 30-yr mortgage rate drops to new record low | Reuters"),
705 matches[0].url_info.title());
708 TEST_F(InMemoryURLIndexTest, TitleChange) {
709 // Verify current title terms retrieves desired item.
710 base::string16 original_terms =
711 ASCIIToUTF16("lebronomics could high taxes influence");
712 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
713 original_terms, base::string16::npos, kMaxMatches);
714 ASSERT_EQ(1U, matches.size());
716 // Verify that we got back the result we expected.
717 const URLID expected_id = 3;
718 EXPECT_EQ(expected_id, matches[0].url_info.id());
719 EXPECT_EQ("http://www.businessandmedia.org/articles/2010/20100708120415.aspx",
720 matches[0].url_info.url().spec());
721 EXPECT_EQ(ASCIIToUTF16(
722 "LeBronomics: Could High Taxes Influence James' Team Decision?"),
723 matches[0].url_info.title());
724 URLRow old_row(matches[0].url_info);
726 // Verify new title terms retrieves nothing.
727 base::string16 new_terms = ASCIIToUTF16("does eat oats little lambs ivy");
728 matches = url_index_->HistoryItemsForTerms(
729 new_terms, base::string16::npos, kMaxMatches);
730 ASSERT_EQ(0U, matches.size());
733 old_row.set_title(ASCIIToUTF16("Does eat oats and little lambs eat ivy"));
734 EXPECT_TRUE(UpdateURL(old_row));
736 // Verify we get the row using the new terms but not the original terms.
737 matches = url_index_->HistoryItemsForTerms(
738 new_terms, base::string16::npos, kMaxMatches);
739 ASSERT_EQ(1U, matches.size());
740 EXPECT_EQ(expected_id, matches[0].url_info.id());
741 matches = url_index_->HistoryItemsForTerms(
742 original_terms, base::string16::npos, kMaxMatches);
743 ASSERT_EQ(0U, matches.size());
746 TEST_F(InMemoryURLIndexTest, NonUniqueTermCharacterSets) {
747 // The presence of duplicate characters should succeed. Exercise by cycling
748 // through a string with several duplicate characters.
749 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
750 ASCIIToUTF16("ABRA"), base::string16::npos, kMaxMatches);
751 ASSERT_EQ(1U, matches.size());
752 EXPECT_EQ(28, matches[0].url_info.id());
753 EXPECT_EQ("http://www.ddj.com/windows/184416623",
754 matches[0].url_info.url().spec());
756 matches = url_index_->HistoryItemsForTerms(
757 ASCIIToUTF16("ABRACAD"), base::string16::npos, kMaxMatches);
758 ASSERT_EQ(1U, matches.size());
759 EXPECT_EQ(28, matches[0].url_info.id());
761 matches = url_index_->HistoryItemsForTerms(
762 ASCIIToUTF16("ABRACADABRA"), base::string16::npos, kMaxMatches);
763 ASSERT_EQ(1U, matches.size());
764 EXPECT_EQ(28, matches[0].url_info.id());
766 matches = url_index_->HistoryItemsForTerms(
767 ASCIIToUTF16("ABRACADABR"), base::string16::npos, kMaxMatches);
768 ASSERT_EQ(1U, matches.size());
769 EXPECT_EQ(28, matches[0].url_info.id());
771 matches = url_index_->HistoryItemsForTerms(
772 ASCIIToUTF16("ABRACA"), base::string16::npos, kMaxMatches);
773 ASSERT_EQ(1U, matches.size());
774 EXPECT_EQ(28, matches[0].url_info.id());
777 TEST_F(InMemoryURLIndexTest, TypedCharacterCaching) {
778 // Verify that match results for previously typed characters are retained
779 // (in the term_char_word_set_cache_) and reused, if possible, in future
782 URLIndexPrivateData::SearchTermCacheMap& cache(
783 GetPrivateData()->search_term_cache_);
785 // The cache should be empty at this point.
786 EXPECT_EQ(0U, cache.size());
788 // Now simulate typing search terms into the omnibox and check the state of
789 // the cache as each item is 'typed'.
791 // Simulate typing "r" giving "r" in the simulated omnibox. The results for
792 // 'r' will be not cached because it is only 1 character long.
793 url_index_->HistoryItemsForTerms(
794 ASCIIToUTF16("r"), base::string16::npos, kMaxMatches);
795 EXPECT_EQ(0U, cache.size());
797 // Simulate typing "re" giving "r re" in the simulated omnibox.
798 // 're' should be cached at this point but not 'r' as it is a single
800 url_index_->HistoryItemsForTerms(
801 ASCIIToUTF16("r re"), base::string16::npos, kMaxMatches);
802 ASSERT_EQ(1U, cache.size());
803 CheckTerm(cache, ASCIIToUTF16("re"));
805 // Simulate typing "reco" giving "r re reco" in the simulated omnibox.
806 // 're' and 'reco' should be cached at this point but not 'r' as it is a
808 url_index_->HistoryItemsForTerms(
809 ASCIIToUTF16("r re reco"), base::string16::npos, kMaxMatches);
810 ASSERT_EQ(2U, cache.size());
811 CheckTerm(cache, ASCIIToUTF16("re"));
812 CheckTerm(cache, ASCIIToUTF16("reco"));
814 // Simulate typing "mort".
815 // Since we now have only one search term, the cached results for 're' and
816 // 'reco' should be purged, giving us only 1 item in the cache (for 'mort').
817 url_index_->HistoryItemsForTerms(
818 ASCIIToUTF16("mort"), base::string16::npos, kMaxMatches);
819 ASSERT_EQ(1U, cache.size());
820 CheckTerm(cache, ASCIIToUTF16("mort"));
822 // Simulate typing "reco" giving "mort reco" in the simulated omnibox.
823 url_index_->HistoryItemsForTerms(
824 ASCIIToUTF16("mort reco"), base::string16::npos, kMaxMatches);
825 ASSERT_EQ(2U, cache.size());
826 CheckTerm(cache, ASCIIToUTF16("mort"));
827 CheckTerm(cache, ASCIIToUTF16("reco"));
829 // Simulate a <DELETE> by removing the 'reco' and adding back the 'rec'.
830 url_index_->HistoryItemsForTerms(
831 ASCIIToUTF16("mort rec"), base::string16::npos, kMaxMatches);
832 ASSERT_EQ(2U, cache.size());
833 CheckTerm(cache, ASCIIToUTF16("mort"));
834 CheckTerm(cache, ASCIIToUTF16("rec"));
837 TEST_F(InMemoryURLIndexTest, AddNewRows) {
838 // Verify that the row we're going to add does not already exist.
839 URLID new_row_id = 87654321;
840 // Newly created URLRows get a last_visit time of 'right now' so it should
841 // qualify as a quick result candidate.
842 EXPECT_TRUE(url_index_->HistoryItemsForTerms(
843 ASCIIToUTF16("brokeandalone"), base::string16::npos, kMaxMatches)
847 URLRow new_row(GURL("http://www.brokeandaloneinmanitoba.com/"), new_row_id++);
848 new_row.set_last_visit(base::Time::Now());
849 EXPECT_TRUE(UpdateURL(new_row));
851 // Verify that we can retrieve it.
852 EXPECT_EQ(1U, url_index_->HistoryItemsForTerms(
853 ASCIIToUTF16("brokeandalone"), base::string16::npos, kMaxMatches).size());
855 // Add it again just to be sure that is harmless and that it does not update
857 EXPECT_FALSE(UpdateURL(new_row));
858 EXPECT_EQ(1U, url_index_->HistoryItemsForTerms(
859 ASCIIToUTF16("brokeandalone"), base::string16::npos, kMaxMatches).size());
861 // Make up an URL that does not qualify and try to add it.
862 URLRow unqualified_row(GURL("http://www.brokeandaloneinmanitoba.com/"),
864 EXPECT_FALSE(UpdateURL(new_row));
867 TEST_F(InMemoryURLIndexTest, DeleteRows) {
868 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
869 ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches);
870 ASSERT_EQ(1U, matches.size());
872 // Delete the URL then search again.
873 EXPECT_TRUE(DeleteURL(matches[0].url_info.url()));
874 EXPECT_TRUE(url_index_->HistoryItemsForTerms(
875 ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches).empty());
877 // Make up an URL that does not exist in the database and delete it.
878 GURL url("http://www.hokeypokey.com/putyourrightfootin.html");
879 EXPECT_FALSE(DeleteURL(url));
882 TEST_F(InMemoryURLIndexTest, ExpireRow) {
883 ScoredHistoryMatches matches = url_index_->HistoryItemsForTerms(
884 ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches);
885 ASSERT_EQ(1U, matches.size());
887 // Determine the row id for the result, remember that id, broadcast a
888 // delete notification, then ensure that the row has been deleted.
889 URLsDeletedDetails deleted_details;
890 deleted_details.all_history = false;
891 deleted_details.rows.push_back(matches[0].url_info);
892 Observe(chrome::NOTIFICATION_HISTORY_URLS_DELETED,
893 content::Source<InMemoryURLIndexTest>(this),
894 content::Details<history::HistoryDetails>(&deleted_details));
895 EXPECT_TRUE(url_index_->HistoryItemsForTerms(
896 ASCIIToUTF16("DrudgeReport"), base::string16::npos, kMaxMatches).empty());
899 TEST_F(InMemoryURLIndexTest, WhitelistedURLs) {
901 const std::string url_spec;
902 const bool expected_is_whitelisted;
904 // URLs with whitelisted schemes.
905 { "about:histograms", true },
906 { "chrome://settings", true },
907 { "file://localhost/Users/joeschmoe/sekrets", true },
908 { "ftp://public.mycompany.com/myfile.txt", true },
909 { "http://www.google.com/translate", true },
910 { "https://www.gmail.com/", true },
911 { "mailto:support@google.com", true },
912 // URLs with unacceptable schemes.
913 { "aaa://www.dummyhost.com;frammy", false },
914 { "aaas://www.dummyhost.com;frammy", false },
915 { "acap://suzie@somebody.com", false },
916 { "cap://cal.example.com/Company/Holidays", false },
917 { "cid:foo4*foo1@bar.net", false },
918 { "crid://example.com/foobar", false },
919 { "data:image/png;base64,iVBORw0KGgoAAAANSUhE=", false },
920 { "dict://dict.org/d:shortcake:", false },
921 { "dns://192.168.1.1/ftp.example.org?type=A", false },
922 { "fax:+358.555.1234567", false },
923 { "geo:13.4125,103.8667", false },
924 { "go:Mercedes%20Benz", false },
925 { "gopher://farnsworth.ca:666/gopher", false },
926 { "h323:farmer-john;sixpence", false },
927 { "iax:johnQ@example.com/12022561414", false },
928 { "icap://icap.net/service?mode=translate&lang=french", false },
929 { "im:fred@example.com", false },
930 { "imap://michael@minbari.org/users.*", false },
931 { "info:ddc/22/eng//004.678", false },
932 { "ipp://example.com/printer/fox", false },
933 { "iris:dreg1//example.com/local/myhosts", false },
934 { "iris.beep:dreg1//example.com/local/myhosts", false },
935 { "iris.lws:dreg1//example.com/local/myhosts", false },
936 { "iris.xpc:dreg1//example.com/local/myhosts", false },
937 { "iris.xpcs:dreg1//example.com/local/myhosts", false },
938 { "ldap://ldap.itd.umich.edu/o=University%20of%20Michigan,c=US", false },
939 { "mid:foo4%25foo1@bar.net", false },
940 { "modem:+3585551234567;type=v32b?7e1;type=v110", false },
941 { "msrp://atlanta.example.com:7654/jshA7weztas;tcp", false },
942 { "msrps://atlanta.example.com:7654/jshA7weztas;tcp", false },
943 { "news:colorectal.info.banned", false },
944 { "nfs://server/d/e/f", false },
945 { "nntp://www.example.com:6543/info.comp.lies/1234", false },
946 { "pop://rg;AUTH=+APOP@mail.mycompany.com:8110", false },
947 { "pres:fred@example.com", false },
948 { "prospero://host.dom//pros/name", false },
949 { "rsync://syler@lost.com/Source", false },
950 { "rtsp://media.example.com:554/twister/audiotrack", false },
951 { "service:acap://some.where.net;authentication=KERBEROSV4", false },
952 { "shttp://www.terces.com/secret", false },
953 { "sieve://example.com//script", false },
954 { "sip:+1-212-555-1212:1234@gateway.com;user=phone", false },
955 { "sips:+1-212-555-1212:1234@gateway.com;user=phone", false },
956 { "sms:+15105551212?body=hello%20there", false },
957 { "snmp://tester5@example.com:8161/bridge1;800002b804616263", false },
958 { "soap.beep://stockquoteserver.example.com/StockQuote", false },
959 { "soap.beeps://stockquoteserver.example.com/StockQuote", false },
960 { "tag:blogger.com,1999:blog-555", false },
961 { "tel:+358-555-1234567;postd=pp22", false },
962 { "telnet://mayor_margie:one2rule4All@www.mycity.com:6789/", false },
963 { "tftp://example.com/mystartupfile", false },
964 { "tip://123.123.123.123/?urn:xopen:xid", false },
965 { "tv:nbc.com", false },
966 { "urn:foo:A123,456", false },
967 { "vemmi://zeus.mctel.fr/demo", false },
968 { "wais://www.mydomain.net:8765/mydatabase", false },
969 { "xmpp:node@example.com", false },
970 { "xmpp://guest@example.com", false },
973 URLIndexPrivateData& private_data(*GetPrivateData());
974 const std::set<std::string>& whitelist(scheme_whitelist());
975 for (size_t i = 0; i < ARRAYSIZE_UNSAFE(data); ++i) {
976 GURL url(data[i].url_spec);
977 EXPECT_EQ(data[i].expected_is_whitelisted,
978 private_data.URLSchemeIsWhitelisted(url, whitelist));
982 TEST_F(InMemoryURLIndexTest, ReadVisitsFromHistory) {
983 const HistoryInfoMap& history_info_map = GetPrivateData()->history_info_map_;
985 // Check (for URL with id 1) that the number of visits and their
986 // transition types are what we expect. We don't bother checking
987 // the timestamps because it's too much trouble. (The timestamps go
988 // through a transformation in InMemoryURLIndexTest::SetUp(). We
989 // assume that if the count and transitions show up with the right
990 // information, we're getting the right information from the history
992 HistoryInfoMap::const_iterator entry = history_info_map.find(1);
993 ASSERT_TRUE(entry != history_info_map.end());
995 const VisitInfoVector& visits = entry->second.visits;
996 EXPECT_EQ(3u, visits.size());
997 EXPECT_EQ(0u, visits[0].second);
998 EXPECT_EQ(1u, visits[1].second);
999 EXPECT_EQ(0u, visits[2].second);
1002 // Ditto but for URL with id 35.
1003 entry = history_info_map.find(35);
1004 ASSERT_TRUE(entry != history_info_map.end());
1006 const VisitInfoVector& visits = entry->second.visits;
1007 EXPECT_EQ(2u, visits.size());
1008 EXPECT_EQ(1u, visits[0].second);
1009 EXPECT_EQ(1u, visits[1].second);
1012 // The URL with id 32 has many visits listed in the database, but we
1013 // should only read the most recent 10 (which are all transition type 0).
1014 entry = history_info_map.find(32);
1015 ASSERT_TRUE(entry != history_info_map.end());
1017 const VisitInfoVector& visits = entry->second.visits;
1018 EXPECT_EQ(10u, visits.size());
1019 for (size_t i = 0; i < visits.size(); ++i)
1020 EXPECT_EQ(0u, visits[i].second);
1024 TEST_F(InMemoryURLIndexTest, CacheSaveRestore) {
1025 base::ScopedTempDir temp_directory;
1026 ASSERT_TRUE(temp_directory.CreateUniqueTempDir());
1027 set_history_dir(temp_directory.path());
1029 URLIndexPrivateData& private_data(*GetPrivateData());
1031 // Ensure that there is really something there to be saved.
1032 EXPECT_FALSE(private_data.word_list_.empty());
1033 // available_words_ will already be empty since we have freshly built the
1034 // data set for this test.
1035 EXPECT_TRUE(private_data.available_words_.empty());
1036 EXPECT_FALSE(private_data.word_map_.empty());
1037 EXPECT_FALSE(private_data.char_word_map_.empty());
1038 EXPECT_FALSE(private_data.word_id_history_map_.empty());
1039 EXPECT_FALSE(private_data.history_id_word_map_.empty());
1040 EXPECT_FALSE(private_data.history_info_map_.empty());
1041 EXPECT_FALSE(private_data.word_starts_map_.empty());
1043 // Make sure the data we have was built from history. (Version 0
1044 // means rebuilt from history.)
1045 EXPECT_EQ(0, private_data.restored_cache_version_);
1047 // Capture the current private data for later comparison to restored data.
1048 scoped_refptr<URLIndexPrivateData> old_data(private_data.Duplicate());
1049 const base::Time rebuild_time = private_data.last_time_rebuilt_from_history_;
1051 // Save then restore our private data.
1052 CacheFileSaverObserver save_observer(&message_loop_);
1053 url_index_->set_save_cache_observer(&save_observer);
1054 PostSaveToCacheFileTask();
1055 message_loop_.Run();
1056 EXPECT_TRUE(save_observer.succeeded_);
1058 // Clear and then prove it's clear before restoring.
1060 EXPECT_TRUE(private_data.word_list_.empty());
1061 EXPECT_TRUE(private_data.available_words_.empty());
1062 EXPECT_TRUE(private_data.word_map_.empty());
1063 EXPECT_TRUE(private_data.char_word_map_.empty());
1064 EXPECT_TRUE(private_data.word_id_history_map_.empty());
1065 EXPECT_TRUE(private_data.history_id_word_map_.empty());
1066 EXPECT_TRUE(private_data.history_info_map_.empty());
1067 EXPECT_TRUE(private_data.word_starts_map_.empty());
1069 HistoryIndexRestoreObserver restore_observer(
1070 base::Bind(&base::MessageLoop::Quit, base::Unretained(&message_loop_)));
1071 url_index_->set_restore_cache_observer(&restore_observer);
1072 PostRestoreFromCacheFileTask();
1073 message_loop_.Run();
1074 EXPECT_TRUE(restore_observer.succeeded());
1076 URLIndexPrivateData& new_data(*GetPrivateData());
1078 // Make sure the data we have was reloaded from cache. (Version 0
1079 // means rebuilt from history; anything else means restored from
1080 // a cache version.) Also, the rebuild time should not have changed.
1081 EXPECT_GT(new_data.restored_cache_version_, 0);
1082 EXPECT_EQ(rebuild_time, new_data.last_time_rebuilt_from_history_);
1084 // Compare the captured and restored for equality.
1085 ExpectPrivateDataEqual(*old_data.get(), new_data);
1088 TEST_F(InMemoryURLIndexTest, RebuildFromHistoryIfCacheOld) {
1089 base::ScopedTempDir temp_directory;
1090 ASSERT_TRUE(temp_directory.CreateUniqueTempDir());
1091 set_history_dir(temp_directory.path());
1093 URLIndexPrivateData& private_data(*GetPrivateData());
1095 // Ensure that there is really something there to be saved.
1096 EXPECT_FALSE(private_data.word_list_.empty());
1097 // available_words_ will already be empty since we have freshly built the
1098 // data set for this test.
1099 EXPECT_TRUE(private_data.available_words_.empty());
1100 EXPECT_FALSE(private_data.word_map_.empty());
1101 EXPECT_FALSE(private_data.char_word_map_.empty());
1102 EXPECT_FALSE(private_data.word_id_history_map_.empty());
1103 EXPECT_FALSE(private_data.history_id_word_map_.empty());
1104 EXPECT_FALSE(private_data.history_info_map_.empty());
1105 EXPECT_FALSE(private_data.word_starts_map_.empty());
1107 // Make sure the data we have was built from history. (Version 0
1108 // means rebuilt from history.)
1109 EXPECT_EQ(0, private_data.restored_cache_version_);
1111 // Overwrite the build time so that we'll think the data is too old
1112 // and rebuild the cache from history.
1113 const base::Time fake_rebuild_time =
1114 private_data.last_time_rebuilt_from_history_ -
1115 base::TimeDelta::FromDays(30);
1116 private_data.last_time_rebuilt_from_history_ = fake_rebuild_time;
1118 // Capture the current private data for later comparison to restored data.
1119 scoped_refptr<URLIndexPrivateData> old_data(private_data.Duplicate());
1121 // Save then restore our private data.
1122 CacheFileSaverObserver save_observer(&message_loop_);
1123 url_index_->set_save_cache_observer(&save_observer);
1124 PostSaveToCacheFileTask();
1125 message_loop_.Run();
1126 EXPECT_TRUE(save_observer.succeeded_);
1128 // Clear and then prove it's clear before restoring.
1130 EXPECT_TRUE(private_data.word_list_.empty());
1131 EXPECT_TRUE(private_data.available_words_.empty());
1132 EXPECT_TRUE(private_data.word_map_.empty());
1133 EXPECT_TRUE(private_data.char_word_map_.empty());
1134 EXPECT_TRUE(private_data.word_id_history_map_.empty());
1135 EXPECT_TRUE(private_data.history_id_word_map_.empty());
1136 EXPECT_TRUE(private_data.history_info_map_.empty());
1137 EXPECT_TRUE(private_data.word_starts_map_.empty());
1139 HistoryIndexRestoreObserver restore_observer(
1140 base::Bind(&base::MessageLoop::Quit, base::Unretained(&message_loop_)));
1141 url_index_->set_restore_cache_observer(&restore_observer);
1142 PostRestoreFromCacheFileTask();
1143 message_loop_.Run();
1144 EXPECT_TRUE(restore_observer.succeeded());
1146 URLIndexPrivateData& new_data(*GetPrivateData());
1148 // Make sure the data we have was rebuilt from history. (Version 0
1149 // means rebuilt from history; anything else means restored from
1150 // a cache version.)
1151 EXPECT_EQ(0, new_data.restored_cache_version_);
1152 EXPECT_NE(fake_rebuild_time, new_data.last_time_rebuilt_from_history_);
1154 // Compare the captured and restored for equality.
1155 ExpectPrivateDataEqual(*old_data.get(), new_data);
1158 class InMemoryURLIndexCacheTest : public testing::Test {
1160 InMemoryURLIndexCacheTest() {}
1163 virtual void SetUp() OVERRIDE;
1165 // Pass-through functions to simplify our friendship with InMemoryURLIndex.
1166 void set_history_dir(const base::FilePath& dir_path);
1167 bool GetCacheFilePath(base::FilePath* file_path) const;
1169 base::ScopedTempDir temp_dir_;
1170 scoped_ptr<InMemoryURLIndex> url_index_;
1173 void InMemoryURLIndexCacheTest::SetUp() {
1174 ASSERT_TRUE(temp_dir_.CreateUniqueTempDir());
1175 HistoryClient history_client;
1176 base::FilePath path(temp_dir_.path());
1177 url_index_.reset(new InMemoryURLIndex(
1178 NULL, path, "en,ja,hi,zh", &history_client));
1181 void InMemoryURLIndexCacheTest::set_history_dir(
1182 const base::FilePath& dir_path) {
1183 return url_index_->set_history_dir(dir_path);
1186 bool InMemoryURLIndexCacheTest::GetCacheFilePath(
1187 base::FilePath* file_path) const {
1189 return url_index_->GetCacheFilePath(file_path);
1192 TEST_F(InMemoryURLIndexCacheTest, CacheFilePath) {
1193 base::FilePath expectedPath =
1194 temp_dir_.path().Append(FILE_PATH_LITERAL("History Provider Cache"));
1195 std::vector<base::FilePath::StringType> expected_parts;
1196 expectedPath.GetComponents(&expected_parts);
1197 base::FilePath full_file_path;
1198 ASSERT_TRUE(GetCacheFilePath(&full_file_path));
1199 std::vector<base::FilePath::StringType> actual_parts;
1200 full_file_path.GetComponents(&actual_parts);
1201 ASSERT_EQ(expected_parts.size(), actual_parts.size());
1202 size_t count = expected_parts.size();
1203 for (size_t i = 0; i < count; ++i)
1204 EXPECT_EQ(expected_parts[i], actual_parts[i]);
1205 // Must clear the history_dir_ to satisfy the dtor's DCHECK.
1206 set_history_dir(base::FilePath());
1209 } // namespace history