1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "base/file_util.h"
6 #include "base/memory/ref_counted.h"
7 #include "base/metrics/histogram.h"
8 #include "base/strings/string_split.h"
9 #include "base/strings/string_util.h"
10 #include "chrome/browser/history/history_types.h"
11 #include "chrome/browser/history/top_sites.h"
12 #include "chrome/browser/history/top_sites_database.h"
13 #include "chrome/common/thumbnail_score.h"
14 #include "sql/connection.h"
15 #include "sql/recovery.h"
16 #include "sql/statement.h"
17 #include "sql/transaction.h"
18 #include "third_party/sqlite/sqlite3.h"
19
20 // Description of database table:
21 //
22 // thumbnails
23 // url URL of the sites for which we have a thumbnail.
24 // url_rank Index of the URL in that thumbnail, 0-based. The thumbnail
25 // with the highest rank will be the next one evicted. Forced
26 // thumbnails have a rank of -1.
27 // title The title to display under that thumbnail.
28 // redirects A space separated list of URLs that are known to redirect
29 // to this url.
30 // boring_score How "boring" that thumbnail is. See ThumbnailScore.
31 // good_clipping True if the thumbnail was clipped from the bottom, keeping
32 // the entire width of the window. See ThumbnailScore.
33 // at_top True if the thumbnail was captured at the top of the
34 // website.
35 // last_updated The time at which this thumbnail was last updated.
36 // load_completed True if the thumbnail was captured after the page load was
37 // completed.
38 // last_forced If this is a forced thumbnail, records the last time it
39 // was forced. If it's not a forced thumbnail, 0.
40
41 namespace {
42
43 // For this database, schema migrations are deprecated after two
44 // years. This means that the oldest non-deprecated version should be
45 // two years old or greater (thus the migrations to get there are
46 // older). Databases containing deprecated versions will be cleared
47 // at startup. Since this database is a cache, losing old data is not
48 // fatal (in fact, very old data may be expired immediately at startup
49 // anyhow).
50
51 // Version 3: b6d6a783/r231648 by beaudoin@chromium.org on 2013-10-29
52 // Version 2: eb0b24e6/r87284 by satorux@chromium.org on 2011-05-31
53 // Version 1: 809cc4d8/r64072 by sky@chromium.org on 2010-10-27 (deprecated)
54
55 // NOTE(shess): When changing the version, add a new golden file for
56 // the new version and a test to verify that Init() works with it.
57 // NOTE(shess): RecoverDatabaseOrRaze() depends on the specific
58 // version number. The code is subtle and in development, contact me
59 // if the necessary changes are not obvious.
60 static const int kVersionNumber = 3;
61 static const int kDeprecatedVersionNumber = 1; // and earlier.
62
InitTables(sql::Connection * db)63 bool InitTables(sql::Connection* db) {
64 const char kThumbnailsSql[] =
65 "CREATE TABLE IF NOT EXISTS thumbnails ("
66 "url LONGVARCHAR PRIMARY KEY,"
67 "url_rank INTEGER,"
68 "title LONGVARCHAR,"
69 "thumbnail BLOB,"
70 "redirects LONGVARCHAR,"
71 "boring_score DOUBLE DEFAULT 1.0,"
72 "good_clipping INTEGER DEFAULT 0,"
73 "at_top INTEGER DEFAULT 0,"
74 "last_updated INTEGER DEFAULT 0,"
75 "load_completed INTEGER DEFAULT 0,"
76 "last_forced INTEGER DEFAULT 0)";
77 return db->Execute(kThumbnailsSql);
78 }
79
80 // Encodes redirects into a string.
GetRedirects(const history::MostVisitedURL & url)81 std::string GetRedirects(const history::MostVisitedURL& url) {
82 std::vector<std::string> redirects;
83 for (size_t i = 0; i < url.redirects.size(); i++)
84 redirects.push_back(url.redirects[i].spec());
85 return JoinString(redirects, ' ');
86 }
87
88 // Decodes redirects from a string and sets them for the url.
SetRedirects(const std::string & redirects,history::MostVisitedURL * url)89 void SetRedirects(const std::string& redirects, history::MostVisitedURL* url) {
90 std::vector<std::string> redirects_vector;
91 base::SplitStringAlongWhitespace(redirects, &redirects_vector);
92 for (size_t i = 0; i < redirects_vector.size(); ++i)
93 url->redirects.push_back(GURL(redirects_vector[i]));
94 }
95
96 // Track various failure (and success) cases in recovery code.
97 //
98 // TODO(shess): The recovery code is complete, but by nature runs in challenging
99 // circumstances, so initially the default error response is to leave the
100 // existing database in place. This histogram is intended to expose the
101 // failures seen in the fleet. Frequent failure cases can be explored more
102 // deeply to see if the complexity to fix them is warranted. Infrequent failure
103 // cases can be resolved by marking the database unrecoverable (which will
104 // delete the data).
105 //
106 // Based on the thumbnail_database.cc recovery code, FAILED_SCOPER should
107 // dominate, followed distantly by FAILED_META, with few or no other failures.
108 enum RecoveryEventType {
109 // Database successfully recovered.
110 RECOVERY_EVENT_RECOVERED = 0,
111
112 // Database successfully deprecated.
113 RECOVERY_EVENT_DEPRECATED,
114
115 // Sqlite.RecoveryEvent can usually be used to get more detail about the
116 // specific failure (see sql/recovery.cc).
117 RECOVERY_EVENT_FAILED_SCOPER,
118 RECOVERY_EVENT_FAILED_META_VERSION,
119 RECOVERY_EVENT_FAILED_META_WRONG_VERSION,
120 RECOVERY_EVENT_FAILED_META_INIT,
121 RECOVERY_EVENT_FAILED_SCHEMA_INIT,
122 RECOVERY_EVENT_FAILED_AUTORECOVER_THUMBNAILS,
123 RECOVERY_EVENT_FAILED_COMMIT,
124
125 // Track invariants resolved by FixThumbnailsTable().
126 RECOVERY_EVENT_INVARIANT_RANK,
127 RECOVERY_EVENT_INVARIANT_REDIRECT,
128 RECOVERY_EVENT_INVARIANT_CONTIGUOUS,
129
130 // Always keep this at the end.
131 RECOVERY_EVENT_MAX,
132 };
133
RecordRecoveryEvent(RecoveryEventType recovery_event)134 void RecordRecoveryEvent(RecoveryEventType recovery_event) {
135 UMA_HISTOGRAM_ENUMERATION("History.TopSitesRecovery",
136 recovery_event, RECOVERY_EVENT_MAX);
137 }
138
139 // Most corruption comes down to atomic updates between pages being broken
140 // somehow. This can result in either missing data, or overlapping data,
141 // depending on the operation broken. This table has large rows, which will use
142 // overflow pages, so it is possible (though unlikely) that a chain could fit
143 // together and yield a row with errors.
FixThumbnailsTable(sql::Connection * db)144 void FixThumbnailsTable(sql::Connection* db) {
145 // Enforce invariant separating forced and non-forced thumbnails.
146 const char kFixRankSql[] =
147 "DELETE FROM thumbnails "
148 "WHERE (url_rank = -1 AND last_forced = 0) "
149 "OR (url_rank <> -1 AND last_forced <> 0)";
150 ignore_result(db->Execute(kFixRankSql));
151 if (db->GetLastChangeCount() > 0)
152 RecordRecoveryEvent(RECOVERY_EVENT_INVARIANT_RANK);
153
154 // Enforce invariant that url is in its own redirects.
155 const char kFixRedirectsSql[] =
156 "DELETE FROM thumbnails "
157 "WHERE url <> substr(redirects, -length(url), length(url))";
158 ignore_result(db->Execute(kFixRedirectsSql));
159 if (db->GetLastChangeCount() > 0)
160 RecordRecoveryEvent(RECOVERY_EVENT_INVARIANT_REDIRECT);
161
162 // Enforce invariant that url_rank>=0 forms a contiguous series.
163 // TODO(shess): I have not found an UPDATE+SUBSELECT method of managing this.
164 // It can be done with a temporary table and a subselect, but doing it
165 // manually is easier to follow. Another option would be to somehow integrate
166 // the renumbering into the table recovery code.
167 const char kByRankSql[] =
168 "SELECT url_rank, rowid FROM thumbnails WHERE url_rank <> -1 "
169 "ORDER BY url_rank";
170 sql::Statement select_statement(db->GetUniqueStatement(kByRankSql));
171
172 const char kAdjustRankSql[] =
173 "UPDATE thumbnails SET url_rank = ? WHERE rowid = ?";
174 sql::Statement update_statement(db->GetUniqueStatement(kAdjustRankSql));
175
176 // Update any rows where |next_rank| doesn't match |url_rank|.
177 int next_rank = 0;
178 bool adjusted = false;
179 while (select_statement.Step()) {
180 const int url_rank = select_statement.ColumnInt(0);
181 if (url_rank != next_rank) {
182 adjusted = true;
183 update_statement.Reset(true);
184 update_statement.BindInt(0, next_rank);
185 update_statement.BindInt64(1, select_statement.ColumnInt64(1));
186 update_statement.Run();
187 }
188 ++next_rank;
189 }
190 if (adjusted)
191 RecordRecoveryEvent(RECOVERY_EVENT_INVARIANT_CONTIGUOUS);
192 }
193
194 // Recover the database to the extent possible, razing it if recovery is not
195 // possible.
RecoverDatabaseOrRaze(sql::Connection * db,const base::FilePath & db_path)196 void RecoverDatabaseOrRaze(sql::Connection* db, const base::FilePath& db_path) {
197 // NOTE(shess): If the version changes, review this code.
198 DCHECK_EQ(3, kVersionNumber);
199
200 // It is almost certain that some operation against |db| will fail, prevent
201 // reentry.
202 db->reset_error_callback();
203
204 // For generating histogram stats.
205 size_t thumbnails_recovered = 0;
206 int64 original_size = 0;
207 base::GetFileSize(db_path, &original_size);
208
209 scoped_ptr<sql::Recovery> recovery = sql::Recovery::Begin(db, db_path);
210 if (!recovery) {
211 RecordRecoveryEvent(RECOVERY_EVENT_FAILED_SCOPER);
212 return;
213 }
214
215 // Setup the meta recovery table and fetch the version number from the corrupt
216 // database.
217 int version = 0;
218 if (!recovery->SetupMeta() || !recovery->GetMetaVersionNumber(&version)) {
219 // TODO(shess): Prior histograms indicate all failures are in creating the
220 // recover virtual table for corrupt.meta. The table may not exist, or the
221 // database may be too far gone. Either way, unclear how to resolve.
222 sql::Recovery::Rollback(recovery.Pass());
223 RecordRecoveryEvent(RECOVERY_EVENT_FAILED_META_VERSION);
224 return;
225 }
226
227 // This code runs in a context which may be able to read version information
228 // that the regular deprecation path cannot. The effect of this code will be
229 // to raze the database.
230 if (version <= kDeprecatedVersionNumber) {
231 sql::Recovery::Unrecoverable(recovery.Pass());
232 RecordRecoveryEvent(RECOVERY_EVENT_DEPRECATED);
233 return;
234 }
235
236 // TODO(shess): Earlier versions have been deprecated, later versions should
237 // be impossible. Unrecoverable() seems like a feasible response if this is
238 // infrequent enough.
239 if (version != 2 && version != 3) {
240 RecordRecoveryEvent(RECOVERY_EVENT_FAILED_META_WRONG_VERSION);
241 sql::Recovery::Rollback(recovery.Pass());
242 return;
243 }
244
245 // Both v2 and v3 recover to current schema version.
246 sql::MetaTable recover_meta_table;
247 if (!recover_meta_table.Init(recovery->db(), kVersionNumber,
248 kVersionNumber)) {
249 sql::Recovery::Rollback(recovery.Pass());
250 RecordRecoveryEvent(RECOVERY_EVENT_FAILED_META_INIT);
251 return;
252 }
253
254 // Create a fresh version of the schema. The recovery code uses
255 // conflict-resolution to handle duplicates, so any indices are necessary.
256 if (!InitTables(recovery->db())) {
257 // TODO(shess): Unable to create the new schema in the new database. The
258 // new database should be a temporary file, so being unable to work with it
259 // is pretty unclear.
260 //
261 // What are the potential responses, even? The recovery database could be
262 // opened as in-memory. If the temp database had a filesystem problem and
263 // the temp filesystem differs from the main database, then that could fix
264 // it.
265 sql::Recovery::Rollback(recovery.Pass());
266 RecordRecoveryEvent(RECOVERY_EVENT_FAILED_SCHEMA_INIT);
267 return;
268 }
269
270 // The |1| is because v2 [thumbnails] has one less column than v3 did. In the
271 // v2 case the column will get default values.
272 if (!recovery->AutoRecoverTable("thumbnails", 1, &thumbnails_recovered)) {
273 sql::Recovery::Rollback(recovery.Pass());
274 RecordRecoveryEvent(RECOVERY_EVENT_FAILED_AUTORECOVER_THUMBNAILS);
275 return;
276 }
277
278 // TODO(shess): Inline this?
279 FixThumbnailsTable(recovery->db());
280
281 if (!sql::Recovery::Recovered(recovery.Pass())) {
282 // TODO(shess): Very unclear what this failure would actually mean, and what
283 // should be done. Add histograms to Recovered() implementation to get some
284 // insight.
285 RecordRecoveryEvent(RECOVERY_EVENT_FAILED_COMMIT);
286 return;
287 }
288
289 // Track the size of the recovered database relative to the size of the input
290 // database. The size should almost always be smaller, unless the input
291 // database was empty to start with. If the percentage results are very low,
292 // something is awry.
293 int64 final_size = 0;
294 if (original_size > 0 &&
295 base::GetFileSize(db_path, &final_size) &&
296 final_size > 0) {
297 UMA_HISTOGRAM_PERCENTAGE("History.TopSitesRecoveredPercentage",
298 final_size * 100 / original_size);
299 }
300
301 // Using 10,000 because these cases mostly care about "none recovered" and
302 // "lots recovered". More than 10,000 rows recovered probably means there's
303 // something wrong with the profile.
304 UMA_HISTOGRAM_COUNTS_10000("History.TopSitesRecoveredRowsThumbnails",
305 thumbnails_recovered);
306
307 RecordRecoveryEvent(RECOVERY_EVENT_RECOVERED);
308 }
309
DatabaseErrorCallback(sql::Connection * db,const base::FilePath & db_path,int extended_error,sql::Statement * stmt)310 void DatabaseErrorCallback(sql::Connection* db,
311 const base::FilePath& db_path,
312 int extended_error,
313 sql::Statement* stmt) {
314 // TODO(shess): Assert that this is running on a safe thread. AFAICT, should
315 // be the history thread, but at this level I can't see how to reach that.
316
317 // Attempt to recover corrupt databases.
318 int error = (extended_error & 0xFF);
319 if (error == SQLITE_CORRUPT ||
320 error == SQLITE_CANTOPEN ||
321 error == SQLITE_NOTADB) {
322 RecoverDatabaseOrRaze(db, db_path);
323 }
324
325 // TODO(shess): This database's error histograms look like:
326 // 84% SQLITE_CORRUPT, SQLITE_CANTOPEN, SQLITE_NOTADB
327 // 7% SQLITE_ERROR
328 // 6% SQLITE_IOERR variants
329 // 2% SQLITE_READONLY
330 // .4% SQLITE_FULL
331 // nominal SQLITE_TOBIG, SQLITE_AUTH, and SQLITE_BUSY. In the case of
332 // thumbnail_database.cc, as soon as the recovery code landed, SQLITE_IOERR
333 // shot to leadership. If the I/O error is system-level, there is probably no
334 // hope, but if it is restricted to something about the database file, it is
335 // possible that the recovery code could be brought to bear. In fact, it is
336 // possible that running recovery would be a reasonable default when errors
337 // are seen.
338
339 // The default handling is to assert on debug and to ignore on release.
340 if (!sql::Connection::ShouldIgnoreSqliteError(extended_error))
341 DLOG(FATAL) << db->GetErrorMessage();
342 }
343
344 } // namespace
345
346 namespace history {
347
348 // static
349 const int TopSitesDatabase::kRankOfForcedURL = -1;
350
351 // static
352 const int TopSitesDatabase::kRankOfNonExistingURL = -2;
353
TopSitesDatabase()354 TopSitesDatabase::TopSitesDatabase() {
355 }
356
~TopSitesDatabase()357 TopSitesDatabase::~TopSitesDatabase() {
358 }
359
Init(const base::FilePath & db_name)360 bool TopSitesDatabase::Init(const base::FilePath& db_name) {
361 // Retry failed InitImpl() in case the recovery system fixed things.
362 // TODO(shess): Instrument to figure out if there are any persistent failure
363 // cases which do not resolve themselves.
364 const size_t kAttempts = 2;
365
366 for (size_t i = 0; i < kAttempts; ++i) {
367 if (InitImpl(db_name))
368 return true;
369
370 meta_table_.Reset();
371 db_.reset();
372 }
373 return false;
374 }
375
InitImpl(const base::FilePath & db_name)376 bool TopSitesDatabase::InitImpl(const base::FilePath& db_name) {
377 const bool file_existed = base::PathExists(db_name);
378
379 db_.reset(CreateDB(db_name));
380 if (!db_)
381 return false;
382
383 // An older version had data with no meta table. Deprecate by razing.
384 // TODO(shess): Just have RazeIfDeprecated() handle this case.
385 const bool does_meta_exist = sql::MetaTable::DoesTableExist(db_.get());
386 if (!does_meta_exist && file_existed) {
387 if (!db_->Raze())
388 return false;
389 }
390
391 // Clear databases which are too old to process.
392 DCHECK_LT(kDeprecatedVersionNumber, kVersionNumber);
393 sql::MetaTable::RazeIfDeprecated(db_.get(), kDeprecatedVersionNumber);
394
395 // Scope initialization in a transaction so we can't be partially
396 // initialized.
397 sql::Transaction transaction(db_.get());
398 // TODO(shess): Failure to open transaction is bad, address it.
399 if (!transaction.Begin())
400 return false;
401
402 if (!meta_table_.Init(db_.get(), kVersionNumber, kVersionNumber))
403 return false;
404
405 if (!InitTables(db_.get()))
406 return false;
407
408 if (meta_table_.GetVersionNumber() == 2) {
409 if (!UpgradeToVersion3()) {
410 LOG(WARNING) << "Unable to upgrade top sites database to version 3.";
411 return false;
412 }
413 }
414
415 // Version check.
416 if (meta_table_.GetVersionNumber() != kVersionNumber)
417 return false;
418
419 // Initialization is complete.
420 if (!transaction.Commit())
421 return false;
422
423 return true;
424 }
425
UpgradeToVersion3()426 bool TopSitesDatabase::UpgradeToVersion3() {
427 // Add 'last_forced' column.
428 if (!db_->Execute(
429 "ALTER TABLE thumbnails ADD last_forced INTEGER DEFAULT 0")) {
430 NOTREACHED();
431 return false;
432 }
433 meta_table_.SetVersionNumber(3);
434 return true;
435 }
436
GetPageThumbnails(MostVisitedURLList * urls,URLToImagesMap * thumbnails)437 void TopSitesDatabase::GetPageThumbnails(MostVisitedURLList* urls,
438 URLToImagesMap* thumbnails) {
439 sql::Statement statement(db_->GetCachedStatement(
440 SQL_FROM_HERE,
441 "SELECT url, url_rank, title, thumbnail, redirects, "
442 "boring_score, good_clipping, at_top, last_updated, load_completed, "
443 "last_forced FROM thumbnails ORDER BY url_rank, last_forced"));
444
445 if (!statement.is_valid()) {
446 LOG(WARNING) << db_->GetErrorMessage();
447 return;
448 }
449
450 urls->clear();
451 thumbnails->clear();
452
453 while (statement.Step()) {
454 // Results are sorted by url_rank. For forced thumbnails with url_rank = -1,
455 // thumbnails are sorted by last_forced.
456 MostVisitedURL url;
457 GURL gurl(statement.ColumnString(0));
458 url.url = gurl;
459 url.title = statement.ColumnString16(2);
460 url.last_forced_time =
461 base::Time::FromInternalValue(statement.ColumnInt64(10));
462 std::string redirects = statement.ColumnString(4);
463 SetRedirects(redirects, &url);
464 urls->push_back(url);
465
466 std::vector<unsigned char> data;
467 statement.ColumnBlobAsVector(3, &data);
468 Images thumbnail;
469 if (!data.empty())
470 thumbnail.thumbnail = base::RefCountedBytes::TakeVector(&data);
471 thumbnail.thumbnail_score.boring_score = statement.ColumnDouble(5);
472 thumbnail.thumbnail_score.good_clipping = statement.ColumnBool(6);
473 thumbnail.thumbnail_score.at_top = statement.ColumnBool(7);
474 thumbnail.thumbnail_score.time_at_snapshot =
475 base::Time::FromInternalValue(statement.ColumnInt64(8));
476 thumbnail.thumbnail_score.load_completed = statement.ColumnBool(9);
477 (*thumbnails)[gurl] = thumbnail;
478 }
479 }
480
SetPageThumbnail(const MostVisitedURL & url,int new_rank,const Images & thumbnail)481 void TopSitesDatabase::SetPageThumbnail(const MostVisitedURL& url,
482 int new_rank,
483 const Images& thumbnail) {
484 sql::Transaction transaction(db_.get());
485 transaction.Begin();
486
487 int rank = GetURLRank(url);
488 if (rank == kRankOfNonExistingURL) {
489 AddPageThumbnail(url, new_rank, thumbnail);
490 } else {
491 UpdatePageRankNoTransaction(url, new_rank);
492 UpdatePageThumbnail(url, thumbnail);
493 }
494
495 transaction.Commit();
496 }
497
UpdatePageThumbnail(const MostVisitedURL & url,const Images & thumbnail)498 bool TopSitesDatabase::UpdatePageThumbnail(
499 const MostVisitedURL& url, const Images& thumbnail) {
500 sql::Statement statement(db_->GetCachedStatement(
501 SQL_FROM_HERE,
502 "UPDATE thumbnails SET "
503 "title = ?, thumbnail = ?, redirects = ?, "
504 "boring_score = ?, good_clipping = ?, at_top = ?, last_updated = ?, "
505 "load_completed = ?, last_forced = ?"
506 "WHERE url = ? "));
507 statement.BindString16(0, url.title);
508 if (thumbnail.thumbnail.get() && thumbnail.thumbnail->front()) {
509 statement.BindBlob(1, thumbnail.thumbnail->front(),
510 static_cast<int>(thumbnail.thumbnail->size()));
511 }
512 statement.BindString(2, GetRedirects(url));
513 const ThumbnailScore& score = thumbnail.thumbnail_score;
514 statement.BindDouble(3, score.boring_score);
515 statement.BindBool(4, score.good_clipping);
516 statement.BindBool(5, score.at_top);
517 statement.BindInt64(6, score.time_at_snapshot.ToInternalValue());
518 statement.BindBool(7, score.load_completed);
519 statement.BindInt64(8, url.last_forced_time.ToInternalValue());
520 statement.BindString(9, url.url.spec());
521
522 return statement.Run();
523 }
524
AddPageThumbnail(const MostVisitedURL & url,int new_rank,const Images & thumbnail)525 void TopSitesDatabase::AddPageThumbnail(const MostVisitedURL& url,
526 int new_rank,
527 const Images& thumbnail) {
528 sql::Statement statement(db_->GetCachedStatement(
529 SQL_FROM_HERE,
530 "INSERT OR REPLACE INTO thumbnails "
531 "(url, url_rank, title, thumbnail, redirects, "
532 "boring_score, good_clipping, at_top, last_updated, load_completed, "
533 "last_forced) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)"));
534 statement.BindString(0, url.url.spec());
535 statement.BindInt(1, kRankOfForcedURL); // Fist make it a forced thumbnail.
536 statement.BindString16(2, url.title);
537 if (thumbnail.thumbnail.get() && thumbnail.thumbnail->front()) {
538 statement.BindBlob(3, thumbnail.thumbnail->front(),
539 static_cast<int>(thumbnail.thumbnail->size()));
540 }
541 statement.BindString(4, GetRedirects(url));
542 const ThumbnailScore& score = thumbnail.thumbnail_score;
543 statement.BindDouble(5, score.boring_score);
544 statement.BindBool(6, score.good_clipping);
545 statement.BindBool(7, score.at_top);
546 statement.BindInt64(8, score.time_at_snapshot.ToInternalValue());
547 statement.BindBool(9, score.load_completed);
548 int64 last_forced = url.last_forced_time.ToInternalValue();
549 DCHECK((last_forced == 0) == (new_rank != kRankOfForcedURL))
550 << "Thumbnail without a forced time stamp has a forced rank, or the "
551 << "opposite.";
552 statement.BindInt64(10, last_forced);
553 if (!statement.Run())
554 return;
555
556 // Update rank if this is not a forced thumbnail.
557 if (new_rank != kRankOfForcedURL)
558 UpdatePageRankNoTransaction(url, new_rank);
559 }
560
UpdatePageRank(const MostVisitedURL & url,int new_rank)561 void TopSitesDatabase::UpdatePageRank(const MostVisitedURL& url,
562 int new_rank) {
563 DCHECK((url.last_forced_time.ToInternalValue() == 0) ==
564 (new_rank != kRankOfForcedURL))
565 << "Thumbnail without a forced time stamp has a forced rank, or the "
566 << "opposite.";
567 sql::Transaction transaction(db_.get());
568 transaction.Begin();
569 UpdatePageRankNoTransaction(url, new_rank);
570 transaction.Commit();
571 }
572
573 // Caller should have a transaction open.
UpdatePageRankNoTransaction(const MostVisitedURL & url,int new_rank)574 void TopSitesDatabase::UpdatePageRankNoTransaction(
575 const MostVisitedURL& url, int new_rank) {
576 DCHECK_GT(db_->transaction_nesting(), 0);
577 DCHECK((url.last_forced_time.is_null()) == (new_rank != kRankOfForcedURL))
578 << "Thumbnail without a forced time stamp has a forced rank, or the "
579 << "opposite.";
580
581 int prev_rank = GetURLRank(url);
582 if (prev_rank == kRankOfNonExistingURL) {
583 LOG(WARNING) << "Updating rank of an unknown URL: " << url.url.spec();
584 return;
585 }
586
587 // Shift the ranks.
588 if (prev_rank > new_rank) {
589 if (new_rank == kRankOfForcedURL) {
590 // From non-forced to forced, shift down.
591 // Example: 2 -> -1
592 // -1, -1, -1, 0, 1, [2 -> -1], [3 -> 2], [4 -> 3]
593 sql::Statement shift_statement(db_->GetCachedStatement(
594 SQL_FROM_HERE,
595 "UPDATE thumbnails "
596 "SET url_rank = url_rank - 1 "
597 "WHERE url_rank > ?"));
598 shift_statement.BindInt(0, prev_rank);
599 shift_statement.Run();
600 } else {
601 // From non-forced to non-forced, shift up.
602 // Example: 3 -> 1
603 // -1, -1, -1, 0, [1 -> 2], [2 -> 3], [3 -> 1], 4
604 sql::Statement shift_statement(db_->GetCachedStatement(
605 SQL_FROM_HERE,
606 "UPDATE thumbnails "
607 "SET url_rank = url_rank + 1 "
608 "WHERE url_rank >= ? AND url_rank < ?"));
609 shift_statement.BindInt(0, new_rank);
610 shift_statement.BindInt(1, prev_rank);
611 shift_statement.Run();
612 }
613 } else if (prev_rank < new_rank) {
614 if (prev_rank == kRankOfForcedURL) {
615 // From non-forced to forced, shift up.
616 // Example: -1 -> 2
617 // -1, [-1 -> 2], -1, 0, 1, [2 -> 3], [3 -> 4], [4 -> 5]
618 sql::Statement shift_statement(db_->GetCachedStatement(
619 SQL_FROM_HERE,
620 "UPDATE thumbnails "
621 "SET url_rank = url_rank + 1 "
622 "WHERE url_rank >= ?"));
623 shift_statement.BindInt(0, new_rank);
624 shift_statement.Run();
625 } else {
626 // From non-forced to non-forced, shift down.
627 // Example: 1 -> 3.
628 // -1, -1, -1, 0, [1 -> 3], [2 -> 1], [3 -> 2], 4
629 sql::Statement shift_statement(db_->GetCachedStatement(
630 SQL_FROM_HERE,
631 "UPDATE thumbnails "
632 "SET url_rank = url_rank - 1 "
633 "WHERE url_rank > ? AND url_rank <= ?"));
634 shift_statement.BindInt(0, prev_rank);
635 shift_statement.BindInt(1, new_rank);
636 shift_statement.Run();
637 }
638 }
639
640 // Set the url's rank and last_forced, since the latter changes when a URL
641 // goes from forced to non-forced and vice-versa.
642 sql::Statement set_statement(db_->GetCachedStatement(
643 SQL_FROM_HERE,
644 "UPDATE thumbnails "
645 "SET url_rank = ?, last_forced = ? "
646 "WHERE url == ?"));
647 set_statement.BindInt(0, new_rank);
648 set_statement.BindInt64(1, url.last_forced_time.ToInternalValue());
649 set_statement.BindString(2, url.url.spec());
650 set_statement.Run();
651 }
652
GetPageThumbnail(const GURL & url,Images * thumbnail)653 bool TopSitesDatabase::GetPageThumbnail(const GURL& url,
654 Images* thumbnail) {
655 sql::Statement statement(db_->GetCachedStatement(
656 SQL_FROM_HERE,
657 "SELECT thumbnail, boring_score, good_clipping, at_top, last_updated "
658 "FROM thumbnails WHERE url=?"));
659 statement.BindString(0, url.spec());
660 if (!statement.Step())
661 return false;
662
663 std::vector<unsigned char> data;
664 statement.ColumnBlobAsVector(0, &data);
665 thumbnail->thumbnail = base::RefCountedBytes::TakeVector(&data);
666 thumbnail->thumbnail_score.boring_score = statement.ColumnDouble(1);
667 thumbnail->thumbnail_score.good_clipping = statement.ColumnBool(2);
668 thumbnail->thumbnail_score.at_top = statement.ColumnBool(3);
669 thumbnail->thumbnail_score.time_at_snapshot =
670 base::Time::FromInternalValue(statement.ColumnInt64(4));
671 return true;
672 }
673
GetURLRank(const MostVisitedURL & url)674 int TopSitesDatabase::GetURLRank(const MostVisitedURL& url) {
675 sql::Statement select_statement(db_->GetCachedStatement(
676 SQL_FROM_HERE,
677 "SELECT url_rank "
678 "FROM thumbnails WHERE url=?"));
679 select_statement.BindString(0, url.url.spec());
680 if (select_statement.Step())
681 return select_statement.ColumnInt(0);
682
683 return kRankOfNonExistingURL;
684 }
685
686 // Remove the record for this URL. Returns true iff removed successfully.
RemoveURL(const MostVisitedURL & url)687 bool TopSitesDatabase::RemoveURL(const MostVisitedURL& url) {
688 int old_rank = GetURLRank(url);
689 if (old_rank == kRankOfNonExistingURL)
690 return false;
691
692 sql::Transaction transaction(db_.get());
693 transaction.Begin();
694 if (old_rank != kRankOfForcedURL) {
695 // Decrement all following ranks.
696 sql::Statement shift_statement(db_->GetCachedStatement(
697 SQL_FROM_HERE,
698 "UPDATE thumbnails "
699 "SET url_rank = url_rank - 1 "
700 "WHERE url_rank > ?"));
701 shift_statement.BindInt(0, old_rank);
702
703 if (!shift_statement.Run())
704 return false;
705 }
706
707 sql::Statement delete_statement(
708 db_->GetCachedStatement(SQL_FROM_HERE,
709 "DELETE FROM thumbnails WHERE url = ?"));
710 delete_statement.BindString(0, url.url.spec());
711
712 if (!delete_statement.Run())
713 return false;
714
715 return transaction.Commit();
716 }
717
CreateDB(const base::FilePath & db_name)718 sql::Connection* TopSitesDatabase::CreateDB(const base::FilePath& db_name) {
719 scoped_ptr<sql::Connection> db(new sql::Connection());
720 // Settings copied from ThumbnailDatabase.
721 db->set_histogram_tag("TopSites");
722 db->set_error_callback(base::Bind(&DatabaseErrorCallback,
723 db.get(), db_name));
724 db->set_page_size(4096);
725 db->set_cache_size(32);
726
727 if (!db->Open(db_name))
728 return NULL;
729 return db.release();
730 }
731
732 } // namespace history
733