// Copyright (c) 2012 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "chrome/browser/history/history_backend.h" #include #include #include #include #include #include #include "base/basictypes.h" #include "base/bind.h" #include "base/compiler_specific.h" #include "base/file_util.h" #include "base/memory/scoped_ptr.h" #include "base/memory/scoped_vector.h" #include "base/message_loop.h" #include "base/metrics/histogram.h" #include "base/string_util.h" #include "base/time.h" #include "base/utf_string_conversions.h" #include "chrome/browser/api/bookmarks/bookmark_service.h" #include "chrome/browser/autocomplete/history_url_provider.h" #include "chrome/browser/history/download_row.h" #include "chrome/browser/history/history_notifications.h" #include "chrome/browser/history/history_publisher.h" #include "chrome/browser/history/in_memory_history_backend.h" #include "chrome/browser/history/page_usage_data.h" #include "chrome/browser/history/select_favicon_frames.h" #include "chrome/browser/history/top_sites.h" #include "chrome/browser/history/visit_filter.h" #include "chrome/common/chrome_constants.h" #include "chrome/common/chrome_notification_types.h" #include "chrome/common/url_constants.h" #include "googleurl/src/gurl.h" #include "grit/chromium_strings.h" #include "grit/generated_resources.h" #include "net/base/registry_controlled_domains/registry_controlled_domain.h" #include "sql/error_delegate_util.h" #if defined(OS_ANDROID) #include "chrome/browser/history/android/android_provider_backend.h" #endif using base::Time; using base::TimeDelta; using base::TimeTicks; /* The HistoryBackend consists of a number of components: HistoryDatabase (stores past 3 months of history) URLDatabase (stores a list of URLs) DownloadDatabase (stores a list of downloads) VisitDatabase (stores a list of visits for the URLs) VisitSegmentDatabase (stores groups of URLs for the most visited view). ArchivedDatabase (stores history older than 3 months) URLDatabase (stores a list of URLs) DownloadDatabase (stores a list of downloads) VisitDatabase (stores a list of visits for the URLs) (this does not store visit segments as they expire after 3 mos.) TextDatabaseManager (manages multiple text database for different times) TextDatabase (represents a single month of full-text index). ...more TextDatabase objects... ExpireHistoryBackend (manages moving things from HistoryDatabase to the ArchivedDatabase and deleting) */ namespace history { // How long we keep segment data for in days. Currently 3 months. // This value needs to be greater or equal to // MostVisitedModel::kMostVisitedScope but we don't want to introduce a direct // dependency between MostVisitedModel and the history backend. static const int kSegmentDataRetention = 90; // How long we'll wait to do a commit, so that things are batched together. static const int kCommitIntervalSeconds = 10; // The amount of time before we re-fetch the favicon. static const int kFaviconRefetchDays = 7; // GetSessionTabs returns all open tabs, or tabs closed kSessionCloseTimeWindow // seconds ago. static const int kSessionCloseTimeWindowSecs = 10; // The maximum number of items we'll allow in the redirect list before // deleting some. static const int kMaxRedirectCount = 32; // The number of days old a history entry can be before it is considered "old" // and is archived. static const int kArchiveDaysThreshold = 90; // Converts from PageUsageData to MostVisitedURL. |redirects| is a // list of redirects for this URL. Empty list means no redirects. MostVisitedURL MakeMostVisitedURL(const PageUsageData& page_data, const RedirectList& redirects) { MostVisitedURL mv; mv.url = page_data.GetURL(); mv.title = page_data.GetTitle(); if (redirects.empty()) { // Redirects must contain at least the target url. mv.redirects.push_back(mv.url); } else { mv.redirects = redirects; if (mv.redirects[mv.redirects.size() - 1] != mv.url) { // The last url must be the target url. mv.redirects.push_back(mv.url); } } return mv; } // This task is run on a timer so that commits happen at regular intervals // so they are batched together. The important thing about this class is that // it supports canceling of the task so the reference to the backend will be // freed. The problem is that when history is shutting down, there is likely // to be one of these commits still pending and holding a reference. // // The backend can call Cancel to have this task release the reference. The // task will still run (if we ever get to processing the event before // shutdown), but it will not do anything. // // Note that this is a refcounted object and is not a task in itself. It should // be assigned to a RunnableMethod. // // TODO(brettw): bug 1165182: This should be replaced with a // base::WeakPtrFactory which will handle everything automatically (like we do // in ExpireHistoryBackend). class CommitLaterTask : public base::RefCounted { public: explicit CommitLaterTask(HistoryBackend* history_backend) : history_backend_(history_backend) { } // The backend will call this function if it is being destroyed so that we // release our reference. void Cancel() { history_backend_ = NULL; } void RunCommit() { if (history_backend_.get()) history_backend_->Commit(); } private: friend class base::RefCounted; ~CommitLaterTask() {} scoped_refptr history_backend_; }; // Handles querying first the main database, then the full text database if that // fails. It will optionally keep track of all URLs seen so duplicates can be // eliminated. This is used by the querying sub-functions. // // TODO(brettw): This class may be able to be simplified or eliminated. After // this was written, QueryResults can efficiently look up by URL, so the need // for this extra set of previously queried URLs is less important. class HistoryBackend::URLQuerier { public: URLQuerier(URLDatabase* main_db, URLDatabase* archived_db, bool track_unique) : main_db_(main_db), archived_db_(archived_db), track_unique_(track_unique) { } // When we're tracking unique URLs, returns true if this URL has been // previously queried. Only call when tracking unique URLs. bool HasURL(const GURL& url) { DCHECK(track_unique_); return unique_urls_.find(url) != unique_urls_.end(); } bool GetRowForURL(const GURL& url, URLRow* row) { if (!main_db_->GetRowForURL(url, row)) { if (!archived_db_ || !archived_db_->GetRowForURL(url, row)) { // This row is neither in the main nor the archived DB. return false; } } if (track_unique_) unique_urls_.insert(url); return true; } private: URLDatabase* main_db_; // Guaranteed non-NULL. URLDatabase* archived_db_; // Possibly NULL. bool track_unique_; // When track_unique_ is set, this is updated with every URL seen so far. std::set unique_urls_; DISALLOW_COPY_AND_ASSIGN(URLQuerier); }; // KillHistoryDatabaseErrorDelegate ------------------------------------------- class KillHistoryDatabaseErrorDelegate : public sql::ErrorDelegate { public: explicit KillHistoryDatabaseErrorDelegate(HistoryBackend* backend) : backend_(backend), scheduled_killing_database_(false) { } // sql::ErrorDelegate implementation. virtual int OnError(int error, sql::Connection* connection, sql::Statement* stmt) OVERRIDE { // Do not schedule killing database more than once. If the first time // failed, it is unlikely that a second time will be successful. if (!scheduled_killing_database_ && sql::IsErrorCatastrophic(error)) { scheduled_killing_database_ = true; // Don't just do the close/delete here, as we are being called by |db| and // that seems dangerous. MessageLoop::current()->PostTask( FROM_HERE, base::Bind(&HistoryBackend::KillHistoryDatabase, backend_)); } return error; } // Returns true if the delegate has previously scheduled killing the database. bool scheduled_killing_database() const { return scheduled_killing_database_; } private: // Do not increment the count on |HistoryBackend| as that would create a // circular reference (HistoryBackend -> HistoryDatabase -> Connection -> // ErrorDelegate -> HistoryBackend). HistoryBackend* backend_; // True if the backend has previously scheduled killing the history database. bool scheduled_killing_database_; DISALLOW_COPY_AND_ASSIGN(KillHistoryDatabaseErrorDelegate); }; // HistoryBackend -------------------------------------------------------------- HistoryBackend::HistoryBackend(const FilePath& history_dir, int id, Delegate* delegate, BookmarkService* bookmark_service) : delegate_(delegate), id_(id), history_dir_(history_dir), ALLOW_THIS_IN_INITIALIZER_LIST(expirer_(this, bookmark_service)), recent_redirects_(kMaxRedirectCount), backend_destroy_message_loop_(NULL), segment_queried_(false), bookmark_service_(bookmark_service) { } HistoryBackend::~HistoryBackend() { DCHECK(!scheduled_commit_) << "Deleting without cleanup"; ReleaseDBTasks(); #if defined(OS_ANDROID) // Release AndroidProviderBackend before other objects. android_provider_backend_.reset(); #endif // First close the databases before optionally running the "destroy" task. CloseAllDatabases(); if (!backend_destroy_task_.is_null()) { // Notify an interested party (typically a unit test) that we're done. DCHECK(backend_destroy_message_loop_); backend_destroy_message_loop_->PostTask(FROM_HERE, backend_destroy_task_); } #if defined(OS_ANDROID) file_util::Delete(GetAndroidCacheFileName(), false); #endif } void HistoryBackend::Init(const std::string& languages, bool force_fail) { if (!force_fail) InitImpl(languages); delegate_->DBLoaded(id_); } void HistoryBackend::SetOnBackendDestroyTask(MessageLoop* message_loop, const base::Closure& task) { if (!backend_destroy_task_.is_null()) DLOG(WARNING) << "Setting more than one destroy task, overriding"; backend_destroy_message_loop_ = message_loop; backend_destroy_task_ = task; } void HistoryBackend::Closing() { // Any scheduled commit will have a reference to us, we must make it // release that reference before we can be destroyed. CancelScheduledCommit(); // Release our reference to the delegate, this reference will be keeping the // history service alive. delegate_.reset(); } void HistoryBackend::NotifyRenderProcessHostDestruction(const void* host) { tracker_.NotifyRenderProcessHostDestruction(host); } FilePath HistoryBackend::GetThumbnailFileName() const { return history_dir_.Append(chrome::kThumbnailsFilename); } FilePath HistoryBackend::GetFaviconsFileName() const { return history_dir_.Append(chrome::kFaviconsFilename); } FilePath HistoryBackend::GetArchivedFileName() const { return history_dir_.Append(chrome::kArchivedHistoryFilename); } #if defined(OS_ANDROID) FilePath HistoryBackend::GetAndroidCacheFileName() const { return history_dir_.Append(chrome::kAndroidCacheFilename); } #endif SegmentID HistoryBackend::GetLastSegmentID(VisitID from_visit) { // Set is used to detect referrer loops. Should not happen, but can // if the database is corrupt. std::set visit_set; VisitID visit_id = from_visit; while (visit_id) { VisitRow row; if (!db_->GetRowForVisit(visit_id, &row)) return 0; if (row.segment_id) return row.segment_id; // Found a visit in this change with a segment. // Check the referrer of this visit, if any. visit_id = row.referring_visit; if (visit_set.find(visit_id) != visit_set.end()) { NOTREACHED() << "Loop in referer chain, giving up"; break; } visit_set.insert(visit_id); } return 0; } SegmentID HistoryBackend::UpdateSegments( const GURL& url, VisitID from_visit, VisitID visit_id, content::PageTransition transition_type, const Time ts) { if (!db_.get()) return 0; // We only consider main frames. if (!content::PageTransitionIsMainFrame(transition_type)) return 0; SegmentID segment_id = 0; content::PageTransition t = content::PageTransitionStripQualifier(transition_type); // Are we at the beginning of a new segment? // Note that navigating to an existing entry (with back/forward) reuses the // same transition type. We are not adding it as a new segment in that case // because if this was the target of a redirect, we might end up with // 2 entries for the same final URL. Ex: User types google.net, gets // redirected to google.com. A segment is created for google.net. On // google.com users navigates through a link, then press back. That last // navigation is for the entry google.com transition typed. We end up adding // a segment for that one as well. So we end up with google.net and google.com // in the segement table, showing as 2 entries in the NTP. // Note also that we should still be updating the visit count for that segment // which we are not doing now. It should be addressed when // http://crbug.com/96860 is fixed. if ((t == content::PAGE_TRANSITION_TYPED || t == content::PAGE_TRANSITION_AUTO_BOOKMARK) && (transition_type & content::PAGE_TRANSITION_FORWARD_BACK) == 0) { // If so, create or get the segment. std::string segment_name = db_->ComputeSegmentName(url); URLID url_id = db_->GetRowForURL(url, NULL); if (!url_id) return 0; if (!(segment_id = db_->GetSegmentNamed(segment_name))) { if (!(segment_id = db_->CreateSegment(url_id, segment_name))) { NOTREACHED(); return 0; } } else { // Note: if we update an existing segment, we update the url used to // represent that segment in order to minimize stale most visited // images. db_->UpdateSegmentRepresentationURL(segment_id, url_id); } } else { // Note: it is possible there is no segment ID set for this visit chain. // This can happen if the initial navigation wasn't AUTO_BOOKMARK or // TYPED. (For example GENERATED). In this case this visit doesn't count // toward any segment. if (!(segment_id = GetLastSegmentID(from_visit))) return 0; } // Set the segment in the visit. if (!db_->SetSegmentID(visit_id, segment_id)) { NOTREACHED(); return 0; } // Finally, increase the counter for that segment / day. if (!db_->IncreaseSegmentVisitCount(segment_id, ts, 1)) { NOTREACHED(); return 0; } return segment_id; } void HistoryBackend::UpdateWithPageEndTime(const void* host, int32 page_id, const GURL& url, Time end_ts) { // Will be filled with the URL ID and the visit ID of the last addition. VisitID visit_id = tracker_.GetLastVisit(host, page_id, url); UpdateVisitDuration(visit_id, end_ts); } void HistoryBackend::UpdateVisitDuration(VisitID visit_id, const Time end_ts) { if (!db_.get()) return; // Get the starting visit_time for visit_id. VisitRow visit_row; if (db_->GetRowForVisit(visit_id, &visit_row)) { // We should never have a negative duration time even when time is skewed. visit_row.visit_duration = end_ts > visit_row.visit_time ? end_ts - visit_row.visit_time : TimeDelta::FromMicroseconds(0); db_->UpdateVisitRow(visit_row); } } void HistoryBackend::AddPage(const HistoryAddPageArgs& request) { if (!db_.get()) return; // Will be filled with the URL ID and the visit ID of the last addition. std::pair last_ids(0, tracker_.GetLastVisit( request.id_scope, request.page_id, request.referrer)); VisitID from_visit_id = last_ids.second; // If a redirect chain is given, we expect the last item in that chain to be // the final URL. DCHECK(request.redirects.empty() || request.redirects.back() == request.url); // If the user is adding older history, we need to make sure our times // are correct. if (request.time < first_recorded_time_) first_recorded_time_ = request.time; content::PageTransition request_transition = request.transition; content::PageTransition stripped_transition = content::PageTransitionStripQualifier(request_transition); bool is_keyword_generated = (stripped_transition == content::PAGE_TRANSITION_KEYWORD_GENERATED); // If the user is navigating to a not-previously-typed intranet hostname, // change the transition to TYPED so that the omnibox will learn that this is // a known host. bool has_redirects = request.redirects.size() > 1; if (content::PageTransitionIsMainFrame(request_transition) && (stripped_transition != content::PAGE_TRANSITION_TYPED) && !is_keyword_generated) { const GURL& origin_url(has_redirects ? request.redirects[0] : request.url); if (origin_url.SchemeIs(chrome::kHttpScheme) || origin_url.SchemeIs(chrome::kHttpsScheme) || origin_url.SchemeIs(chrome::kFtpScheme)) { std::string host(origin_url.host()); if ((net::RegistryControlledDomainService::GetRegistryLength( host, false) == 0) && !db_->IsTypedHost(host)) { stripped_transition = content::PAGE_TRANSITION_TYPED; request_transition = content::PageTransitionFromInt( stripped_transition | content::PageTransitionGetQualifier(request_transition)); } } } if (!has_redirects) { // The single entry is both a chain start and end. content::PageTransition t = content::PageTransitionFromInt( request_transition | content::PAGE_TRANSITION_CHAIN_START | content::PAGE_TRANSITION_CHAIN_END); // No redirect case (one element means just the page itself). last_ids = AddPageVisit(request.url, request.time, last_ids.second, t, request.visit_source); // Update the segment for this visit. KEYWORD_GENERATED visits should not // result in changing most visited, so we don't update segments (most // visited db). if (!is_keyword_generated) { UpdateSegments(request.url, from_visit_id, last_ids.second, t, request.time); // Update the referrer's duration. UpdateVisitDuration(from_visit_id, request.time); } } else { // Redirect case. Add the redirect chain. content::PageTransition redirect_info = content::PAGE_TRANSITION_CHAIN_START; RedirectList redirects = request.redirects; if (redirects[0].SchemeIs(chrome::kAboutScheme)) { // When the redirect source + referrer is "about" we skip it. This // happens when a page opens a new frame/window to about:blank and then // script sets the URL to somewhere else (used to hide the referrer). It // would be nice to keep all these redirects properly but we don't ever // see the initial about:blank load, so we don't know where the // subsequent client redirect came from. // // In this case, we just don't bother hooking up the source of the // redirects, so we remove it. redirects.erase(redirects.begin()); } else if (request_transition & content::PAGE_TRANSITION_CLIENT_REDIRECT) { redirect_info = content::PAGE_TRANSITION_CLIENT_REDIRECT; // The first entry in the redirect chain initiated a client redirect. // We don't add this to the database since the referrer is already // there, so we skip over it but change the transition type of the first // transition to client redirect. // // The referrer is invalid when restoring a session that features an // https tab that redirects to a different host or to http. In this // case we don't need to reconnect the new redirect with the existing // chain. if (request.referrer.is_valid()) { DCHECK(request.referrer == redirects[0]); redirects.erase(redirects.begin()); // If the navigation entry for this visit has replaced that for the // first visit, remove the CHAIN_END marker from the first visit. This // can be called a lot, for example, the page cycler, and most of the // time we won't have changed anything. VisitRow visit_row; if (request.did_replace_entry && db_->GetRowForVisit(last_ids.second, &visit_row) && visit_row.transition & content::PAGE_TRANSITION_CHAIN_END) { visit_row.transition = content::PageTransitionFromInt( visit_row.transition & ~content::PAGE_TRANSITION_CHAIN_END); db_->UpdateVisitRow(visit_row); } } } for (size_t redirect_index = 0; redirect_index < redirects.size(); redirect_index++) { content::PageTransition t = content::PageTransitionFromInt(stripped_transition | redirect_info); // If this is the last transition, add a CHAIN_END marker if (redirect_index == (redirects.size() - 1)) { t = content::PageTransitionFromInt( t | content::PAGE_TRANSITION_CHAIN_END); } // Record all redirect visits with the same timestamp. We don't display // them anyway, and if we ever decide to, we can reconstruct their order // from the redirect chain. last_ids = AddPageVisit(redirects[redirect_index], request.time, last_ids.second, t, request.visit_source); if (t & content::PAGE_TRANSITION_CHAIN_START) { // Update the segment for this visit. UpdateSegments(redirects[redirect_index], from_visit_id, last_ids.second, t, request.time); // Update the visit_details for this visit. UpdateVisitDuration(from_visit_id, request.time); } // Subsequent transitions in the redirect list must all be server // redirects. redirect_info = content::PAGE_TRANSITION_SERVER_REDIRECT; } // Last, save this redirect chain for later so we can set titles & favicons // on the redirected pages properly. It is indexed by the destination page. recent_redirects_.Put(request.url, redirects); } // TODO(brettw) bug 1140015: Add an "add page" notification so the history // views can keep in sync. // Add the last visit to the tracker so we can get outgoing transitions. // TODO(evanm): Due to http://b/1194536 we lose the referrers of a subframe // navigation anyway, so last_visit_id is always zero for them. But adding // them here confuses main frame history, so we skip them for now. if (stripped_transition != content::PAGE_TRANSITION_AUTO_SUBFRAME && stripped_transition != content::PAGE_TRANSITION_MANUAL_SUBFRAME && !is_keyword_generated) { tracker_.AddVisit(request.id_scope, request.page_id, request.url, last_ids.second); } if (text_database_.get()) { text_database_->AddPageURL(request.url, last_ids.first, last_ids.second, request.time); } ScheduleCommit(); } void HistoryBackend::InitImpl(const std::string& languages) { DCHECK(!db_.get()) << "Initializing HistoryBackend twice"; // In the rare case where the db fails to initialize a dialog may get shown // the blocks the caller, yet allows other messages through. For this reason // we only set db_ to the created database if creation is successful. That // way other methods won't do anything as db_ is still NULL. TimeTicks beginning_time = TimeTicks::Now(); // Compute the file names. Note that the index file can be removed when the // text db manager is finished being hooked up. FilePath history_name = history_dir_.Append(chrome::kHistoryFilename); FilePath thumbnail_name = GetThumbnailFileName(); FilePath archived_name = GetArchivedFileName(); // History database. db_.reset(new HistoryDatabase()); // |HistoryDatabase::Init| takes ownership of |error_delegate|. KillHistoryDatabaseErrorDelegate* error_delegate = new KillHistoryDatabaseErrorDelegate(this); sql::InitStatus status = db_->Init(history_name, error_delegate); switch (status) { case sql::INIT_OK: break; case sql::INIT_FAILURE: { // A NULL db_ will cause all calls on this object to notice this error // and to not continue. If the error delegate scheduled killing the // database, the task it posted has not executed yet. Try killing the // database now before we close it. bool kill_database = error_delegate->scheduled_killing_database(); if (kill_database) KillHistoryDatabase(); UMA_HISTOGRAM_BOOLEAN("History.AttemptedToFixProfileError", kill_database); delegate_->NotifyProfileError(id_, status); db_.reset(); return; } default: NOTREACHED(); } // Fill the in-memory database and send it back to the history service on the // main thread. InMemoryHistoryBackend* mem_backend = new InMemoryHistoryBackend; if (mem_backend->Init(history_name, db_.get())) delegate_->SetInMemoryBackend(id_, mem_backend); // Takes ownership of // pointer. else delete mem_backend; // Error case, run without the in-memory DB. db_->BeginExclusiveMode(); // Must be after the mem backend read the data. // Create the history publisher which needs to be passed on to the text and // thumbnail databases for publishing history. history_publisher_.reset(new HistoryPublisher()); if (!history_publisher_->Init()) { // The init may fail when there are no indexers wanting our history. // Hence no need to log the failure. history_publisher_.reset(); } // Full-text database. This has to be first so we can pass it to the // HistoryDatabase for migration. text_database_.reset(new TextDatabaseManager(history_dir_, db_.get(), db_.get())); if (!text_database_->Init(history_publisher_.get())) { LOG(WARNING) << "Text database initialization failed, running without it."; text_database_.reset(); } if (db_->needs_version_17_migration()) { // See needs_version_17_migration() decl for more. In this case, we want // to erase all the text database files. This must be done after the text // database manager has been initialized, since it knows about all the // files it manages. text_database_->DeleteAll(); } // Thumbnail database. thumbnail_db_.reset(new ThumbnailDatabase()); if (!db_->GetNeedsThumbnailMigration()) { // No convertion needed - use new filename right away. thumbnail_name = GetFaviconsFileName(); } if (thumbnail_db_->Init(thumbnail_name, history_publisher_.get(), db_.get()) != sql::INIT_OK) { // Unlike the main database, we don't error out when the database is too // new because this error is much less severe. Generally, this shouldn't // happen since the thumbnail and main datbase versions should be in sync. // We'll just continue without thumbnails & favicons in this case or any // other error. LOG(WARNING) << "Could not initialize the thumbnail database."; thumbnail_db_.reset(); } if (db_->GetNeedsThumbnailMigration()) { VLOG(1) << "Starting TopSites migration"; delegate_->StartTopSitesMigration(id_); } // Archived database. if (db_->needs_version_17_migration()) { // See needs_version_17_migration() decl for more. In this case, we want // to delete the archived database and need to do so before we try to // open the file. We can ignore any error (maybe the file doesn't exist). file_util::Delete(archived_name, false); } archived_db_.reset(new ArchivedDatabase()); if (!archived_db_->Init(archived_name)) { LOG(WARNING) << "Could not initialize the archived database."; archived_db_.reset(); } // Tell the expiration module about all the nice databases we made. This must // happen before db_->Init() is called since the callback ForceArchiveHistory // may need to expire stuff. // // *sigh*, this can all be cleaned up when that migration code is removed. // The main DB initialization should intuitively be first (not that it // actually matters) and the expirer should be set last. expirer_.SetDatabases(db_.get(), archived_db_.get(), thumbnail_db_.get(), text_database_.get()); // Open the long-running transaction. db_->BeginTransaction(); if (thumbnail_db_.get()) thumbnail_db_->BeginTransaction(); if (archived_db_.get()) archived_db_->BeginTransaction(); if (text_database_.get()) text_database_->BeginTransaction(); // Get the first item in our database. db_->GetStartDate(&first_recorded_time_); // Start expiring old stuff. expirer_.StartArchivingOldStuff(TimeDelta::FromDays(kArchiveDaysThreshold)); #if defined(OS_ANDROID) if (thumbnail_db_.get()) { android_provider_backend_.reset(new AndroidProviderBackend( GetAndroidCacheFileName(), db_.get(), thumbnail_db_.get(), bookmark_service_, delegate_.get())); } #endif HISTOGRAM_TIMES("History.InitTime", TimeTicks::Now() - beginning_time); } void HistoryBackend::CloseAllDatabases() { if (db_.get()) { // Commit the long-running transaction. db_->CommitTransaction(); db_.reset(); } if (thumbnail_db_.get()) { thumbnail_db_->CommitTransaction(); thumbnail_db_.reset(); } if (archived_db_.get()) { archived_db_->CommitTransaction(); archived_db_.reset(); } if (text_database_.get()) { text_database_->CommitTransaction(); text_database_.reset(); } } std::pair HistoryBackend::AddPageVisit( const GURL& url, Time time, VisitID referring_visit, content::PageTransition transition, VisitSource visit_source) { // Top-level frame navigations are visible, everything else is hidden bool new_hidden = !content::PageTransitionIsMainFrame(transition); // NOTE: This code must stay in sync with // ExpireHistoryBackend::ExpireURLsForVisits(). // TODO(pkasting): http://b/1148304 We shouldn't be marking so many URLs as // typed, which would eliminate the need for this code. int typed_increment = 0; content::PageTransition transition_type = content::PageTransitionStripQualifier(transition); if ((transition_type == content::PAGE_TRANSITION_TYPED && !content::PageTransitionIsRedirect(transition)) || transition_type == content::PAGE_TRANSITION_KEYWORD_GENERATED) typed_increment = 1; // See if this URL is already in the DB. URLRow url_info(url); URLID url_id = db_->GetRowForURL(url, &url_info); if (url_id) { // Update of an existing row. if (content::PageTransitionStripQualifier(transition) != content::PAGE_TRANSITION_RELOAD) url_info.set_visit_count(url_info.visit_count() + 1); if (typed_increment) url_info.set_typed_count(url_info.typed_count() + typed_increment); url_info.set_last_visit(time); // Only allow un-hiding of pages, never hiding. if (!new_hidden) url_info.set_hidden(false); db_->UpdateURLRow(url_id, url_info); } else { // Addition of a new row. url_info.set_visit_count(1); url_info.set_typed_count(typed_increment); url_info.set_last_visit(time); url_info.set_hidden(new_hidden); url_id = db_->AddURL(url_info); if (!url_id) { NOTREACHED() << "Adding URL failed."; return std::make_pair(0, 0); } url_info.id_ = url_id; // We don't actually add the URL to the full text index at this point. It // might be nice to do this so that even if we get no title or body, the // user can search for URL components and get the page. // // However, in most cases, we'll get at least a title and usually contents, // and this add will be redundant, slowing everything down. As a result, // we ignore this edge case. } // Add the visit with the time to the database. VisitRow visit_info(url_id, time, referring_visit, transition, 0); VisitID visit_id = db_->AddVisit(&visit_info, visit_source); NotifyVisitObservers(visit_info); if (visit_info.visit_time < first_recorded_time_) first_recorded_time_ = visit_info.visit_time; // Broadcast a notification of the visit. if (visit_id) { URLVisitedDetails* details = new URLVisitedDetails; details->transition = transition; details->row = url_info; // TODO(meelapshah) Disabled due to potential PageCycler regression. // Re-enable this. // GetMostRecentRedirectsTo(url, &details->redirects); BroadcastNotifications(chrome::NOTIFICATION_HISTORY_URL_VISITED, details); } else { VLOG(0) << "Failed to build visit insert statement: " << "url_id = " << url_id; } return std::make_pair(url_id, visit_id); } void HistoryBackend::AddPagesWithDetails(const URLRows& urls, VisitSource visit_source) { if (!db_.get()) return; scoped_ptr modified(new URLsModifiedDetails); for (URLRows::const_iterator i = urls.begin(); i != urls.end(); ++i) { DCHECK(!i->last_visit().is_null()); // We will add to either the archived database or the main one depending on // the date of the added visit. URLDatabase* url_database; VisitDatabase* visit_database; if (IsExpiredVisitTime(i->last_visit())) { if (!archived_db_.get()) return; // No archived database to save it to, just forget this. url_database = archived_db_.get(); visit_database = archived_db_.get(); } else { url_database = db_.get(); visit_database = db_.get(); } URLRow existing_url; URLID url_id = url_database->GetRowForURL(i->url(), &existing_url); if (!url_id) { // Add the page if it doesn't exist. url_id = url_database->AddURL(*i); if (!url_id) { NOTREACHED() << "Could not add row to DB"; return; } if (i->typed_count() > 0) { modified->changed_urls.push_back(*i); modified->changed_urls.back().set_id(url_id); // *i likely has |id_| 0. } } // Add the page to the full text index. This function is also used for // importing. Even though we don't have page contents, we can at least // add the title and URL to the index so they can be searched. We don't // bother to delete any already-existing FTS entries for the URL, since // this is normally called on import. // // If you ever import *after* first run (selecting import from the menu), // then these additional entries will "shadow" the originals when querying // for the most recent match only, and the user won't get snippets. This is // a very minor issue, and fixing it will make import slower, so we don't // bother. bool has_indexed = false; if (text_database_.get()) { // We do not have to make it update the visit database, below, we will // create the visit entry with the indexed flag set. has_indexed = text_database_->AddPageData(i->url(), url_id, 0, i->last_visit(), i->title(), string16()); } // Sync code manages the visits itself. if (visit_source != SOURCE_SYNCED) { // Make up a visit to correspond to the last visit to the page. VisitRow visit_info(url_id, i->last_visit(), 0, content::PageTransitionFromInt( content::PAGE_TRANSITION_LINK | content::PAGE_TRANSITION_CHAIN_START | content::PAGE_TRANSITION_CHAIN_END), 0); visit_info.is_indexed = has_indexed; if (!visit_database->AddVisit(&visit_info, visit_source)) { NOTREACHED() << "Adding visit failed."; return; } NotifyVisitObservers(visit_info); if (visit_info.visit_time < first_recorded_time_) first_recorded_time_ = visit_info.visit_time; } } // Broadcast a notification for typed URLs that have been modified. This // will be picked up by the in-memory URL database on the main thread. // // TODO(brettw) bug 1140015: Add an "add page" notification so the history // views can keep in sync. BroadcastNotifications(chrome::NOTIFICATION_HISTORY_URLS_MODIFIED, modified.release()); ScheduleCommit(); } bool HistoryBackend::IsExpiredVisitTime(const base::Time& time) { return time < expirer_.GetCurrentArchiveTime(); } void HistoryBackend::SetPageTitle(const GURL& url, const string16& title) { if (!db_.get()) return; // Update the full text index. if (text_database_.get()) text_database_->AddPageTitle(url, title); // Search for recent redirects which should get the same title. We make a // dummy list containing the exact URL visited if there are no redirects so // the processing below can be the same. history::RedirectList dummy_list; history::RedirectList* redirects; RedirectCache::iterator iter = recent_redirects_.Get(url); if (iter != recent_redirects_.end()) { redirects = &iter->second; // This redirect chain should have the destination URL as the last item. DCHECK(!redirects->empty()); DCHECK(redirects->back() == url); } else { // No redirect chain stored, make up one containing the URL we want so we // can use the same logic below. dummy_list.push_back(url); redirects = &dummy_list; } scoped_ptr details(new URLsModifiedDetails); for (size_t i = 0; i < redirects->size(); i++) { URLRow row; URLID row_id = db_->GetRowForURL(redirects->at(i), &row); if (row_id && row.title() != title) { row.set_title(title); db_->UpdateURLRow(row_id, row); details->changed_urls.push_back(row); } } // Broadcast notifications for any URLs that have changed. This will // update the in-memory database and the InMemoryURLIndex. if (!details->changed_urls.empty()) { BroadcastNotifications(chrome::NOTIFICATION_HISTORY_URLS_MODIFIED, details.release()); ScheduleCommit(); } } void HistoryBackend::AddPageNoVisitForBookmark(const GURL& url, const string16& title) { if (!db_.get()) return; URLRow url_info(url); URLID url_id = db_->GetRowForURL(url, &url_info); if (url_id) { // URL is already known, nothing to do. return; } if (!title.empty()) { url_info.set_title(title); } else { url_info.set_title(UTF8ToUTF16(url.spec())); } url_info.set_last_visit(Time::Now()); // Mark the page hidden. If the user types it in, it'll unhide. url_info.set_hidden(true); db_->AddURL(url_info); } void HistoryBackend::IterateURLs( const scoped_refptr& iterator) { if (db_.get()) { HistoryDatabase::URLEnumerator e; if (db_->InitURLEnumeratorForEverything(&e)) { URLRow info; while (e.GetNextURL(&info)) { iterator->OnURL(info.url()); } iterator->OnComplete(true); // Success. return; } } iterator->OnComplete(false); // Failure. } bool HistoryBackend::GetAllTypedURLs(URLRows* urls) { if (db_.get()) return db_->GetAllTypedUrls(urls); return false; } bool HistoryBackend::GetVisitsForURL(URLID id, VisitVector* visits) { if (db_.get()) return db_->GetVisitsForURL(id, visits); return false; } bool HistoryBackend::GetMostRecentVisitsForURL(URLID id, int max_visits, VisitVector* visits) { if (db_.get()) return db_->GetMostRecentVisitsForURL(id, max_visits, visits); return false; } bool HistoryBackend::UpdateURL(URLID id, const history::URLRow& url) { if (db_.get()) return db_->UpdateURLRow(id, url); return false; } bool HistoryBackend::AddVisits(const GURL& url, const std::vector& visits, VisitSource visit_source) { if (db_.get()) { for (std::vector::const_iterator visit = visits.begin(); visit != visits.end(); ++visit) { if (!AddPageVisit( url, visit->first, 0, visit->second, visit_source).first) { return false; } } ScheduleCommit(); return true; } return false; } bool HistoryBackend::RemoveVisits(const VisitVector& visits) { if (!db_.get()) return false; expirer_.ExpireVisits(visits); ScheduleCommit(); return true; } bool HistoryBackend::GetVisitsSource(const VisitVector& visits, VisitSourceMap* sources) { if (!db_.get()) return false; db_->GetVisitsSource(visits, sources); return true; } bool HistoryBackend::GetURL(const GURL& url, history::URLRow* url_row) { if (db_.get()) return db_->GetRowForURL(url, url_row) != 0; return false; } void HistoryBackend::QueryURL(scoped_refptr request, const GURL& url, bool want_visits) { if (request->canceled()) return; bool success = false; URLRow* row = &request->value.a; VisitVector* visits = &request->value.b; if (db_.get()) { if (db_->GetRowForURL(url, row)) { // Have a row. success = true; // Optionally query the visits. if (want_visits) db_->GetVisitsForURL(row->id(), visits); } } request->ForwardResult(request->handle(), success, row, visits); } // Segment usage --------------------------------------------------------------- void HistoryBackend::DeleteOldSegmentData() { if (db_.get()) db_->DeleteSegmentData(Time::Now() - TimeDelta::FromDays(kSegmentDataRetention)); } void HistoryBackend::SetSegmentPresentationIndex(SegmentID segment_id, int index) { if (db_.get()) db_->SetSegmentPresentationIndex(segment_id, index); } void HistoryBackend::QuerySegmentUsage( scoped_refptr request, const Time from_time, int max_result_count) { if (request->canceled()) return; if (db_.get()) { db_->QuerySegmentUsage(from_time, max_result_count, &request->value.get()); // If this is the first time we query segments, invoke // DeleteOldSegmentData asynchronously. We do this to cleanup old // entries. if (!segment_queried_) { segment_queried_ = true; MessageLoop::current()->PostTask( FROM_HERE, base::Bind(&HistoryBackend::DeleteOldSegmentData, this)); } } request->ForwardResult(request->handle(), &request->value.get()); } // Keyword visits -------------------------------------------------------------- void HistoryBackend::SetKeywordSearchTermsForURL(const GURL& url, TemplateURLID keyword_id, const string16& term) { if (!db_.get()) return; // Get the ID for this URL. URLRow url_row; if (!db_->GetRowForURL(url, &url_row)) { // There is a small possibility the url was deleted before the keyword // was added. Ignore the request. return; } db_->SetKeywordSearchTermsForURL(url_row.id(), keyword_id, term); // details is deleted by BroadcastNotifications. KeywordSearchTermDetails* details = new KeywordSearchTermDetails; details->url = url; details->keyword_id = keyword_id; details->term = term; BroadcastNotifications( chrome::NOTIFICATION_HISTORY_KEYWORD_SEARCH_TERM_UPDATED, details); ScheduleCommit(); } void HistoryBackend::DeleteAllSearchTermsForKeyword( TemplateURLID keyword_id) { if (!db_.get()) return; db_->DeleteAllSearchTermsForKeyword(keyword_id); // TODO(sky): bug 1168470. Need to move from archive dbs too. ScheduleCommit(); } void HistoryBackend::GetMostRecentKeywordSearchTerms( scoped_refptr request, TemplateURLID keyword_id, const string16& prefix, int max_count) { if (request->canceled()) return; if (db_.get()) { db_->GetMostRecentKeywordSearchTerms(keyword_id, prefix, max_count, &(request->value)); } request->ForwardResult(request->handle(), &request->value); } // Downloads ------------------------------------------------------------------- void HistoryBackend::GetNextDownloadId(int* id) { if (db_.get()) *id = db_->next_download_id(); } // Get all the download entries from the database. void HistoryBackend::QueryDownloads(std::vector* rows) { if (db_.get()) db_->QueryDownloads(rows); } // Clean up entries that has been corrupted (because of the crash, for example). void HistoryBackend::CleanUpInProgressEntries() { // If some "in progress" entries were not updated when Chrome exited, they // need to be cleaned up. if (db_.get()) db_->CleanUpInProgressEntries(); } // Update a particular download entry. void HistoryBackend::UpdateDownload(const history::DownloadRow& data) { if (db_.get()) db_->UpdateDownload(data); } void HistoryBackend::CreateDownload(const history::DownloadRow& history_info, int64* db_handle) { if (db_.get()) *db_handle = db_->CreateDownload(history_info); } void HistoryBackend::RemoveDownloads(const std::set& handles) { if (!db_.get()) return; int downloads_count_before = db_->CountDownloads(); base::TimeTicks started_removing = base::TimeTicks::Now(); // HistoryBackend uses a long-running Transaction that is committed // periodically, so this loop doesn't actually hit the disk too hard. for (std::set::const_iterator it = handles.begin(); it != handles.end(); ++it) { db_->RemoveDownload(*it); } base::TimeTicks finished_removing = base::TimeTicks::Now(); int downloads_count_after = db_->CountDownloads(); int num_downloads_deleted = downloads_count_before - downloads_count_after; if (num_downloads_deleted >= 0) { UMA_HISTOGRAM_COUNTS("Download.DatabaseRemoveDownloadsCount", num_downloads_deleted); base::TimeDelta micros = (1000 * (finished_removing - started_removing)); UMA_HISTOGRAM_TIMES("Download.DatabaseRemoveDownloadsTime", micros); if (num_downloads_deleted > 0) { UMA_HISTOGRAM_TIMES("Download.DatabaseRemoveDownloadsTimePerRecord", (1000 * micros) / num_downloads_deleted); } } int num_downloads_not_deleted = handles.size() - num_downloads_deleted; if (num_downloads_not_deleted >= 0) { UMA_HISTOGRAM_COUNTS("Download.DatabaseRemoveDownloadsCountNotRemoved", num_downloads_not_deleted); } } void HistoryBackend::QueryHistory(scoped_refptr request, const string16& text_query, const QueryOptions& options) { if (request->canceled()) return; TimeTicks beginning_time = TimeTicks::Now(); if (db_.get()) { if (text_query.empty()) { // Basic history query for the main database. QueryHistoryBasic(db_.get(), db_.get(), options, &request->value); // Now query the archived database. This is a bit tricky because we don't // want to query it if the queried time range isn't going to find anything // in it. // TODO(brettw) bug 1171036: do blimpie querying for the archived database // as well. // if (archived_db_.get() && // expirer_.GetCurrentArchiveTime() - TimeDelta::FromDays(7)) { } else { // Full text history query. QueryHistoryFTS(text_query, options, &request->value); } } request->ForwardResult(request->handle(), &request->value); UMA_HISTOGRAM_TIMES("History.QueryHistory", TimeTicks::Now() - beginning_time); } // Basic time-based querying of history. void HistoryBackend::QueryHistoryBasic(URLDatabase* url_db, VisitDatabase* visit_db, const QueryOptions& options, QueryResults* result) { // First get all visits. VisitVector visits; bool has_more_results = visit_db->GetVisibleVisitsInRange(options, &visits); DCHECK(static_cast(visits.size()) <= options.EffectiveMaxCount()); // Now add them and the URL rows to the results. URLResult url_result; QueryCursor cursor; for (size_t i = 0; i < visits.size(); i++) { const VisitRow visit = visits[i]; // Add a result row for this visit, get the URL info from the DB. if (!url_db->GetURLRow(visit.url_id, &url_result)) { VLOG(0) << "Failed to get id " << visit.url_id << " from history.urls."; continue; // DB out of sync and URL doesn't exist, try to recover. } if (!url_result.url().is_valid()) { VLOG(0) << "Got invalid URL from history.urls with id " << visit.url_id << ": " << url_result.url().possibly_invalid_spec(); continue; // Don't report invalid URLs in case of corruption. } // The archived database may be out of sync with respect to starring, // titles, last visit date, etc. Therefore, we query the main DB if the // current URL database is not the main one. if (url_db == db_.get()) { // Currently querying the archived DB, update with the main database to // catch any interesting stuff. This will update it if it exists in the // main DB, and do nothing otherwise. db_->GetRowForURL(url_result.url(), &url_result); } url_result.set_visit_time(visit.visit_time); // We don't set any of the query-specific parts of the URLResult, since // snippets and stuff don't apply to basic querying. result->AppendURLBySwapping(&url_result); cursor.rowid_ = visit.visit_id; cursor.time_ = visit.visit_time; } result->set_cursor(cursor); if (!has_more_results && options.begin_time <= first_recorded_time_) result->set_reached_beginning(true); } void HistoryBackend::QueryHistoryFTS(const string16& text_query, const QueryOptions& options, QueryResults* result) { if (!text_database_.get()) return; // Full text query, first get all the FTS results in the time range. std::vector fts_matches; Time first_time_searched; text_database_->GetTextMatches(text_query, options, &fts_matches, &first_time_searched); URLQuerier querier(db_.get(), archived_db_.get(), true); // Now get the row and visit information for each one. URLResult url_result; // Declare outside loop to prevent re-construction. QueryCursor cursor; for (size_t i = 0; i < fts_matches.size(); i++) { if (options.max_count != 0 && static_cast(result->size()) >= options.max_count) break; // Got too many items. // Get the URL, querying the main and archived databases as necessary. If // this is not found, the history and full text search databases are out // of sync and we give up with this result. if (!querier.GetRowForURL(fts_matches[i].url, &url_result)) continue; if (!url_result.url().is_valid()) continue; // Don't report invalid URLs in case of corruption. // Copy over the FTS stuff that the URLDatabase doesn't know about. // We do this with swap() to avoid copying, since we know we don't // need the original any more. Note that we override the title with the // one from FTS, since that will match the title_match_positions (the // FTS title and the history DB title may differ). url_result.set_title(fts_matches[i].title); url_result.title_match_positions_.swap( fts_matches[i].title_match_positions); url_result.snippet_.Swap(&fts_matches[i].snippet); // The visit time also comes from the full text search database. Since it // has the time, we can avoid an extra query of the visits table. url_result.set_visit_time(fts_matches[i].time); // Add it to the vector, this will clear our |url_row| object as a // result of the swap. result->AppendURLBySwapping(&url_result); cursor.rowid_ = fts_matches[i].rowid; cursor.time_ = fts_matches[i].time; } result->set_cursor(cursor); if (first_time_searched <= first_recorded_time_) result->set_reached_beginning(true); } // Frontend to GetMostRecentRedirectsFrom from the history thread. void HistoryBackend::QueryRedirectsFrom( scoped_refptr request, const GURL& url) { if (request->canceled()) return; bool success = GetMostRecentRedirectsFrom(url, &request->value); request->ForwardResult(request->handle(), url, success, &request->value); } void HistoryBackend::QueryRedirectsTo( scoped_refptr request, const GURL& url) { if (request->canceled()) return; bool success = GetMostRecentRedirectsTo(url, &request->value); request->ForwardResult(request->handle(), url, success, &request->value); } void HistoryBackend::GetVisibleVisitCountToHost( scoped_refptr request, const GURL& url) { if (request->canceled()) return; int count = 0; Time first_visit; const bool success = db_.get() && db_->GetVisibleVisitCountToHost(url, &count, &first_visit); request->ForwardResult(request->handle(), success, count, first_visit); } void HistoryBackend::QueryTopURLsAndRedirects( scoped_refptr request, int result_count) { if (request->canceled()) return; if (!db_.get()) { request->ForwardResult(request->handle(), false, NULL, NULL); return; } std::vector* top_urls = &request->value.a; history::RedirectMap* redirects = &request->value.b; ScopedVector data; db_->QuerySegmentUsage(base::Time::Now() - base::TimeDelta::FromDays(90), result_count, &data.get()); for (size_t i = 0; i < data.size(); ++i) { top_urls->push_back(data[i]->GetURL()); RefCountedVector* list = new RefCountedVector; GetMostRecentRedirectsFrom(top_urls->back(), &list->data); (*redirects)[top_urls->back()] = list; } request->ForwardResult(request->handle(), true, top_urls, redirects); } // Will replace QueryTopURLsAndRedirectsRequest. void HistoryBackend::QueryMostVisitedURLs( scoped_refptr request, int result_count, int days_back) { if (request->canceled()) return; if (!db_.get()) { // No History Database - return an empty list. request->ForwardResult(request->handle(), MostVisitedURLList()); return; } MostVisitedURLList* result = &request->value; QueryMostVisitedURLsImpl(result_count, days_back, result); request->ForwardResult(request->handle(), *result); } void HistoryBackend::QueryFilteredURLs( scoped_refptr request, int result_count, const history::VisitFilter& filter, bool extended_info) { if (request->canceled()) return; base::Time request_start = base::Time::Now(); if (!db_.get()) { // No History Database - return an empty list. request->ForwardResult(request->handle(), FilteredURLList()); return; } VisitVector visits; db_->GetDirectVisitsDuringTimes(filter, 0, &visits); std::map score_map; for (size_t i = 0; i < visits.size(); ++i) { score_map[visits[i].url_id] += filter.GetVisitScore(visits[i]); } // TODO(georgey): experiment with visit_segment database granularity (it is // currently 24 hours) to use it directly instead of using visits database, // which is considerably slower. ScopedVector data; data.reserve(score_map.size()); for (std::map::iterator it = score_map.begin(); it != score_map.end(); ++it) { PageUsageData* pud = new PageUsageData(it->first); pud->SetScore(it->second); data.push_back(pud); } // Limit to the top |result_count| results. std::sort(data.begin(), data.end(), PageUsageData::Predicate); if (result_count && implicit_cast(data.size()) > result_count) data.resize(result_count); for (size_t i = 0; i < data.size(); ++i) { URLRow info; if (db_->GetURLRow(data[i]->GetID(), &info)) { data[i]->SetURL(info.url()); data[i]->SetTitle(info.title()); } } FilteredURLList& result = request->value; for (size_t i = 0; i < data.size(); ++i) { PageUsageData* current_data = data[i]; FilteredURL url(*current_data); if (extended_info) { VisitVector visits; db_->GetVisitsForURL(current_data->GetID(), &visits); if (visits.size() > 0) { url.extended_info.total_visits = visits.size(); for (size_t i = 0; i < visits.size(); ++i) { url.extended_info.duration_opened += visits[i].visit_duration.InSeconds(); if (visits[i].visit_time > url.extended_info.last_visit_time) { url.extended_info.last_visit_time = visits[i].visit_time; } } // TODO(macourteau): implement the url.extended_info.visits stat. } } result.push_back(url); } int delta_time = std::max(1, std::min(999, static_cast((base::Time::Now() - request_start).InMilliseconds()))); STATIC_HISTOGRAM_POINTER_BLOCK( "NewTabPage.SuggestedSitesLoadTime", Add(delta_time), base::LinearHistogram::FactoryGet("NewTabPage.SuggestedSitesLoadTime", 1, 1000, 100, base::Histogram::kUmaTargetedHistogramFlag)); request->ForwardResult(request->handle(), result); } void HistoryBackend::QueryMostVisitedURLsImpl(int result_count, int days_back, MostVisitedURLList* result) { if (!db_.get()) return; ScopedVector data; db_->QuerySegmentUsage(base::Time::Now() - base::TimeDelta::FromDays(days_back), result_count, &data.get()); for (size_t i = 0; i < data.size(); ++i) { PageUsageData* current_data = data[i]; RedirectList redirects; GetMostRecentRedirectsFrom(current_data->GetURL(), &redirects); MostVisitedURL url = MakeMostVisitedURL(*current_data, redirects); result->push_back(url); } } void HistoryBackend::GetRedirectsFromSpecificVisit( VisitID cur_visit, history::RedirectList* redirects) { // Follow any redirects from the given visit and add them to the list. // It *should* be impossible to get a circular chain here, but we check // just in case to avoid infinite loops. GURL cur_url; std::set visit_set; visit_set.insert(cur_visit); while (db_->GetRedirectFromVisit(cur_visit, &cur_visit, &cur_url)) { if (visit_set.find(cur_visit) != visit_set.end()) { NOTREACHED() << "Loop in visit chain, giving up"; return; } visit_set.insert(cur_visit); redirects->push_back(cur_url); } } void HistoryBackend::GetRedirectsToSpecificVisit( VisitID cur_visit, history::RedirectList* redirects) { // Follow redirects going to cur_visit. These are added to |redirects| in // the order they are found. If a redirect chain looks like A -> B -> C and // |cur_visit| = C, redirects will be {B, A} in that order. if (!db_.get()) return; GURL cur_url; std::set visit_set; visit_set.insert(cur_visit); while (db_->GetRedirectToVisit(cur_visit, &cur_visit, &cur_url)) { if (visit_set.find(cur_visit) != visit_set.end()) { NOTREACHED() << "Loop in visit chain, giving up"; return; } visit_set.insert(cur_visit); redirects->push_back(cur_url); } } bool HistoryBackend::GetMostRecentRedirectsFrom( const GURL& from_url, history::RedirectList* redirects) { redirects->clear(); if (!db_.get()) return false; URLID from_url_id = db_->GetRowForURL(from_url, NULL); VisitID cur_visit = db_->GetMostRecentVisitForURL(from_url_id, NULL); if (!cur_visit) return false; // No visits for URL. GetRedirectsFromSpecificVisit(cur_visit, redirects); return true; } bool HistoryBackend::GetMostRecentRedirectsTo( const GURL& to_url, history::RedirectList* redirects) { redirects->clear(); if (!db_.get()) return false; URLID to_url_id = db_->GetRowForURL(to_url, NULL); VisitID cur_visit = db_->GetMostRecentVisitForURL(to_url_id, NULL); if (!cur_visit) return false; // No visits for URL. GetRedirectsToSpecificVisit(cur_visit, redirects); return true; } void HistoryBackend::ScheduleAutocomplete(HistoryURLProvider* provider, HistoryURLProviderParams* params) { // ExecuteWithDB should handle the NULL database case. provider->ExecuteWithDB(this, db_.get(), params); } void HistoryBackend::SetPageContents(const GURL& url, const string16& contents) { // This is histogrammed in the text database manager. if (!text_database_.get()) return; text_database_->AddPageContents(url, contents); } void HistoryBackend::SetPageThumbnail( const GURL& url, const gfx::Image* thumbnail, const ThumbnailScore& score) { if (!db_.get() || !thumbnail_db_.get()) return; URLRow url_row; URLID url_id = db_->GetRowForURL(url, &url_row); if (url_id) { thumbnail_db_->SetPageThumbnail(url, url_id, thumbnail, score, url_row.last_visit()); } ScheduleCommit(); } void HistoryBackend::GetPageThumbnail( scoped_refptr request, const GURL& page_url) { if (request->canceled()) return; scoped_refptr data; GetPageThumbnailDirectly(page_url, &data); request->ForwardResult(request->handle(), data); } void HistoryBackend::GetPageThumbnailDirectly( const GURL& page_url, scoped_refptr* data) { if (thumbnail_db_.get()) { *data = new base::RefCountedBytes; // Time the result. TimeTicks beginning_time = TimeTicks::Now(); history::RedirectList redirects; URLID url_id; bool success = false; // If there are some redirects, try to get a thumbnail from the last // redirect destination. if (GetMostRecentRedirectsFrom(page_url, &redirects) && !redirects.empty()) { if ((url_id = db_->GetRowForURL(redirects.back(), NULL))) success = thumbnail_db_->GetPageThumbnail(url_id, &(*data)->data()); } // If we don't have a thumbnail from redirects, try the URL directly. if (!success) { if ((url_id = db_->GetRowForURL(page_url, NULL))) success = thumbnail_db_->GetPageThumbnail(url_id, &(*data)->data()); } // In this rare case, we start to mine the older redirect sessions // from the visit table to try to find a thumbnail. if (!success) { success = GetThumbnailFromOlderRedirect(page_url, &(*data)->data()); } if (!success) *data = NULL; // This will tell the callback there was an error. UMA_HISTOGRAM_TIMES("History.GetPageThumbnail", TimeTicks::Now() - beginning_time); } } void HistoryBackend::MigrateThumbnailsDatabase() { // If there is no History DB, we can't record that the migration was done. // It will be recorded on the next run. if (db_.get()) { // If there is no thumbnail DB, we can still record a successful migration. if (thumbnail_db_.get()) { thumbnail_db_->RenameAndDropThumbnails(GetThumbnailFileName(), GetFaviconsFileName()); } db_->ThumbnailMigrationDone(); } } bool HistoryBackend::GetThumbnailFromOlderRedirect( const GURL& page_url, std::vector* data) { // Look at a few previous visit sessions. VisitVector older_sessions; URLID page_url_id = db_->GetRowForURL(page_url, NULL); static const int kVisitsToSearchForThumbnail = 4; db_->GetMostRecentVisitsForURL( page_url_id, kVisitsToSearchForThumbnail, &older_sessions); // Iterate across all those previous visits, and see if any of the // final destinations of those redirect chains have a good thumbnail // for us. bool success = false; for (VisitVector::const_iterator it = older_sessions.begin(); !success && it != older_sessions.end(); ++it) { history::RedirectList redirects; if (it->visit_id) { GetRedirectsFromSpecificVisit(it->visit_id, &redirects); if (!redirects.empty()) { URLID url_id; if ((url_id = db_->GetRowForURL(redirects.back(), NULL))) success = thumbnail_db_->GetPageThumbnail(url_id, data); } } } return success; } void HistoryBackend::GetFavicons( const std::vector& icon_urls, int icon_types, int desired_size_in_dip, const std::vector& desired_scale_factors, std::vector* bitmap_results) { UpdateFaviconMappingsAndFetchImpl(NULL, icon_urls, icon_types, desired_size_in_dip, desired_scale_factors, bitmap_results); } void HistoryBackend::GetFaviconsForURL( const GURL& page_url, int icon_types, int desired_size_in_dip, const std::vector& desired_scale_factors, std::vector* bitmap_results) { DCHECK(bitmap_results); GetFaviconsFromDB(page_url, icon_types, desired_size_in_dip, desired_scale_factors, bitmap_results); } void HistoryBackend::GetFaviconForID( FaviconID favicon_id, int desired_size_in_dip, ui::ScaleFactor desired_scale_factor, std::vector* bitmap_results) { std::vector favicon_ids; favicon_ids.push_back(favicon_id); std::vector desired_scale_factors; desired_scale_factors.push_back(desired_scale_factor); // Get results from DB. GetFaviconBitmapResultsForBestMatch(favicon_ids, desired_size_in_dip, desired_scale_factors, bitmap_results); } void HistoryBackend::UpdateFaviconMappingsAndFetch( const GURL& page_url, const std::vector& icon_urls, int icon_types, int desired_size_in_dip, const std::vector& desired_scale_factors, std::vector* bitmap_results) { UpdateFaviconMappingsAndFetchImpl(&page_url, icon_urls, icon_types, desired_size_in_dip, desired_scale_factors, bitmap_results); } void HistoryBackend::MergeFavicon( const GURL& page_url, const GURL& icon_url, history::IconType icon_type, scoped_refptr bitmap_data, const gfx::Size& pixel_size) { if (!thumbnail_db_.get() || !db_.get()) return; FaviconID favicon_id = thumbnail_db_->GetFaviconIDForFaviconURL(icon_url, icon_type, NULL); if (!favicon_id) { // There is no favicon at |icon_url|, create it. favicon_id = thumbnail_db_->AddFavicon(icon_url, icon_type, GetDefaultFaviconSizes()); } std::vector bitmap_id_sizes; thumbnail_db_->GetFaviconBitmapIDSizes(favicon_id, &bitmap_id_sizes); // If there is already a favicon bitmap of |pixel_size| at |icon_url|, // replace it. bool replaced_bitmap = false; for (size_t i = 0; i < bitmap_id_sizes.size(); ++i) { if (bitmap_id_sizes[i].pixel_size == pixel_size) { if (IsFaviconBitmapDataEqual(bitmap_id_sizes[i].bitmap_id, bitmap_data)) { thumbnail_db_->SetFaviconBitmapLastUpdateTime( bitmap_id_sizes[i].bitmap_id, base::Time::Now()); // Return early as merging did not alter the bitmap data. ScheduleCommit(); return; } thumbnail_db_->SetFaviconBitmap(bitmap_id_sizes[i].bitmap_id, bitmap_data, base::Time::Now()); replaced_bitmap = true; break; } } // Create a vector of the pixel sizes of the favicon bitmaps currently at // |icon_url|. std::vector favicon_sizes; for (size_t i = 0; i < bitmap_id_sizes.size(); ++i) favicon_sizes.push_back(bitmap_id_sizes[i].pixel_size); if (!replaced_bitmap) { // Set the preexisting favicon bitmaps as expired as the preexisting favicon // bitmaps are not consistent with the merged in data. thumbnail_db_->SetFaviconOutOfDate(favicon_id); // Delete an arbitrary favicon bitmap to avoid going over the limit of // |kMaxFaviconBitmapsPerIconURL|. if (bitmap_id_sizes.size() >= kMaxFaviconBitmapsPerIconURL) { thumbnail_db_->DeleteFaviconBitmap(bitmap_id_sizes[0].bitmap_id); favicon_sizes.erase(favicon_sizes.begin()); } thumbnail_db_->AddFaviconBitmap(favicon_id, bitmap_data, base::Time::Now(), pixel_size); favicon_sizes.push_back(pixel_size); } // A site may have changed the favicons that it uses for |page_url|. // Example Scenario: // page_url = news.google.com // Intial State: www.google.com/favicon.ico 16x16, 32x32 // MergeFavicon(news.google.com, news.google.com/news_specific.ico, ..., // ..., 16x16) // // Difficulties: // 1. Sync requires that a call to GetFaviconsForURL() returns the // |bitmap_data| passed into MergeFavicon(). // - It is invalid for the 16x16 bitmap for www.google.com/favicon.ico to // stay mapped to news.google.com because it would be unclear which 16x16 // bitmap should be returned via GetFaviconsForURL(). // // 2. www.google.com/favicon.ico may be mapped to more than just // news.google.com (eg www.google.com). // - The 16x16 bitmap cannot be deleted from www.google.com/favicon.ico // // To resolve these problems, we copy all of the favicon bitmaps previously // mapped to news.google.com (|page_url|) and add them to the favicon at // news.google.com/news_specific.ico (|icon_url|). The favicon sizes for // |icon_url| are set to default to indicate that |icon_url| has incomplete // / incorrect data. // Difficlty 1: All but news.google.com/news_specific.ico are unmapped from // news.google.com // Difficulty 2: The favicon bitmaps for www.google.com/favicon.ico are not // modified. std::vector icon_mappings; thumbnail_db_->GetIconMappingsForPageURL(page_url, icon_type, &icon_mappings); // Copy the favicon bitmaps mapped to |page_url| to the favicon at |icon_url| // till the limit of |kMaxFaviconBitmapsPerIconURL| is reached. bool migrated_bitmaps = false; for (size_t i = 0; i < icon_mappings.size(); ++i) { if (favicon_sizes.size() >= kMaxFaviconBitmapsPerIconURL) break; if (icon_mappings[i].icon_url == icon_url) continue; std::vector bitmaps_to_copy; thumbnail_db_->GetFaviconBitmaps(icon_mappings[i].icon_id, &bitmaps_to_copy); for (size_t j = 0; j < bitmaps_to_copy.size(); ++j) { // Do not add a favicon bitmap at a pixel size for which there is already // a favicon bitmap mapped to |icon_url|. The one there is more correct // and having multiple equally sized favicon bitmaps for |page_url| is // ambiguous in terms of GetFaviconsForURL(). std::vector::iterator it = std::find(favicon_sizes.begin(), favicon_sizes.end(), bitmaps_to_copy[j].pixel_size); if (it != favicon_sizes.end()) continue; migrated_bitmaps = true; // Add the favicon bitmap as expired as it is not consistent with the // merged in data. thumbnail_db_->AddFaviconBitmap(favicon_id, bitmaps_to_copy[j].bitmap_data, base::Time(), bitmaps_to_copy[j].pixel_size); favicon_sizes.push_back(bitmaps_to_copy[j].pixel_size); if (favicon_sizes.size() >= kMaxFaviconBitmapsPerIconURL) break; } } // Update the favicon mappings such that only |icon_url| is mapped to // |page_url|. if (icon_mappings.size() != 1 || icon_mappings[0].icon_url != icon_url) { std::vector favicon_ids; favicon_ids.push_back(favicon_id); SetFaviconMappingsForPageAndRedirects(page_url, icon_type, favicon_ids); } // Sync currently does not properly deal with notifications as a result of // replacing a favicon bitmap. For M25, do not send any notifications if a // bitmap was replaced and no bitmaps were added or deleted. This is a // temporary fix for http://crbug.com/169460. if (migrated_bitmaps || !replaced_bitmap) SendFaviconChangedNotificationForPageAndRedirects(page_url); ScheduleCommit(); } void HistoryBackend::SetFavicons( const GURL& page_url, IconType icon_type, const std::vector& favicon_bitmap_data) { if (!thumbnail_db_.get() || !db_.get()) return; DCHECK(ValidateSetFaviconsParams(favicon_bitmap_data)); // Build map of FaviconBitmapData for each icon url. typedef std::map > BitmapDataByIconURL; BitmapDataByIconURL grouped_by_icon_url; for (size_t i = 0; i < favicon_bitmap_data.size(); ++i) { const GURL& icon_url = favicon_bitmap_data[i].icon_url; grouped_by_icon_url[icon_url].push_back(favicon_bitmap_data[i]); } // Track whether the method modifies or creates any favicon bitmaps, favicons // or icon mappings. bool data_modified = false; std::vector icon_ids; for (BitmapDataByIconURL::const_iterator it = grouped_by_icon_url.begin(); it != grouped_by_icon_url.end(); ++it) { const GURL& icon_url = it->first; FaviconID icon_id = thumbnail_db_->GetFaviconIDForFaviconURL(icon_url, icon_type, NULL); if (!icon_id) { // TODO(pkotwicz): Remove the favicon sizes attribute from // ThumbnailDatabase::AddFavicon(). icon_id = thumbnail_db_->AddFavicon(icon_url, icon_type, GetDefaultFaviconSizes()); data_modified = true; } icon_ids.push_back(icon_id); if (!data_modified) SetFaviconBitmaps(icon_id, it->second, &data_modified); else SetFaviconBitmaps(icon_id, it->second, NULL); } data_modified |= SetFaviconMappingsForPageAndRedirects(page_url, icon_type, icon_ids); if (data_modified) { // Send notification to the UI as an icon mapping, favicon, or favicon // bitmap was changed by this function. SendFaviconChangedNotificationForPageAndRedirects(page_url); } ScheduleCommit(); } void HistoryBackend::SetFaviconsOutOfDateForPage(const GURL& page_url) { std::vector icon_mappings; if (!thumbnail_db_.get() || !thumbnail_db_->GetIconMappingsForPageURL(page_url, &icon_mappings)) return; for (std::vector::iterator m = icon_mappings.begin(); m != icon_mappings.end(); ++m) { thumbnail_db_->SetFaviconOutOfDate(m->icon_id); } ScheduleCommit(); } void HistoryBackend::CloneFavicons(const GURL& old_page_url, const GURL& new_page_url) { if (!thumbnail_db_.get()) return; // Prevent cross-domain cloning. if (old_page_url.GetOrigin() != new_page_url.GetOrigin()) return; thumbnail_db_->CloneIconMappings(old_page_url, new_page_url); ScheduleCommit(); } void HistoryBackend::SetImportedFavicons( const std::vector& favicon_usage) { if (!db_.get() || !thumbnail_db_.get()) return; Time now = Time::Now(); // Track all URLs that had their favicons set or updated. std::set favicons_changed; for (size_t i = 0; i < favicon_usage.size(); i++) { FaviconID favicon_id = thumbnail_db_->GetFaviconIDForFaviconURL( favicon_usage[i].favicon_url, history::FAVICON, NULL); if (!favicon_id) { // This favicon doesn't exist yet, so we create it using the given data. // TODO(pkotwicz): Pass in real pixel size. favicon_id = thumbnail_db_->AddFavicon( favicon_usage[i].favicon_url, history::FAVICON, GetDefaultFaviconSizes(), new base::RefCountedBytes(favicon_usage[i].png_data), now, gfx::Size()); } // Save the mapping from all the URLs to the favicon. BookmarkService* bookmark_service = GetBookmarkService(); for (std::set::const_iterator url = favicon_usage[i].urls.begin(); url != favicon_usage[i].urls.end(); ++url) { URLRow url_row; if (!db_->GetRowForURL(*url, &url_row)) { // If the URL is present as a bookmark, add the url in history to // save the favicon mapping. This will match with what history db does // for regular bookmarked URLs with favicons - when history db is // cleaned, we keep an entry in the db with 0 visits as long as that // url is bookmarked. if (bookmark_service && bookmark_service_->IsBookmarked(*url)) { URLRow url_info(*url); url_info.set_visit_count(0); url_info.set_typed_count(0); url_info.set_last_visit(base::Time()); url_info.set_hidden(false); db_->AddURL(url_info); thumbnail_db_->AddIconMapping(*url, favicon_id); favicons_changed.insert(*url); } } else { if (!thumbnail_db_->GetIconMappingsForPageURL(*url, FAVICON, NULL)) { // URL is present in history, update the favicon *only* if it is not // set already. thumbnail_db_->AddIconMapping(*url, favicon_id); favicons_changed.insert(*url); } } } } if (!favicons_changed.empty()) { // Send the notification about the changed favicon URLs. FaviconChangeDetails* changed_details = new FaviconChangeDetails; changed_details->urls.swap(favicons_changed); BroadcastNotifications(chrome::NOTIFICATION_FAVICON_CHANGED, changed_details); } } void HistoryBackend::UpdateFaviconMappingsAndFetchImpl( const GURL* page_url, const std::vector& icon_urls, int icon_types, int desired_size_in_dip, const std::vector& desired_scale_factors, std::vector* bitmap_results) { // If |page_url| is specified, |icon_types| must be either a single icon // type or icon types which are equivalent. DCHECK(!page_url || icon_types == FAVICON || icon_types == TOUCH_ICON || icon_types == TOUCH_PRECOMPOSED_ICON || icon_types == (TOUCH_ICON | TOUCH_PRECOMPOSED_ICON)); bitmap_results->clear(); if (!thumbnail_db_.get()) { return; } std::vector favicon_ids; // The icon type for which the mappings will the updated and data will be // returned. IconType selected_icon_type = INVALID_ICON; for (size_t i = 0; i < icon_urls.size(); ++i) { const GURL& icon_url = icon_urls[i]; IconType icon_type_out; const FaviconID favicon_id = thumbnail_db_->GetFaviconIDForFaviconURL( icon_url, icon_types, &icon_type_out); if (favicon_id) { // Return and update icon mappings only for the largest icon type. As // |icon_urls| is not sorted in terms of icon type, clear |favicon_ids| // if an |icon_url| with a larger icon type is found. if (icon_type_out > selected_icon_type) { selected_icon_type = icon_type_out; favicon_ids.clear(); } if (icon_type_out == selected_icon_type) favicon_ids.push_back(favicon_id); } } if (page_url && !favicon_ids.empty()) { bool mappings_updated = SetFaviconMappingsForPageAndRedirects(*page_url, selected_icon_type, favicon_ids); if (mappings_updated) { SendFaviconChangedNotificationForPageAndRedirects(*page_url); ScheduleCommit(); } } GetFaviconBitmapResultsForBestMatch(favicon_ids, desired_size_in_dip, desired_scale_factors, bitmap_results); } void HistoryBackend::SetFaviconBitmaps( FaviconID icon_id, const std::vector& favicon_bitmap_data, bool* favicon_bitmaps_changed) { if (favicon_bitmaps_changed) *favicon_bitmaps_changed = false; std::vector bitmap_id_sizes; thumbnail_db_->GetFaviconBitmapIDSizes(icon_id, &bitmap_id_sizes); std::vector to_add = favicon_bitmap_data; for (size_t i = 0; i < bitmap_id_sizes.size(); ++i) { const gfx::Size& pixel_size = bitmap_id_sizes[i].pixel_size; std::vector::iterator match_it = to_add.end(); for (std::vector::iterator it = to_add.begin(); it != to_add.end(); ++it) { if (it->pixel_size == pixel_size) { match_it = it; break; } } FaviconBitmapID bitmap_id = bitmap_id_sizes[i].bitmap_id; if (match_it == to_add.end()) { thumbnail_db_->DeleteFaviconBitmap(bitmap_id); if (favicon_bitmaps_changed) *favicon_bitmaps_changed = true; } else { if (favicon_bitmaps_changed && !*favicon_bitmaps_changed && IsFaviconBitmapDataEqual(bitmap_id, match_it->bitmap_data)) { thumbnail_db_->SetFaviconBitmapLastUpdateTime( bitmap_id, base::Time::Now()); } else { thumbnail_db_->SetFaviconBitmap(bitmap_id, match_it->bitmap_data, base::Time::Now()); if (favicon_bitmaps_changed) *favicon_bitmaps_changed = true; } to_add.erase(match_it); } } for (size_t i = 0; i < to_add.size(); ++i) { thumbnail_db_->AddFaviconBitmap(icon_id, to_add[i].bitmap_data, base::Time::Now(), to_add[i].pixel_size); if (favicon_bitmaps_changed) *favicon_bitmaps_changed = true; } } bool HistoryBackend::ValidateSetFaviconsParams( const std::vector& favicon_bitmap_data) const { typedef std::map BitmapsPerIconURL; BitmapsPerIconURL num_bitmaps_per_icon_url; for (size_t i = 0; i < favicon_bitmap_data.size(); ++i) { if (!favicon_bitmap_data[i].bitmap_data.get()) return false; const GURL& icon_url = favicon_bitmap_data[i].icon_url; if (!num_bitmaps_per_icon_url.count(icon_url)) num_bitmaps_per_icon_url[icon_url] = 1u; else ++num_bitmaps_per_icon_url[icon_url]; } if (num_bitmaps_per_icon_url.size() > kMaxFaviconsPerPage) return false; for (BitmapsPerIconURL::const_iterator it = num_bitmaps_per_icon_url.begin(); it != num_bitmaps_per_icon_url.end(); ++it) { if (it->second > kMaxFaviconBitmapsPerIconURL) return false; } return true; } bool HistoryBackend::IsFaviconBitmapDataEqual( FaviconBitmapID bitmap_id, const scoped_refptr& new_bitmap_data) { if (!new_bitmap_data.get()) return false; scoped_refptr original_bitmap_data; thumbnail_db_->GetFaviconBitmap(bitmap_id, NULL, &original_bitmap_data, NULL); return new_bitmap_data->Equals(original_bitmap_data); } bool HistoryBackend::GetFaviconsFromDB( const GURL& page_url, int icon_types, int desired_size_in_dip, const std::vector& desired_scale_factors, std::vector* favicon_bitmap_results) { DCHECK(favicon_bitmap_results); favicon_bitmap_results->clear(); if (!db_.get() || !thumbnail_db_.get()) return false; // Time the query. TimeTicks beginning_time = TimeTicks::Now(); // Get FaviconIDs for |page_url| and one of |icon_types|. std::vector icon_mappings; thumbnail_db_->GetIconMappingsForPageURL(page_url, icon_types, &icon_mappings); std::vector favicon_ids; for (size_t i = 0; i < icon_mappings.size(); ++i) favicon_ids.push_back(icon_mappings[i].icon_id); // Populate |favicon_bitmap_results| and |icon_url_sizes|. bool success = GetFaviconBitmapResultsForBestMatch(favicon_ids, desired_size_in_dip, desired_scale_factors, favicon_bitmap_results); UMA_HISTOGRAM_TIMES("History.GetFavIconFromDB", // historical name TimeTicks::Now() - beginning_time); return success && !favicon_bitmap_results->empty(); } bool HistoryBackend::GetFaviconBitmapResultsForBestMatch( const std::vector& candidate_favicon_ids, int desired_size_in_dip, const std::vector& desired_scale_factors, std::vector* favicon_bitmap_results) { favicon_bitmap_results->clear(); if (candidate_favicon_ids.empty()) return true; // Find the FaviconID and the FaviconBitmapIDs which best match // |desired_size_in_dip| and |desired_scale_factors|. // TODO(pkotwicz): Select bitmap results from multiple favicons once // content::FaviconStatus supports multiple icon URLs. FaviconID best_favicon_id = 0; std::vector best_bitmap_ids; float highest_score = kSelectFaviconFramesInvalidScore; for (size_t i = 0; i < candidate_favicon_ids.size(); ++i) { std::vector bitmap_id_sizes; thumbnail_db_->GetFaviconBitmapIDSizes(candidate_favicon_ids[i], &bitmap_id_sizes); // Build vector of gfx::Size from |bitmap_id_sizes|. std::vector sizes; for (size_t j = 0; j < bitmap_id_sizes.size(); ++j) sizes.push_back(bitmap_id_sizes[j].pixel_size); std::vector candidate_bitmap_indices; float score = 0; SelectFaviconFrameIndices(sizes, desired_scale_factors, desired_size_in_dip, &candidate_bitmap_indices, &score); if (score > highest_score) { highest_score = score; best_favicon_id = candidate_favicon_ids[i], best_bitmap_ids.clear(); for (size_t j = 0; j < candidate_bitmap_indices.size(); ++j) { size_t candidate_index = candidate_bitmap_indices[j]; best_bitmap_ids.push_back( bitmap_id_sizes[candidate_index].bitmap_id); } } } // Construct FaviconBitmapResults from |best_favicon_id| and // |best_bitmap_ids|. GURL icon_url; IconType icon_type; if (!thumbnail_db_->GetFaviconHeader(best_favicon_id, &icon_url, &icon_type, NULL)) { return false; } for (size_t i = 0; i < best_bitmap_ids.size(); ++i) { base::Time last_updated; FaviconBitmapResult bitmap_result; bitmap_result.icon_url = icon_url; bitmap_result.icon_type = icon_type; if (!thumbnail_db_->GetFaviconBitmap(best_bitmap_ids[i], &last_updated, &bitmap_result.bitmap_data, &bitmap_result.pixel_size)) { return false; } bitmap_result.expired = (Time::Now() - last_updated) > TimeDelta::FromDays(kFaviconRefetchDays); if (bitmap_result.is_valid()) favicon_bitmap_results->push_back(bitmap_result); } return true; } bool HistoryBackend::SetFaviconMappingsForPageAndRedirects( const GURL& page_url, IconType icon_type, const std::vector& icon_ids) { if (!thumbnail_db_.get()) return false; // Find all the pages whose favicons we should set, we want to set it for // all the pages in the redirect chain if it redirected. history::RedirectList redirects; GetCachedRecentRedirects(page_url, &redirects); bool mappings_changed = false; // Save page <-> favicon associations. for (history::RedirectList::const_iterator i(redirects.begin()); i != redirects.end(); ++i) { mappings_changed |= SetFaviconMappingsForPage(*i, icon_type, icon_ids); } return mappings_changed; } bool HistoryBackend::SetFaviconMappingsForPage( const GURL& page_url, IconType icon_type, const std::vector& icon_ids) { DCHECK_LE(icon_ids.size(), kMaxFaviconsPerPage); bool mappings_changed = false; // Two icon types are considered 'equivalent' if one of the icon types is // TOUCH_ICON and the other is TOUCH_PRECOMPOSED_ICON. // // Sets the icon mappings from |page_url| for |icon_type| to the favicons // with |icon_ids|. Mappings for |page_url| to favicons of type |icon_type| // whose FaviconID is not in |icon_ids| are removed. All icon mappings for // |page_url| to favicons of a type equivalent to |icon_type| are removed. // Remove any favicons which are orphaned as a result of the removal of the // icon mappings. std::vector unmapped_icon_ids = icon_ids; std::vector icon_mappings; thumbnail_db_->GetIconMappingsForPageURL(page_url, &icon_mappings); for (std::vector::iterator m = icon_mappings.begin(); m != icon_mappings.end(); ++m) { std::vector::iterator icon_id_it = std::find( unmapped_icon_ids.begin(), unmapped_icon_ids.end(), m->icon_id); // If the icon mapping already exists, avoid removing it and adding it back. if (icon_id_it != unmapped_icon_ids.end()) { unmapped_icon_ids.erase(icon_id_it); continue; } if ((icon_type == TOUCH_ICON && m->icon_type == TOUCH_PRECOMPOSED_ICON) || (icon_type == TOUCH_PRECOMPOSED_ICON && m->icon_type == TOUCH_ICON) || (icon_type == m->icon_type)) { thumbnail_db_->DeleteIconMapping(m->mapping_id); // Removing the icon mapping may have orphaned the associated favicon so // we must recheck it. This is not super fast, but this case will get // triggered rarely, since normally a page will always map to the same // favicon IDs. It will mostly happen for favicons we import. if (!thumbnail_db_->HasMappingFor(m->icon_id)) thumbnail_db_->DeleteFavicon(m->icon_id); mappings_changed = true; } } for (size_t i = 0; i < unmapped_icon_ids.size(); ++i) { thumbnail_db_->AddIconMapping(page_url, unmapped_icon_ids[i]); mappings_changed = true; } return mappings_changed; } void HistoryBackend::GetCachedRecentRedirects( const GURL& page_url, history::RedirectList* redirect_list) { RedirectCache::iterator iter = recent_redirects_.Get(page_url); if (iter != recent_redirects_.end()) { *redirect_list = iter->second; // The redirect chain should have the destination URL as the last item. DCHECK(!redirect_list->empty()); DCHECK(redirect_list->back() == page_url); } else { // No known redirects, construct mock redirect chain containing |page_url|. redirect_list->push_back(page_url); } } void HistoryBackend::SendFaviconChangedNotificationForPageAndRedirects( const GURL& page_url) { history::RedirectList redirect_list; GetCachedRecentRedirects(page_url, &redirect_list); FaviconChangeDetails* changed_details = new FaviconChangeDetails; for (size_t i = 0; i < redirect_list.size(); ++i) changed_details->urls.insert(redirect_list[i]); BroadcastNotifications(chrome::NOTIFICATION_FAVICON_CHANGED, changed_details); } void HistoryBackend::Commit() { if (!db_.get()) return; // Note that a commit may not actually have been scheduled if a caller // explicitly calls this instead of using ScheduleCommit. Likewise, we // may reset the flag written by a pending commit. But this is OK! It // will merely cause extra commits (which is kind of the idea). We // could optimize more for this case (we may get two extra commits in // some cases) but it hasn't been important yet. CancelScheduledCommit(); db_->CommitTransaction(); DCHECK(db_->transaction_nesting() == 0) << "Somebody left a transaction open"; db_->BeginTransaction(); if (thumbnail_db_.get()) { thumbnail_db_->CommitTransaction(); DCHECK(thumbnail_db_->transaction_nesting() == 0) << "Somebody left a transaction open"; thumbnail_db_->BeginTransaction(); } if (archived_db_.get()) { archived_db_->CommitTransaction(); archived_db_->BeginTransaction(); } if (text_database_.get()) { text_database_->CommitTransaction(); text_database_->BeginTransaction(); } } void HistoryBackend::ScheduleCommit() { if (scheduled_commit_.get()) return; scheduled_commit_ = new CommitLaterTask(this); MessageLoop::current()->PostDelayedTask( FROM_HERE, base::Bind(&CommitLaterTask::RunCommit, scheduled_commit_.get()), base::TimeDelta::FromSeconds(kCommitIntervalSeconds)); } void HistoryBackend::CancelScheduledCommit() { if (scheduled_commit_) { scheduled_commit_->Cancel(); scheduled_commit_ = NULL; } } void HistoryBackend::ProcessDBTaskImpl() { if (!db_.get()) { // db went away, release all the refs. ReleaseDBTasks(); return; } // Remove any canceled tasks. while (!db_task_requests_.empty() && db_task_requests_.front()->canceled()) { db_task_requests_.front()->Release(); db_task_requests_.pop_front(); } if (db_task_requests_.empty()) return; // Run the first task. HistoryDBTaskRequest* request = db_task_requests_.front(); db_task_requests_.pop_front(); if (request->value->RunOnDBThread(this, db_.get())) { // The task is done. Notify the callback. request->ForwardResult(); // We AddRef'd the request before adding, need to release it now. request->Release(); } else { // Tasks wants to run some more. Schedule it at the end of current tasks. db_task_requests_.push_back(request); // And process it after an invoke later. MessageLoop::current()->PostTask( FROM_HERE, base::Bind(&HistoryBackend::ProcessDBTaskImpl, this)); } } void HistoryBackend::ReleaseDBTasks() { for (std::list::iterator i = db_task_requests_.begin(); i != db_task_requests_.end(); ++i) { (*i)->Release(); } db_task_requests_.clear(); } //////////////////////////////////////////////////////////////////////////////// // // Generic operations // //////////////////////////////////////////////////////////////////////////////// void HistoryBackend::DeleteURLs(const std::vector& urls) { expirer_.DeleteURLs(urls); db_->GetStartDate(&first_recorded_time_); // Force a commit, if the user is deleting something for privacy reasons, we // want to get it on disk ASAP. Commit(); } void HistoryBackend::DeleteURL(const GURL& url) { expirer_.DeleteURL(url); db_->GetStartDate(&first_recorded_time_); // Force a commit, if the user is deleting something for privacy reasons, we // want to get it on disk ASAP. Commit(); } void HistoryBackend::ExpireHistoryBetween( const std::set& restrict_urls, Time begin_time, Time end_time) { if (db_.get()) { if (begin_time.is_null() && end_time.is_null() && restrict_urls.empty()) { // Special case deleting all history so it can be faster and to reduce the // possibility of an information leak. DeleteAllHistory(); } else { // Clearing parts of history, have the expirer do the depend expirer_.ExpireHistoryBetween(restrict_urls, begin_time, end_time); // Force a commit, if the user is deleting something for privacy reasons, // we want to get it on disk ASAP. Commit(); } } if (begin_time <= first_recorded_time_) db_->GetStartDate(&first_recorded_time_); } void HistoryBackend::ExpireHistoryForTimes( const std::vector& times) { // Put the times in reverse chronological order and remove // duplicates (for expirer_.ExpireHistoryForTimes()). std::vector sorted_times = times; std::sort(sorted_times.begin(), sorted_times.end(), std::greater()); sorted_times.erase( std::unique(sorted_times.begin(), sorted_times.end()), sorted_times.end()); if (sorted_times.empty()) return; if (db_.get()) { expirer_.ExpireHistoryForTimes(sorted_times); // Force a commit, if the user is deleting something for privacy reasons, // we want to get it on disk ASAP. Commit(); } // Update the first recorded time if we've expired it. if (std::binary_search(sorted_times.begin(), sorted_times.end(), first_recorded_time_, std::greater())) db_->GetStartDate(&first_recorded_time_); } void HistoryBackend::URLsNoLongerBookmarked(const std::set& urls) { if (!db_.get()) return; for (std::set::const_iterator i = urls.begin(); i != urls.end(); ++i) { URLRow url_row; if (!db_->GetRowForURL(*i, &url_row)) continue; // The URL isn't in the db; nothing to do. VisitVector visits; db_->GetVisitsForURL(url_row.id(), &visits); if (visits.empty()) expirer_.DeleteURL(*i); // There are no more visits; nuke the URL. } } void HistoryBackend::KillHistoryDatabase() { if (!db_.get()) return; // Rollback transaction because Raze() cannot be called from within a // transaction. db_->RollbackTransaction(); bool success = db_->Raze(); UMA_HISTOGRAM_BOOLEAN("History.KillHistoryDatabaseResult", success); #if defined(OS_ANDROID) // Release AndroidProviderBackend before other objects. android_provider_backend_.reset(); #endif // The expirer keeps tabs on the active databases. Tell it about the // databases which will be closed. expirer_.SetDatabases(NULL, NULL, NULL, NULL); // Reopen a new transaction for |db_| for the sake of CloseAllDatabases(). db_->BeginTransaction(); CloseAllDatabases(); } void HistoryBackend::ProcessDBTask( scoped_refptr request) { DCHECK(request.get()); if (request->canceled()) return; bool task_scheduled = !db_task_requests_.empty(); // Make sure we up the refcount of the request. ProcessDBTaskImpl will // release when done with the task. request->AddRef(); db_task_requests_.push_back(request.get()); if (!task_scheduled) { // No other tasks are scheduled. Process request now. ProcessDBTaskImpl(); } } void HistoryBackend::BroadcastNotifications( int type, HistoryDetails* details_deleted) { // |delegate_| may be NULL if |this| is in the process of closing (closed by // HistoryService -> HistroyBackend::Closing(). if (delegate_.get()) delegate_->BroadcastNotifications(type, details_deleted); else delete details_deleted; } // Deleting -------------------------------------------------------------------- void HistoryBackend::DeleteAllHistory() { // Our approach to deleting all history is: // 1. Copy the bookmarks and their dependencies to new tables with temporary // names. // 2. Delete the original tables. Since tables can not share pages, we know // that any data we don't want to keep is now in an unused page. // 3. Renaming the temporary tables to match the original. // 4. Vacuuming the database to delete the unused pages. // // Since we are likely to have very few bookmarks and their dependencies // compared to all history, this is also much faster than just deleting from // the original tables directly. // Get the bookmarked URLs. std::vector starred_urls; BookmarkService* bookmark_service = GetBookmarkService(); if (bookmark_service) bookmark_service_->GetBookmarks(&starred_urls); URLRows kept_urls; for (size_t i = 0; i < starred_urls.size(); i++) { URLRow row; if (!db_->GetRowForURL(starred_urls[i].url, &row)) continue; // Clear the last visit time so when we write these rows they are "clean." row.set_last_visit(Time()); row.set_visit_count(0); row.set_typed_count(0); kept_urls.push_back(row); } // Clear thumbnail and favicon history. The favicons for the given URLs will // be kept. if (!ClearAllThumbnailHistory(&kept_urls)) { LOG(ERROR) << "Thumbnail history could not be cleared"; // We continue in this error case. If the user wants to delete their // history, we should delete as much as we can. } // ClearAllMainHistory will change the IDs of the URLs in kept_urls. Therfore, // we clear the list afterwards to make sure nobody uses this invalid data. if (!ClearAllMainHistory(kept_urls)) LOG(ERROR) << "Main history could not be cleared"; kept_urls.clear(); // Delete FTS files & archived history. if (text_database_.get()) { // We assume that the text database has one transaction on them that we need // to close & restart (the long-running history transaction). text_database_->CommitTransaction(); text_database_->DeleteAll(); text_database_->BeginTransaction(); } if (archived_db_.get()) { // Close the database and delete the file. archived_db_.reset(); FilePath archived_file_name = GetArchivedFileName(); file_util::Delete(archived_file_name, false); // Now re-initialize the database (which may fail). archived_db_.reset(new ArchivedDatabase()); if (!archived_db_->Init(archived_file_name)) { LOG(WARNING) << "Could not initialize the archived database."; archived_db_.reset(); } else { // Open our long-running transaction on this database. archived_db_->BeginTransaction(); } } db_->GetStartDate(&first_recorded_time_); // Send out the notfication that history is cleared. The in-memory datdabase // will pick this up and clear itself. URLsDeletedDetails* details = new URLsDeletedDetails; details->all_history = true; BroadcastNotifications(chrome::NOTIFICATION_HISTORY_URLS_DELETED, details); } bool HistoryBackend::ClearAllThumbnailHistory(URLRows* kept_urls) { if (!thumbnail_db_.get()) { // When we have no reference to the thumbnail database, maybe there was an // error opening it. In this case, we just try to blow it away to try to // fix the error if it exists. This may fail, in which case either the // file doesn't exist or there's no more we can do. file_util::Delete(GetThumbnailFileName(), false); return true; } // Create duplicate icon_mapping, favicon, and favicon_bitmaps tables, this // is where the favicons we want to keep will be stored. if (!thumbnail_db_->InitTemporaryTables()) return false; // This maps existing favicon IDs to the ones in the temporary table. typedef std::map FaviconMap; FaviconMap copied_favicons; // Copy all unique favicons to the temporary table, and update all the // URLs to have the new IDs. for (URLRows::iterator i = kept_urls->begin(); i != kept_urls->end(); ++i) { std::vector icon_mappings; if (!thumbnail_db_->GetIconMappingsForPageURL(i->url(), &icon_mappings)) continue; for (std::vector::iterator m = icon_mappings.begin(); m != icon_mappings.end(); ++m) { FaviconID old_id = m->icon_id; FaviconID new_id; FaviconMap::const_iterator found = copied_favicons.find(old_id); if (found == copied_favicons.end()) { new_id = thumbnail_db_->CopyFaviconAndFaviconBitmapsToTemporaryTables( old_id); copied_favicons[old_id] = new_id; } else { // We already encountered a URL that used this favicon, use the ID we // previously got. new_id = found->second; } // Add Icon mapping, and we don't care wheteher it suceeded or not. thumbnail_db_->AddToTemporaryIconMappingTable(i->url(), new_id); } } #if defined(OS_ANDROID) // TODO (michaelbai): Add the unit test once AndroidProviderBackend is // avaliable in HistoryBackend. db_->ClearAndroidURLRows(); #endif // Drop original favicon_bitmaps, favicons, and icon mapping tables and // replace them with the duplicate tables. Recreate the other tables. This // will make the database consistent again. thumbnail_db_->CommitTemporaryTables(); thumbnail_db_->RecreateThumbnailTable(); // Vacuum to remove all the pages associated with the dropped tables. There // must be no transaction open on the table when we do this. We assume that // our long-running transaction is open, so we complete it and start it again. DCHECK(thumbnail_db_->transaction_nesting() == 1); thumbnail_db_->CommitTransaction(); thumbnail_db_->Vacuum(); thumbnail_db_->BeginTransaction(); return true; } bool HistoryBackend::ClearAllMainHistory(const URLRows& kept_urls) { // Create the duplicate URL table. We will copy the kept URLs into this. if (!db_->CreateTemporaryURLTable()) return false; // Insert the URLs into the temporary table, we need to keep a map of changed // IDs since the ID will be different in the new table. typedef std::map URLIDMap; URLIDMap old_to_new; // Maps original ID to new one. for (URLRows::const_iterator i = kept_urls.begin(); i != kept_urls.end(); ++i) { URLID new_id = db_->AddTemporaryURL(*i); old_to_new[i->id()] = new_id; } // Replace the original URL table with the temporary one. if (!db_->CommitTemporaryURLTable()) return false; // Delete the old tables and recreate them empty. db_->RecreateAllTablesButURL(); // Vacuum to reclaim the space from the dropped tables. This must be done // when there is no transaction open, and we assume that our long-running // transaction is currently open. db_->CommitTransaction(); db_->Vacuum(); db_->BeginTransaction(); db_->GetStartDate(&first_recorded_time_); return true; } BookmarkService* HistoryBackend::GetBookmarkService() { if (bookmark_service_) bookmark_service_->BlockTillLoaded(); return bookmark_service_; } void HistoryBackend::NotifyVisitObservers(const VisitRow& visit) { BriefVisitInfo info; info.url_id = visit.url_id; info.time = visit.visit_time; info.transition = visit.transition; // If we don't have a delegate yet during setup or shutdown, we will drop // these notifications. if (delegate_.get()) delegate_->NotifyVisitDBObserversOnAddVisit(info); } } // namespace history