1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
|
// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#ifndef CHROME_BROWSER_HISTORY_URL_DATABASE_H_
#define CHROME_BROWSER_HISTORY_URL_DATABASE_H_
#include "base/basictypes.h"
#include "chrome/browser/history/history_types.h"
#include "chrome/browser/history/query_parser.h"
#include "chrome/browser/search_engines/template_url_id.h"
#include "sql/statement.h"
class GURL;
namespace sql {
class Connection;
}
namespace history {
class VisitDatabase; // For friend statement.
// Encapsulates an SQL database that holds URL info. This is a subset of the
// full history data. We split this class' functionality out from the larger
// HistoryDatabase class to support maintaining separate databases of URLs with
// different capabilities (for example, in-memory, or archived).
//
// This is refcounted to support calling InvokeLater() with some of its methods
// (necessary to maintain ordering of DB operations).
class URLDatabase {
public:
// Must call CreateURLTable() and CreateURLIndexes() before using to make
// sure the database is initialized.
URLDatabase();
// This object must be destroyed on the thread where all accesses are
// happening to avoid thread-safety problems.
virtual ~URLDatabase();
// Converts a GURL to a string used in the history database. We plan to
// do more complex operations than just getting the spec out involving
// punycode, so this function should be used instead of url.spec() when
// interacting with the database.
//
// TODO(brettw) this should be moved out of the public section and the
// entire public HistoryDatabase interface should use GURL. This should
// also probably return a string instead since that is what the DB uses
// internally and we can avoid the extra conversion.
static std::string GURLToDatabaseURL(const GURL& url);
// URL table functions -------------------------------------------------------
// Looks up a url given an id. Fills info with the data. Returns true on
// success and false otherwise.
bool GetURLRow(URLID url_id, URLRow* info);
// Looks up all urls that were typed in manually. Fills info with the data.
// Returns true on success and false otherwise.
bool GetAllTypedUrls(URLRows* urls);
// Looks up the given URL and if it exists, fills the given pointers with the
// associated info and returns the ID of that URL. If the info pointer is
// NULL, no information about the URL will be filled in, only the ID will be
// returned. Returns 0 if the URL was not found.
URLID GetRowForURL(const GURL& url, URLRow* info);
// Given an already-existing row in the URL table, updates that URL's stats.
// This can not change the URL. Returns true on success.
//
// This will NOT update the title used for full text indexing. If you are
// setting the title, call SetPageIndexedData with the new title.
bool UpdateURLRow(URLID url_id, const URLRow& info);
// Adds a line to the URL database with the given information and returns the
// row ID. A row with the given URL must not exist. Returns 0 on error.
//
// This does NOT add a row to the full text search database. Use
// HistoryDatabase::SetPageIndexedData to do this.
URLID AddURL(const URLRow& info) {
return AddURLInternal(info, false);
}
// Delete the row of the corresponding URL. Only the row in the URL table
// will be deleted, not any other data that may refer to it. Returns true if
// the row existed and was deleted.
bool DeleteURLRow(URLID id);
// URL mass-deleting ---------------------------------------------------------
// Begins the mass-deleting operation by creating a temporary URL table.
// The caller than adds the URLs it wants to preseve to the temporary table,
// and then deletes everything else by calling CommitTemporaryURLTable().
// Returns true on success.
bool CreateTemporaryURLTable();
// Adds a row to the temporary URL table. This must be called between
// CreateTemporaryURLTable() and CommitTemporaryURLTable() (see those for more
// info). The ID of the URL will change in the temporary table, so the new ID
// is returned. Returns 0 on failure.
URLID AddTemporaryURL(const URLRow& row) {
return AddURLInternal(row, true);
}
// Ends the mass-deleting by replacing the original URL table with the
// temporary one created in CreateTemporaryURLTable. Returns true on success.
//
// This function does not create the supplimentary indices. It is virtual so
// that the main history database can provide this additional behavior.
virtual bool CommitTemporaryURLTable();
// Enumeration ---------------------------------------------------------------
// A basic enumerator to enumerate urls database.
class URLEnumeratorBase {
public:
URLEnumeratorBase();
virtual ~URLEnumeratorBase();
private:
friend class URLDatabase;
bool initialized_;
sql::Statement statement_;
DISALLOW_COPY_AND_ASSIGN(URLEnumeratorBase);
};
// A basic enumerator to enumerate urls
class URLEnumerator : public URLEnumeratorBase {
public:
URLEnumerator();
// Retreives the next url. Returns false if no more urls are available
bool GetNextURL(history::URLRow* r);
private:
DISALLOW_COPY_AND_ASSIGN(URLEnumerator);
};
// A basic enumerator to enumerate icon mapping, it is only used for icon
// mapping migration.
class IconMappingEnumerator : public URLEnumeratorBase {
public:
IconMappingEnumerator();
// Retreives the next url. Returns false if no more urls are available
bool GetNextIconMapping(IconMapping* r);
private:
DISALLOW_COPY_AND_ASSIGN(IconMappingEnumerator);
};
// Initializes the given enumerator to enumerator all URLs in the database.
bool InitURLEnumeratorForEverything(URLEnumerator* enumerator);
// Initializes the given enumerator to enumerator all URLs in the database
// that are historically significant: ones having been visited within 3 days,
// having their URL manually typed more than once, or having been visited
// more than 3 times.
bool InitURLEnumeratorForSignificant(URLEnumerator* enumerator);
// Favicons ------------------------------------------------------------------
// Autocomplete --------------------------------------------------------------
// Fills the given array with URLs matching the given prefix. They will be
// sorted by typed count, then by visit count, then by visit date (most recent
// first) up to the given maximum number. If |typed_only| is true, only urls
// that have been typed once are returned. For caller convenience, returns
// whether any results were found.
bool AutocompleteForPrefix(const std::string& prefix,
size_t max_results,
bool typed_only,
URLRows* results);
// Returns true if the database holds some past typed navigation to a URL on
// the provided hostname.
bool IsTypedHost(const std::string& host);
// Tries to find the shortest URL beginning with |base| that strictly
// prefixes |url|, and has minimum visit_ and typed_counts as specified.
// If found, fills in |info| and returns true; otherwise returns false,
// leaving |info| unchanged.
// We allow matches of exactly |base| iff |allow_base| is true.
bool FindShortestURLFromBase(const std::string& base,
const std::string& url,
int min_visits,
int min_typed,
bool allow_base,
history::URLRow* info);
// History search ------------------------------------------------------------
// Performs a brute force search over the database to find any URLs or titles
// which match the |query| string. Returns any matches in |results|.
bool GetTextMatches(const string16& query, URLRows* results);
// Keyword Search Terms ------------------------------------------------------
// Sets the search terms for the specified url/keyword pair.
bool SetKeywordSearchTermsForURL(URLID url_id,
TemplateURLID keyword_id,
const string16& term);
// Looks up a keyword search term given a url id. Returns all the search terms
// in |rows|. Returns true on success.
bool GetKeywordSearchTermRow(URLID url_id, KeywordSearchTermRow* row);
// Looks up all keyword search terms given a term, Fills the rows with data.
// Returns true on success and false otherwise.
bool GetKeywordSearchTermRows(const string16& term,
std::vector<KeywordSearchTermRow>* rows);
// Deletes all search terms for the specified keyword that have been added by
// way of SetKeywordSearchTermsForURL.
void DeleteAllSearchTermsForKeyword(TemplateURLID keyword_id);
// Returns up to max_count of the most recent search terms for the specified
// keyword.
void GetMostRecentKeywordSearchTerms(
TemplateURLID keyword_id,
const string16& prefix,
int max_count,
std::vector<KeywordSearchTermVisit>* matches);
// Deletes all searches matching |term|.
bool DeleteKeywordSearchTerm(const string16& term);
// Migration -----------------------------------------------------------------
// Do to a bug we were setting the favicon of about:blank. This forces
// about:blank to have no icon or title. Returns true on success, false if
// the favicon couldn't be updated.
bool MigrateFromVersion11ToVersion12();
// Initializes the given enumerator to enumerator all URL and icon mappings
// in the database. Only used for icon mapping migration.
bool InitIconMappingEnumeratorForEverything(
IconMappingEnumerator* enumerator);
protected:
friend class VisitDatabase;
// See HISTORY_URL_ROW_FIELDS below.
static const char kURLRowFields[];
// The number of fiends in kURLRowFields. If callers need additional
// fields, they can add their 0-based index to this value to get the index of
// fields following kURLRowFields.
static const int kNumURLRowFields;
// Drops the starred_id column from urls, returning true on success. This does
// nothing (and returns true) if the urls doesn't contain the starred_id
// column.
bool DropStarredIDFromURLs();
// Initialization functions. The indexing functions are separate from the
// table creation functions so the in-memory database and the temporary tables
// used when clearing history can populate the table and then create the
// index, which is faster than the reverse.
//
// is_temporary is false when generating the "regular" URLs table. The expirer
// sets this to true to generate the temporary table, which will have a
// different name but the same schema.
bool CreateURLTable(bool is_temporary);
// We have two tiers of indices for the URL table. The main tier is used by
// all URL databases, and is an index over the URL itself.
bool CreateMainURLIndex();
// Ensures the keyword search terms table exists.
bool InitKeywordSearchTermsTable();
// Creates the indices used for keyword search terms.
bool CreateKeywordSearchTermsIndices();
// Deletes the keyword search terms table.
bool DropKeywordSearchTermsTable();
// Inserts the given URL row into the URLs table, using the regular table
// if is_temporary is false, or the temporary URL table if is temporary is
// true. The temporary table may only be used in between
// CreateTemporaryURLTable() and CommitTemporaryURLTable().
URLID AddURLInternal(const URLRow& info, bool is_temporary);
// Convenience to fill a history::URLRow. Must be in sync with the fields in
// kHistoryURLRowFields.
static void FillURLRow(sql::Statement& s, URLRow* i);
// Returns the database for the functions in this interface. The decendent of
// this class implements these functions to return its objects.
virtual sql::Connection& GetDB() = 0;
private:
// True if InitKeywordSearchTermsTable() has been invoked. Not all subclasses
// have keyword search terms.
bool has_keyword_search_terms_;
QueryParser query_parser_;
DISALLOW_COPY_AND_ASSIGN(URLDatabase);
};
// The fields and order expected by FillURLRow(). ID is guaranteed to be first
// so that DISTINCT can be prepended to get distinct URLs.
//
// This is available BOTH as a macro and a static string (kURLRowFields). Use
// the macro if you want to put this in the middle of an otherwise constant
// string, it will save time doing string appends. If you have to build a SQL
// string dynamically anyway, use the constant, it will save space.
#define HISTORY_URL_ROW_FIELDS \
" urls.id, urls.url, urls.title, urls.visit_count, urls.typed_count, " \
"urls.last_visit_time, urls.hidden "
} // namespace history
#endif // CHROME_BROWSER_HISTORY_URL_DATABASE_H_
|