summaryrefslogtreecommitdiffstats
path: root/third_party/rust/suggest/src/schema.rs
blob: b304363de5007470c0328e0ecadb3853960420ec (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
/* This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
 */

use rusqlite::{Connection, Transaction};
use sql_support::open_database::{self, ConnectionInitializer};

/// The current database schema version.
///
/// This value is also exposed to the database opening machinery as
/// `END_VERSION` of [`SuggestConnectionInitializer`].
///
/// For any changes to the schema [`SQL`], please make sure to:
///
///  1. Bump this version.
///  2. Add a migration from the old version to the new version in
///     [`SuggestConnectionInitializer::upgrade_from`]. If suggestions should
///     be re-ingested after the migration, call [`clear_database`] inside
///     the migration.
pub const VERSION: u32 = 18;

/// The current Suggest database schema.
///
/// [`SuggestConnectionInitializer::init`] executes this whole string as one
/// batch, so everything inside the literal (including the `--` comments) is
/// part of the SQL text that gets run.
///
/// Several tables reference `suggestions(id)` with `ON DELETE CASCADE`, so
/// deleting a suggestion also removes its dependent rows when foreign key
/// enforcement is enabled on the connection.
pub const SQL: &str = "
    CREATE TABLE meta(
        key TEXT PRIMARY KEY,
        value NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE keywords(
        keyword TEXT NOT NULL,
        suggestion_id INTEGER NOT NULL REFERENCES suggestions(id) ON DELETE CASCADE,
        full_keyword_id INTEGER NULL REFERENCES full_keywords(id) ON DELETE SET NULL,
        rank INTEGER NOT NULL,
        PRIMARY KEY (keyword, suggestion_id)
    ) WITHOUT ROWID;

    -- full keywords are what we display to the user when a (partial) keyword matches
    -- The FK to suggestion_id makes it so full keywords get deleted when the parent suggestion is deleted.
    CREATE TABLE full_keywords(
        id INTEGER PRIMARY KEY,
        suggestion_id INTEGER NOT NULL REFERENCES suggestions(id) ON DELETE CASCADE,
        full_keyword TEXT NOT NULL
    );

    CREATE TABLE prefix_keywords(
        keyword_prefix TEXT NOT NULL,
        keyword_suffix TEXT NOT NULL DEFAULT '',
        confidence INTEGER NOT NULL DEFAULT 0,
        rank INTEGER NOT NULL,
        suggestion_id INTEGER NOT NULL REFERENCES suggestions(id) ON DELETE CASCADE,
        PRIMARY KEY (keyword_prefix, keyword_suffix, suggestion_id)
    ) WITHOUT ROWID;

    CREATE UNIQUE INDEX keywords_suggestion_id_rank ON keywords(suggestion_id, rank);

    CREATE TABLE suggestions(
        id INTEGER PRIMARY KEY,
        record_id TEXT NOT NULL,
        provider INTEGER NOT NULL,
        title TEXT NOT NULL,
        url TEXT NOT NULL,
        score REAL NOT NULL
    );

    CREATE TABLE amp_custom_details(
        suggestion_id INTEGER PRIMARY KEY,
        advertiser TEXT NOT NULL,
        block_id INTEGER NOT NULL,
        iab_category TEXT NOT NULL,
        impression_url TEXT NOT NULL,
        click_url TEXT NOT NULL,
        icon_id TEXT NOT NULL,
        FOREIGN KEY(suggestion_id) REFERENCES suggestions(id) ON DELETE CASCADE
    );

    CREATE TABLE wikipedia_custom_details(
        suggestion_id INTEGER PRIMARY KEY REFERENCES suggestions(id) ON DELETE CASCADE,
        icon_id TEXT NOT NULL
    );

    CREATE TABLE amo_custom_details(
        suggestion_id INTEGER PRIMARY KEY,
        description TEXT NOT NULL,
        guid TEXT NOT NULL,
        icon_url TEXT NOT NULL,
        rating TEXT,
        number_of_ratings INTEGER NOT NULL,
        FOREIGN KEY(suggestion_id) REFERENCES suggestions(id) ON DELETE CASCADE
    );

    CREATE INDEX suggestions_record_id ON suggestions(record_id);

    CREATE TABLE icons(
        id TEXT PRIMARY KEY,
        data BLOB NOT NULL,
        mimetype TEXT NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE yelp_subjects(
        keyword TEXT PRIMARY KEY,
        record_id TEXT NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE yelp_modifiers(
        type INTEGER NOT NULL,
        keyword TEXT NOT NULL,
        record_id TEXT NOT NULL,
        PRIMARY KEY (type, keyword)
    ) WITHOUT ROWID;

    CREATE TABLE yelp_location_signs(
        keyword TEXT PRIMARY KEY,
        need_location INTEGER NOT NULL,
        record_id TEXT NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE yelp_custom_details(
        icon_id TEXT PRIMARY KEY,
        score REAL NOT NULL,
        record_id TEXT NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE mdn_custom_details(
        suggestion_id INTEGER PRIMARY KEY,
        description TEXT NOT NULL,
        FOREIGN KEY(suggestion_id) REFERENCES suggestions(id) ON DELETE CASCADE
    );

    CREATE TABLE dismissed_suggestions (
        url TEXT PRIMARY KEY
    ) WITHOUT ROWID;
";

/// Initializes an SQLite connection to the Suggest database, performing
/// migrations as needed.
///
/// This is a stateless unit type; all of its behavior lives in the
/// [`ConnectionInitializer`] implementation below.
pub struct SuggestConnectionInitializer;

impl ConnectionInitializer for SuggestConnectionInitializer {
    const NAME: &'static str = "suggest db";
    const END_VERSION: u32 = VERSION;

    /// Applies the connection-level pragmas (in-memory temp store, WAL
    /// journaling, foreign key enforcement) and registers the `sql_support`
    /// debug functions on `conn`.
    ///
    /// # Errors
    ///
    /// Returns an error if running the pragmas or defining the debug
    /// functions fails.
    fn prepare(&self, conn: &Connection, _db_empty: bool) -> open_database::Result<()> {
        let initial_pragmas = "
            -- Use in-memory storage for TEMP tables.
            PRAGMA temp_store = 2;

            PRAGMA journal_mode = WAL;
            PRAGMA foreign_keys = ON;
        ";
        conn.execute_batch(initial_pragmas)?;
        sql_support::debug_tools::define_debug_functions(conn)?;

        Ok(())
    }

    /// Creates the current schema by executing [`SQL`] as a batch on `db`.
    ///
    /// # Errors
    ///
    /// Returns an error if any statement in [`SQL`] fails.
    fn init(&self, db: &Transaction<'_>) -> open_database::Result<()> {
        Ok(db.execute_batch(SQL)?)
    }

    /// Runs the migration step for a database currently at schema `version`.
    ///
    /// # Errors
    ///
    /// * `Error::Corrupt` for versions 1 through 15, which have no migration.
    /// * `Error::IncompatibleVersion` for any version without a matching arm.
    /// * Any SQLite error raised while executing a migration.
    fn upgrade_from(&self, tx: &Transaction<'_>, version: u32) -> open_database::Result<()> {
        match version {
            1..=15 => {
                // Treat databases with these older schema versions as corrupt,
                // so that they'll be replaced by a fresh, empty database with
                // the current schema.
                Err(open_database::Error::Corrupt)
            }
            16 => {
                tx.execute_batch(
                    "
                    CREATE TABLE dismissed_suggestions (
                        url_hash INTEGER PRIMARY KEY
                    ) WITHOUT ROWID;",
                )?;
                Ok(())
            }
            17 => {
                // This step contains two statements, so it must go through
                // `execute_batch`: `execute` prepares and runs only a single
                // statement, which would drop the table without re-creating
                // it (or fail outright when rusqlite checks for trailing SQL).
                //
                // NOTE(review): databases that already ran this step in its
                // earlier single-statement form may be at version 18 without a
                // `dismissed_suggestions` table; repairing those would need a
                // version bump plus a follow-up migration — confirm whether
                // that is required.
                tx.execute_batch(
                    "
                    DROP TABLE dismissed_suggestions;
                    CREATE TABLE dismissed_suggestions (
                        url TEXT PRIMARY KEY
                    ) WITHOUT ROWID;",
                )?;
                Ok(())
            }
            _ => Err(open_database::Error::IncompatibleVersion(version)),
        }
    }
}

/// Empties the ingested data: metadata, suggestions, icons and the Yelp tables.
///
/// Tables that reference `suggestions(id)` with `ON DELETE CASCADE` are not
/// listed here; their rows go away with the parent suggestions when foreign
/// key enforcement is enabled on `db`. The `dismissed_suggestions` table is
/// not touched.
///
/// # Errors
///
/// Returns the underlying SQLite error if any of the `DELETE` statements fails.
pub fn clear_database(db: &Connection) -> rusqlite::Result<()> {
    // All deletions are sent to SQLite as one batch.
    let delete_all = "
        DELETE FROM meta;
        DELETE FROM suggestions;
        DELETE FROM icons;
        DELETE FROM yelp_subjects;
        DELETE FROM yelp_modifiers;
        DELETE FROM yelp_location_signs;
        DELETE FROM yelp_custom_details;
        ";
    db.execute_batch(delete_all)
}

#[cfg(test)]
mod test {
    use super::*;
    use sql_support::open_database::test_utils::MigratedDatabaseFile;

    // Snapshot of the v16 schema, ending with `PRAGMA user_version=16` so the
    // database is stamped as version 16. We use this as the starting point to
    // test that we can migrate from there to the current schema.
    //
    // This text is frozen: it must keep describing v16 even when `SQL` changes.
    const V16_SCHEMA: &str = r#"
    CREATE TABLE meta(
        key TEXT PRIMARY KEY,
        value NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE keywords(
        keyword TEXT NOT NULL,
        suggestion_id INTEGER NOT NULL REFERENCES suggestions(id) ON DELETE CASCADE,
        full_keyword_id INTEGER NULL REFERENCES full_keywords(id) ON DELETE SET NULL,
        rank INTEGER NOT NULL,
        PRIMARY KEY (keyword, suggestion_id)
    ) WITHOUT ROWID;

    -- full keywords are what we display to the user when a (partial) keyword matches
    -- The FK to suggestion_id makes it so full keywords get deleted when the parent suggestion is deleted.
    CREATE TABLE full_keywords(
        id INTEGER PRIMARY KEY,
        suggestion_id INTEGER NOT NULL REFERENCES suggestions(id) ON DELETE CASCADE,
        full_keyword TEXT NOT NULL
    );

    CREATE TABLE prefix_keywords(
        keyword_prefix TEXT NOT NULL,
        keyword_suffix TEXT NOT NULL DEFAULT '',
        confidence INTEGER NOT NULL DEFAULT 0,
        rank INTEGER NOT NULL,
        suggestion_id INTEGER NOT NULL REFERENCES suggestions(id) ON DELETE CASCADE,
        PRIMARY KEY (keyword_prefix, keyword_suffix, suggestion_id)
    ) WITHOUT ROWID;

    CREATE UNIQUE INDEX keywords_suggestion_id_rank ON keywords(suggestion_id, rank);

    CREATE TABLE suggestions(
        id INTEGER PRIMARY KEY,
        record_id TEXT NOT NULL,
        provider INTEGER NOT NULL,
        title TEXT NOT NULL,
        url TEXT NOT NULL,
        score REAL NOT NULL
    );

    CREATE TABLE amp_custom_details(
        suggestion_id INTEGER PRIMARY KEY,
        advertiser TEXT NOT NULL,
        block_id INTEGER NOT NULL,
        iab_category TEXT NOT NULL,
        impression_url TEXT NOT NULL,
        click_url TEXT NOT NULL,
        icon_id TEXT NOT NULL,
        FOREIGN KEY(suggestion_id) REFERENCES suggestions(id) ON DELETE CASCADE
    );

    CREATE TABLE wikipedia_custom_details(
        suggestion_id INTEGER PRIMARY KEY REFERENCES suggestions(id) ON DELETE CASCADE,
        icon_id TEXT NOT NULL
    );

    CREATE TABLE amo_custom_details(
        suggestion_id INTEGER PRIMARY KEY,
        description TEXT NOT NULL,
        guid TEXT NOT NULL,
        icon_url TEXT NOT NULL,
        rating TEXT,
        number_of_ratings INTEGER NOT NULL,
        FOREIGN KEY(suggestion_id) REFERENCES suggestions(id) ON DELETE CASCADE
    );

    CREATE INDEX suggestions_record_id ON suggestions(record_id);

    CREATE TABLE icons(
        id TEXT PRIMARY KEY,
        data BLOB NOT NULL,
        mimetype TEXT NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE yelp_subjects(
        keyword TEXT PRIMARY KEY,
        record_id TEXT NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE yelp_modifiers(
        type INTEGER NOT NULL,
        keyword TEXT NOT NULL,
        record_id TEXT NOT NULL,
        PRIMARY KEY (type, keyword)
    ) WITHOUT ROWID;

    CREATE TABLE yelp_location_signs(
        keyword TEXT PRIMARY KEY,
        need_location INTEGER NOT NULL,
        record_id TEXT NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE yelp_custom_details(
        icon_id TEXT PRIMARY KEY,
        score REAL NOT NULL,
        record_id TEXT NOT NULL
    ) WITHOUT ROWID;

    CREATE TABLE mdn_custom_details(
        suggestion_id INTEGER PRIMARY KEY,
        description TEXT NOT NULL,
        FOREIGN KEY(suggestion_id) REFERENCES suggestions(id) ON DELETE CASCADE
    );

    PRAGMA user_version=16;
"#;

    /// Test running all schema upgrades from V16, which was the first schema with a "real"
    /// migration.
    ///
    /// If an upgrade fails, then this test will fail with a panic.
    ///
    /// NOTE(review): nothing here visibly compares the migrated schema against [`SQL`], so a
    /// migration that succeeds but leaves a table missing would presumably still pass — confirm
    /// what `run_all_upgrades` checks.
    #[test]
    fn test_all_upgrades() {
        let db_file = MigratedDatabaseFile::new(SuggestConnectionInitializer, V16_SCHEMA);
        db_file.run_all_upgrades();
    }
}