Annotation of pandia/base.sql, revision 1.3
-- url_domains: single-column table of domain names; the domain string itself
-- is the primary key, so each domain can appear at most once.
-- NOTE: the DROP makes this script re-runnable but destroys any existing rows.
DROP TABLE IF EXISTS url_domains;

CREATE TABLE url_domains (
    url_domain VARCHAR(255) NOT NULL PRIMARY KEY
)
ENGINE = InnoDB
DEFAULT CHARSET = utf8;
6:
-- crawl_queue: one row per URL, keyed by the URL itself.
-- NOTE: the DROP makes this script re-runnable but destroys any existing rows.
DROP TABLE IF EXISTS crawl_queue;

CREATE TABLE crawl_queue (
    url        VARCHAR(255) NOT NULL,
    -- Nullable; presumably the page on which this URL was found -- confirm
    -- against the crawler code.
    parent_url VARCHAR(255),
    url_domain VARCHAR(255) NOT NULL,
    -- String literals are single-quoted: with the ANSI_QUOTES sql_mode enabled,
    -- a double-quoted token is parsed as an identifier, not as a string.
    scheme     VARCHAR(40)  NOT NULL DEFAULT 'http',
    -- Defaults to 0; presumably a 0/1 "already processed" flag -- confirm.
    analyzed   TINYINT      NOT NULL DEFAULT 0,
    -- Filled in automatically with the insertion time when not supplied.
    create_ts  TIMESTAMP    NOT NULL DEFAULT CURRENT_TIMESTAMP,
    PRIMARY KEY (url)
)
ENGINE = InnoDB
DEFAULT CHARSET = utf8;
17:
-- blacklist: single-column table of domain names, keyed by the domain string.
-- Presumably these are domains the crawler must skip -- confirm against the
-- crawler code.
-- NOTE: the DROP makes this script re-runnable but destroys any existing rows.
DROP TABLE IF EXISTS blacklist;

CREATE TABLE blacklist (
    url_domain VARCHAR(255) NOT NULL PRIMARY KEY
)
ENGINE = InnoDB
DEFAULT CHARSET = utf8;
23:
-- keywords: rows of (word, url, url_domain, word_count) under a surrogate
-- auto-increment key. Nothing here enforces uniqueness of (word, url).
-- NOTE: the DROP makes this script re-runnable but destroys any existing rows.
DROP TABLE IF EXISTS keywords;

CREATE TABLE keywords (
    -- Integer display widths such as BIGINT(20) are deprecated in current
    -- MySQL releases and never affected storage or range, so none is given.
    id         BIGINT UNSIGNED   NOT NULL AUTO_INCREMENT,
    word       VARCHAR(255)      NOT NULL,
    url        VARCHAR(255)      NOT NULL,
    url_domain VARCHAR(255)      NOT NULL,
    -- SMALLINT UNSIGNED tops out at 65535.
    word_count SMALLINT UNSIGNED NOT NULL,
    PRIMARY KEY (id)
)
ENGINE = InnoDB
DEFAULT CHARSET = utf8;
33:
-- url_fulltext: one row per URL holding the page body and an optional title.
-- NOTE: the DROP makes this script re-runnable but destroys any existing rows.
DROP TABLE IF EXISTS url_fulltext;

CREATE TABLE url_fulltext (
    url        VARCHAR(255) NOT NULL PRIMARY KEY,
    body       MEDIUMTEXT   NOT NULL,
    -- Nullable: a row may be stored without a title.
    page_title TEXT
)
ENGINE = InnoDB
DEFAULT CHARSET = utf8;
41:
-- Secondary (non-unique) indexes on keywords, one per lookup column:
-- word, url and url_domain.
CREATE INDEX idx_keyword_search_word
    ON keywords (word);

CREATE INDEX idx_keyword_search_url
    ON keywords (url);

CREATE INDEX idx_keyword_search_domain
    ON keywords (url_domain);
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>