-- idfwiki_empty.sql
-- MySQL dump 10.11
--
-- Host: localhost Database: idfsimplewiki
-- ------------------------------------------------------
-- Server version 5.0.51-3
-- Session setup. Every statement here is wrapped in a MySQL version-gated
-- comment (/*!NNNNN ... */), so it only runs on servers at or above that
-- version. Each current session value is stashed in an @OLD_* user variable
-- before it is overridden, so it can be put back at the end of the script.
/*!40101 SET @OLD_CHARACTER_SET_CLIENT=@@CHARACTER_SET_CLIENT */;
/*!40101 SET @OLD_CHARACTER_SET_RESULTS=@@CHARACTER_SET_RESULTS */;
/*!40101 SET @OLD_COLLATION_CONNECTION=@@COLLATION_CONNECTION */;
-- Use utf8 for the connection while the script runs.
/*!40101 SET NAMES utf8 */;
/*!40103 SET @OLD_TIME_ZONE=@@TIME_ZONE */;
-- Run the session in UTC.
/*!40103 SET TIME_ZONE='+00:00' */;
-- Save the current values, then switch unique and foreign-key checks off.
/*!40014 SET @OLD_UNIQUE_CHECKS=@@UNIQUE_CHECKS, UNIQUE_CHECKS=0 */;
/*!40014 SET @OLD_FOREIGN_KEY_CHECKS=@@FOREIGN_KEY_CHECKS, FOREIGN_KEY_CHECKS=0 */;
-- NO_AUTO_VALUE_ON_ZERO: an explicit 0 written to an AUTO_INCREMENT column is
-- stored as 0 instead of triggering generation of the next sequence value.
/*!40101 SET @OLD_SQL_MODE=@@SQL_MODE, SQL_MODE='NO_AUTO_VALUE_ON_ZERO' */;
-- Save the current SQL_NOTES value, then set it to 0.
/*!40111 SET @OLD_SQL_NOTES=@@SQL_NOTES, SQL_NOTES=0 */;
--
-- Table structure for table `page`
--
-- (Re)create `page`: one row per wiki article, identified by an
-- auto-increment `page_id`, holding the article title (unique) and the
-- number of words in the article.
DROP TABLE IF EXISTS `page`;
-- Parse the DDL as utf8; the client character set is put back right after.
SET @saved_cs_client = @@character_set_client;
SET character_set_client = utf8;
CREATE TABLE `page` (
  `page_id` int(10) unsigned NOT NULL auto_increment,
  -- The column comment links to the MediaWiki manual page describing the
  -- upstream `page` table this title is copied from.
  `page_title` varchar(255) NOT NULL COMMENT 'copy from MediaWiki page.page_title, see https://www.mediawiki.org/wiki/Manual:Page_table',
  `word_count` int(6) unsigned NOT NULL COMMENT 'number of words in the article',
  PRIMARY KEY (`page_id`),
  -- Titles are unique, so a title resolves to a single page_id.
  UNIQUE KEY `page_title` (`page_title`)
) ENGINE=MyISAM DEFAULT CHARSET=utf8 COMMENT='titles of wiki articles';
SET character_set_client = @saved_cs_client;
--
-- Dumping data for table `page`
--
-- Data section for `page`. No rows are inserted here: the write lock and the
-- DISABLE KEYS / ENABLE KEYS pair simply bracket an empty load.
LOCK TABLES `page` WRITE;
/*!40000 ALTER TABLE `page` DISABLE KEYS */;
/*!40000 ALTER TABLE `page` ENABLE KEYS */;
UNLOCK TABLES;
--
-- Table structure for table `related_page`
--
-- (Re)create `related_page`: at most one row per `page_id` (enforced by the
-- unique key), carrying a blob with the comma separated titles of the pages
-- related to it.
DROP TABLE IF EXISTS `related_page`;

-- Switch the client character set to utf8 for the DDL only.
SET @saved_cs_client = @@character_set_client;
SET character_set_client = utf8;

CREATE TABLE `related_page` (
    `page_id`        INT(10) UNSIGNED NOT NULL,
    `related_titles` MEDIUMBLOB NOT NULL
        COMMENT 'Comma separated list of related pages'' titles',

    UNIQUE KEY `page_id` (`page_id`)
)
    ENGINE = MyISAM
    DEFAULT CHARSET = utf8
    COMMENT = 'List of related pages found by the algorithm';

SET character_set_client = @saved_cs_client;
--
-- Dumping data for table `related_page`
--
-- Data section for `related_page`. No rows are inserted here: the write lock
-- and the DISABLE KEYS / ENABLE KEYS pair simply bracket an empty load.
LOCK TABLES `related_page` WRITE;
/*!40000 ALTER TABLE `related_page` DISABLE KEYS */;
/*!40000 ALTER TABLE `related_page` ENABLE KEYS */;
UNLOCK TABLES;
--
-- Table structure for table `term`
--
-- (Re)create `term`: the dictionary of lemmas found in the wiki texts. Each
-- lemma is unique and carries two counters: the number of documents it
-- appears in and its frequency in the corpus.
DROP TABLE IF EXISTS `term`;

-- Switch the client character set to utf8 for the DDL only.
SET @saved_cs_client = @@character_set_client;
SET character_set_client = utf8;

CREATE TABLE `term` (
    `term_id`     INT(10) UNSIGNED NOT NULL AUTO_INCREMENT,
    `lemma`       VARCHAR(255) NOT NULL
        COMMENT 'the word\'s lemma (term), unique',
    `doc_freq`    INT(11) NOT NULL
        COMMENT 'document\'s frequency, number of documents where the term appears',
    `corpus_freq` INT(11) NOT NULL
        COMMENT 'frequency of the term in the corpus',

    PRIMARY KEY (`term_id`),
    UNIQUE KEY `lemma` (`lemma`)
)
    ENGINE = MyISAM
    DEFAULT CHARSET = utf8
    COMMENT = 'terms found in wiki-texts';

SET character_set_client = @saved_cs_client;
--
-- Dumping data for table `term`
--
-- Data section for `term`. No rows are inserted here: the write lock and the
-- DISABLE KEYS / ENABLE KEYS pair simply bracket an empty load.
LOCK TABLES `term` WRITE;
/*!40000 ALTER TABLE `term` DISABLE KEYS */;
/*!40000 ALTER TABLE `term` ENABLE KEYS */;
UNLOCK TABLES;
--
-- Table structure for table `term_page`
--
-- (Re)create `term_page`: one row per (term_id, page_id) pair, holding how
-- often the term occurs in that document. No foreign keys are declared;
-- term_id / page_id presumably refer to `term`.`term_id` and
-- `page`.`page_id` -- TODO confirm against the loader code.
DROP TABLE IF EXISTS `term_page`;
-- Parse the DDL as utf8; the client character set is put back right after.
SET @saved_cs_client = @@character_set_client;
SET character_set_client = utf8;
CREATE TABLE `term_page` (
  `term_id` int(10) unsigned NOT NULL,
  `page_id` int(10) unsigned NOT NULL,
  `term_freq` int(6) unsigned NOT NULL COMMENT 'term frequency in the document',
  -- A term is recorded at most once per page.
  UNIQUE KEY `term_page_id` (`term_id`,`page_id`),
  -- NOTE(review): `term_id` is the leftmost prefix of `term_page_id`, so this
  -- single-column index looks redundant. It is kept because its name may be
  -- referenced by index hints elsewhere; drop it once that is ruled out.
  KEY `term_id` (`term_id`),
  -- Supports lookups by page, which the composite key cannot serve.
  KEY `page_id` (`page_id`)
-- Default charset is utf8, matching the other tables in this schema. The
-- table has no character columns, so this only affects columns added later.
) ENGINE=MyISAM DEFAULT CHARSET=utf8 COMMENT='pages which contain the term';
SET character_set_client = @saved_cs_client;
--
-- Dumping data for table `term_page`
--
-- Data section for `term_page`. No rows are inserted here: the write lock and
-- the DISABLE KEYS / ENABLE KEYS pair simply bracket an empty load.
LOCK TABLES `term_page` WRITE;
/*!40000 ALTER TABLE `term_page` DISABLE KEYS */;
/*!40000 ALTER TABLE `term_page` ENABLE KEYS */;
UNLOCK TABLES;
-- Session teardown: put back every setting that was saved into an @OLD_*
-- user variable at the top of the script. Each statement is version-gated
-- with the same /*!NNNNN ... */ level as the statement that saved the value.
/*!40103 SET TIME_ZONE=@OLD_TIME_ZONE */;
/*!40101 SET SQL_MODE=@OLD_SQL_MODE */;
/*!40014 SET FOREIGN_KEY_CHECKS=@OLD_FOREIGN_KEY_CHECKS */;
/*!40014 SET UNIQUE_CHECKS=@OLD_UNIQUE_CHECKS */;
/*!40101 SET CHARACTER_SET_CLIENT=@OLD_CHARACTER_SET_CLIENT */;
/*!40101 SET CHARACTER_SET_RESULTS=@OLD_CHARACTER_SET_RESULTS */;
/*!40101 SET COLLATION_CONNECTION=@OLD_COLLATION_CONNECTION */;
/*!40111 SET SQL_NOTES=@OLD_SQL_NOTES */;
-- Dump completed on 2008-02-06 18:01:42