1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397
|
-- BioSQL database schema for SQLite.
--
-- This file is part of BioSQL.
--
-- BioSQL is free software: you can redistribute it and/or modify it
-- under the terms of the GNU Lesser General Public License as
-- published by the Free Software Foundation, either version 3 of the
-- License, or (at your option) any later version.
--
-- BioSQL is distributed in the hope that it will be useful,
-- but WITHOUT ANY WARRANTY; without even the implied warranty of
-- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-- GNU Lesser General Public License for more details.
--
-- You should have received a copy of the GNU Lesser General Public License
-- along with BioSQL. If not, see <http://www.gnu.org/licenses/>.
--
-- ========================================================================
--
-- See MySQL database schema and BioSQL website for table documentation.
-- This contains notes specific to SQLite
--
-- A note about Primary Keys in SQLite
-- SQLite automatically creates a ROWID for each row of a table.
-- Using this ROWID as the primary key is faster than using a
-- user-defined primary key. By declaring a column as an
-- INTEGER PRIMARY KEY, you are actually creating an alias to the
-- ROWID and get the associated speed benefits. The ROWID effectively
-- "autoincrements"; however, it can reuse ROWIDs of deleted rows.
-- To avoid reusing old ROWIDs would require adding the AUTOINCREMENT
-- keyword, which also reduces the performance.
-- ( see http://www.sqlite.org/autoinc.html)
CREATE TABLE biodatabase (
biodatabase_id INTEGER PRIMARY KEY,
name VARCHAR(128) NOT NULL,
authority VARCHAR(128),
description TEXT,
UNIQUE (name)
);
CREATE INDEX db_auth on biodatabase(authority);
CREATE TABLE taxon (
taxon_id INTEGER PRIMARY KEY,
ncbi_taxon_id INT(10),
parent_taxon_id INT(10) ,
node_rank VARCHAR(32),
genetic_code TINYINT ,
mito_genetic_code TINYINT ,
left_value INT(10) ,
right_value INT(10) ,
UNIQUE (ncbi_taxon_id),
UNIQUE (left_value),
UNIQUE (right_value)
);
CREATE INDEX taxparent ON taxon(parent_taxon_id);
CREATE TABLE taxon_name (
taxon_id INTEGER,
name VARCHAR(255) NOT NULL,
name_class VARCHAR(32) NOT NULL,
UNIQUE (taxon_id,name,name_class),
FOREIGN KEY ( taxon_id ) REFERENCES taxon ( taxon_id ) ON DELETE CASCADE
);
CREATE INDEX taxnametaxonid ON taxon_name(taxon_id);
CREATE INDEX taxnamename ON taxon_name(name);
CREATE TABLE ontology (
ontology_id INTEGER PRIMARY KEY,
name VARCHAR(32) NOT NULL,
definition TEXT,
UNIQUE (name)
);
CREATE TABLE term (
term_id INTEGER PRIMARY KEY,
name VARCHAR(255) NOT NULL,
definition TEXT,
identifier VARCHAR(40) ,
is_obsolete CHAR(1),
ontology_id INTEGER,
UNIQUE (identifier),
UNIQUE (name,ontology_id,is_obsolete),
FOREIGN KEY ( ontology_id ) REFERENCES ontology ( ontology_id ) ON DELETE CASCADE
);
CREATE INDEX term_ont ON term(ontology_id);
CREATE TABLE term_synonym (
synonym VARCHAR(255) NOT NULL,
term_id INTEGER,
PRIMARY KEY (term_id,synonym),
FOREIGN KEY ( term_id ) REFERENCES term ( term_id ) ON DELETE CASCADE
);
CREATE TABLE term_dbxref (
term_id INTEGER,
dbxref_id INTEGER,
rank SMALLINT,
PRIMARY KEY (term_id, dbxref_id),
FOREIGN KEY ( dbxref_id ) REFERENCES dbxref ( dbxref_id ) ON DELETE CASCADE,
FOREIGN KEY ( term_id ) REFERENCES term ( term_id ) ON DELETE CASCADE
);
CREATE INDEX trmdbxref_dbxrefid ON term_dbxref(dbxref_id);
CREATE TABLE term_relationship (
term_relationship_id INTEGER PRIMARY KEY,
subject_term_id INTEGER,
predicate_term_id INTEGER,
object_term_id INTEGER,
ontology_id INTEGER,
UNIQUE (subject_term_id,predicate_term_id,object_term_id,ontology_id),
FOREIGN KEY ( subject_term_id ) REFERENCES term ( term_id ) ON DELETE CASCADE ,
FOREIGN KEY ( predicate_term_id ) REFERENCES term ( term_id ) ON DELETE CASCADE ,
FOREIGN KEY ( object_term_id ) REFERENCES term ( term_id ) ON DELETE CASCADE ,
FOREIGN KEY ( ontology_id ) REFERENCES ontology ( ontology_id ) ON DELETE CASCADE
);
CREATE INDEX trmrel_predicateid ON term_relationship(predicate_term_id);
CREATE INDEX trmrel_objectid ON term_relationship(object_term_id);
CREATE INDEX trmrel_ontid ON term_relationship(ontology_id);
CREATE TABLE term_relationship_term (
term_relationship_id INTEGER PRIMARY KEY,
term_id INTEGER,
UNIQUE ( term_id ),
FOREIGN KEY (term_relationship_id) REFERENCES term_relationship(term_relationship_id) ON DELETE CASCADE,
FOREIGN KEY (term_id) REFERENCES term(term_id) ON DELETE CASCADE
);
CREATE TABLE term_path (
term_path_id INTEGER PRIMARY KEY,
subject_term_id INTEGER,
predicate_term_id INTEGER,
object_term_id INTEGER,
ontology_id INTEGER,
distance INT(10) ,
UNIQUE (subject_term_id,predicate_term_id,object_term_id,ontology_id,distance),
FOREIGN KEY ( subject_term_id ) REFERENCES term ( term_id ) ON DELETE CASCADE ,
FOREIGN KEY ( predicate_term_id ) REFERENCES term ( term_id ) ON DELETE CASCADE ,
FOREIGN KEY ( object_term_id ) REFERENCES term ( term_id ) ON DELETE CASCADE ,
FOREIGN KEY ( ontology_id ) REFERENCES ontology ( ontology_id ) ON DELETE CASCADE
);
CREATE INDEX trmpath_predicateid ON term_path(predicate_term_id);
CREATE INDEX trmpath_objectid ON term_path(object_term_id);
CREATE INDEX trmpath_ontid ON term_path(ontology_id);
CREATE TABLE bioentry (
bioentry_id INTEGER PRIMARY KEY,
biodatabase_id INTEGER,
taxon_id INT(10) ,
name VARCHAR(40) NOT NULL,
accession VARCHAR(128) NOT NULL,
identifier VARCHAR(40) ,
division VARCHAR(6),
description TEXT,
version SMALLINT NOT NULL,
UNIQUE (accession,biodatabase_id,version),
UNIQUE (identifier, biodatabase_id),
FOREIGN KEY ( taxon_id ) REFERENCES taxon ( taxon_id ),
FOREIGN KEY ( biodatabase_id ) REFERENCES biodatabase ( biodatabase_id )
);
CREATE INDEX bioentry_name ON bioentry(name);
CREATE INDEX bioentry_db ON bioentry(biodatabase_id);
CREATE INDEX bioentry_tax ON bioentry(taxon_id);
CREATE TABLE bioentry_relationship (
bioentry_relationship_id INTEGER PRIMARY KEY,
object_bioentry_id INTEGER,
subject_bioentry_id INTEGER,
term_id INTEGER,
rank INT(5),
UNIQUE (object_bioentry_id,subject_bioentry_id,term_id),
FOREIGN KEY ( term_id ) REFERENCES term ( term_id ),
FOREIGN KEY ( object_bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE,
FOREIGN KEY ( subject_bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE
);
CREATE INDEX bioentryrel_trm ON bioentry_relationship(term_id);
CREATE INDEX bioentryrel_child ON bioentry_relationship(subject_bioentry_id);
CREATE TABLE bioentry_path (
object_bioentry_id INTEGER PRIMARY KEY,
subject_bioentry_id INTEGER,
term_id INTEGER,
distance INT(10) ,
UNIQUE (object_bioentry_id,subject_bioentry_id,term_id,distance),
FOREIGN KEY ( term_id ) REFERENCES term ( term_id )
FOREIGN KEY ( object_bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE,
FOREIGN KEY ( subject_bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE
);
CREATE INDEX bioentrypath_trm ON bioentry_path(term_id);
CREATE INDEX bioentrypath_child ON bioentry_path(subject_bioentry_id);
CREATE TABLE biosequence (
bioentry_id INTEGER PRIMARY KEY,
version SMALLINT,
length INT(10),
alphabet VARCHAR(10),
seq LONGTEXT,
FOREIGN KEY ( bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE
);
CREATE TABLE dbxref (
dbxref_id INTEGER PRIMARY KEY,
dbname VARCHAR(40) NOT NULL,
accession VARCHAR(128) NOT NULL,
version SMALLINT NOT NULL,
UNIQUE(accession, dbname, version)
);
CREATE INDEX dbxref_db ON dbxref(dbname);
CREATE TABLE dbxref_qualifier_value (
dbxref_id INTEGER,
term_id INTEGER,
rank SMALLINT NOT NULL DEFAULT 0,
value TEXT,
PRIMARY KEY (dbxref_id,term_id,rank),
FOREIGN KEY ( term_id ) REFERENCES term ( term_id ),
FOREIGN KEY ( dbxref_id ) REFERENCES dbxref ( dbxref_id ) ON DELETE CASCADE
);
CREATE INDEX dbxrefqual_dbx ON dbxref_qualifier_value(dbxref_id);
CREATE INDEX dbxrefqual_trm ON dbxref_qualifier_value(term_id);
CREATE TABLE bioentry_dbxref (
bioentry_id INTEGER,
dbxref_id INTEGER,
rank SMALLINT,
PRIMARY KEY (bioentry_id,dbxref_id),
FOREIGN KEY ( bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE,
FOREIGN KEY ( dbxref_id ) REFERENCES dbxref ( dbxref_id ) ON DELETE CASCADE
);
CREATE INDEX dblink_dbx ON bioentry_dbxref(dbxref_id);
CREATE TABLE reference (
reference_id INTEGER PRIMARY KEY,
dbxref_id INT(10) ,
location TEXT NOT NULL,
title TEXT,
authors TEXT,
crc VARCHAR(32),
UNIQUE (dbxref_id),
UNIQUE (crc),
FOREIGN KEY ( dbxref_id ) REFERENCES dbxref ( dbxref_id )
);
CREATE TABLE bioentry_reference (
bioentry_id INTEGER,
reference_id INTEGER,
start_pos INT(10),
end_pos INT(10),
rank SMALLINT NOT NULL DEFAULT 0,
PRIMARY KEY(bioentry_id,reference_id,rank),
FOREIGN KEY ( bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE
FOREIGN KEY ( reference_id ) REFERENCES reference ( reference_id ) ON DELETE CASCADE
);
CREATE INDEX bioentryref_ref ON bioentry_reference(reference_id);
CREATE TABLE comment (
comment_id INTEGER PRIMARY KEY,
bioentry_id INTEGER,
comment_text TEXT NOT NULL,
rank SMALLINT NOT NULL DEFAULT 0,
UNIQUE(bioentry_id, rank),
FOREIGN KEY ( bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE
);
CREATE TABLE bioentry_qualifier_value (
bioentry_id INTEGER,
term_id INTEGER,
value TEXT,
rank INT(5) NOT NULL DEFAULT 0,
UNIQUE (bioentry_id,term_id,rank),
FOREIGN KEY ( bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE,
FOREIGN KEY ( term_id ) REFERENCES term ( term_id )
);
CREATE INDEX bioentryqual_trm ON bioentry_qualifier_value(term_id);
CREATE TABLE seqfeature (
seqfeature_id INTEGER PRIMARY KEY,
bioentry_id INTEGER,
type_term_id INTEGER,
source_term_id INTEGER,
display_name VARCHAR(64),
rank SMALLINT NOT NULL DEFAULT 0,
UNIQUE (bioentry_id,type_term_id,source_term_id,rank),
FOREIGN KEY ( type_term_id ) REFERENCES term ( term_id ),
FOREIGN KEY ( source_term_id ) REFERENCES term ( term_id ),
FOREIGN KEY ( bioentry_id ) REFERENCES bioentry ( bioentry_id ) ON DELETE CASCADE
);
CREATE INDEX seqfeature_trm ON seqfeature(type_term_id);
CREATE INDEX seqfeature_fsrc ON seqfeature(source_term_id);
CREATE TABLE seqfeature_relationship (
seqfeature_relationship_id INTEGER PRIMARY KEY,
object_seqfeature_id INTEGER,
subject_seqfeature_id INTEGER,
term_id INTEGER,
rank INT(5),
UNIQUE (object_seqfeature_id,subject_seqfeature_id,term_id),
FOREIGN KEY ( term_id ) REFERENCES term ( term_id ),
FOREIGN KEY ( object_seqfeature_id ) REFERENCES seqfeature ( seqfeature_id ) ON DELETE CASCADE,
FOREIGN KEY ( subject_seqfeature_id ) REFERENCES seqfeature ( seqfeature_id ) ON DELETE CASCADE
);
CREATE INDEX seqfeaturerel_trm ON seqfeature_relationship(term_id);
CREATE INDEX seqfeaturerel_child ON seqfeature_relationship(subject_seqfeature_id);
CREATE TABLE seqfeature_path (
object_seqfeature_id INTEGER,
subject_seqfeature_id INTEGER,
term_id INTEGER,
distance INT(10) ,
UNIQUE (object_seqfeature_id,subject_seqfeature_id,term_id,distance),
FOREIGN KEY ( term_id ) REFERENCES term ( term_id ),
FOREIGN KEY ( object_seqfeature_id ) REFERENCES seqfeature ( seqfeature_id ) ON DELETE CASCADE,
FOREIGN KEY ( subject_seqfeature_id ) REFERENCES seqfeature ( seqfeature_id ) ON DELETE CASCADE
);
CREATE INDEX seqfeaturepath_trm ON seqfeature_path(term_id);
CREATE INDEX seqfeaturepath_child ON seqfeature_path(subject_seqfeature_id);
CREATE TABLE seqfeature_qualifier_value (
seqfeature_id INTEGER,
term_id INTEGER,
rank SMALLINT NOT NULL DEFAULT 0,
value TEXT NOT NULL,
PRIMARY KEY (seqfeature_id,term_id,rank),
FOREIGN KEY ( term_id ) REFERENCES term ( term_id ),
FOREIGN KEY ( seqfeature_id ) REFERENCES seqfeature ( seqfeature_id ) ON DELETE CASCADE
);
CREATE INDEX seqfeaturequal_trm ON seqfeature_qualifier_value(term_id);
CREATE TABLE seqfeature_dbxref (
seqfeature_id INTEGER,
dbxref_id INTEGER,
rank SMALLINT,
PRIMARY KEY (seqfeature_id,dbxref_id),
FOREIGN KEY ( seqfeature_id ) REFERENCES seqfeature ( seqfeature_id ) ON DELETE CASCADE,
FOREIGN KEY ( dbxref_id ) REFERENCES dbxref ( dbxref_id ) ON DELETE CASCADE
);
CREATE INDEX feadblink_dbx ON seqfeature_dbxref(dbxref_id);
CREATE TABLE location (
location_id INTEGER PRIMARY KEY,
seqfeature_id INTEGER,
dbxref_id INT(10),
term_id INT(10),
start_pos INT(10),
end_pos INT(10),
strand TINYINT NOT NULL DEFAULT 0,
rank SMALLINT NOT NULL DEFAULT 0,
UNIQUE (seqfeature_id, rank),
FOREIGN KEY ( seqfeature_id ) REFERENCES seqfeature ( seqfeature_id ) ON DELETE CASCADE,
FOREIGN KEY ( dbxref_id ) REFERENCES dbxref ( dbxref_id ),
FOREIGN KEY ( term_id ) REFERENCES term ( term_id )
);
CREATE INDEX seqfeatureloc_start ON location(start_pos, end_pos);
CREATE INDEX seqfeatureloc_dbx ON location(dbxref_id);
CREATE INDEX seqfeatureloc_trm ON location(term_id);
CREATE TABLE location_qualifier_value (
location_id INTEGER,
term_id INTEGER,
value VARCHAR(255) NOT NULL,
int_value INT(10),
PRIMARY KEY (location_id,term_id),
FOREIGN KEY ( location_id ) REFERENCES location ( location_id ) ON DELETE CASCADE,
FOREIGN KEY ( term_id ) REFERENCES term ( term_id )
);
CREATE INDEX locationqual_trm ON location_qualifier_value(term_id);
|