Project

General

Profile

1 2276 jones
/**
2
 *  '$RCSfile$'
3
 *  Copyright: 2004 Regents of the University of California and the
4
 *             National Center for Ecological Analysis and Synthesis
5
 *
6
 *   '$Author$'
7
 *     '$Date$'
8
 * '$Revision$'
9
 *
10 2599 jones
 * This program is free software, you can redistribute it and/or modify
11 2276 jones
 * it under the terms of the GNU General Public License as published by
12 2599 jones
 * the Free Software Foundation, either version 2 of the License, or
13 2276 jones
 * (at your option) any later version.
14
 *
15
 * This program is distributed in the hope that it will be useful,
16 2599 jones
 * but WITHOUT ANY WARRANTY, without even the implied warranty of
17 2276 jones
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
18
 * GNU General Public License for more details.
19
 *
20
 * You should have received a copy of the GNU General Public License
21 2599 jones
 * along with this program, if not, write to the Free Software
22 2276 jones
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
23
 */
24 2422 sgarg
25 2276 jones
/*
 * This SQL script does the same as the SQL script named
 * xmltables.sql, except that this script is to be used to
 * create the database tables on a PostgreSQL backend rather
 * than an Oracle backend
 */
31
32
/*
 * Replication -- table to store servers that metacat is replicated to.
 * serverid is filled from xml_replication_id_seq when not supplied.
 * A row for 'localhost' is seeded immediately after the table is created.
 */
CREATE SEQUENCE xml_replication_id_seq;
CREATE TABLE xml_replication (
  serverid INT8 default nextval('xml_replication_id_seq'),
  server VARCHAR(512),
  last_checked DATE,
  replicate INT8,
  datareplicate INT8,
  hub INT8,
  CONSTRAINT xml_replication_pk PRIMARY KEY (serverid)
);

-- Seed the 'localhost' row. replicate, datareplicate and hub are INT8
-- columns, so integer literals are used rather than quoted strings that
-- depend on implicit string-to-integer coercion.
INSERT INTO xml_replication (server, replicate, datareplicate, hub)
VALUES ('localhost', 0, 0, 0);
47 2276 jones
48 6814 leinfelder
49 2422 sgarg
/*
 * Nodes -- one row per XML node (elements and attributes alike)
 */
CREATE SEQUENCE xml_nodes_id_seq;

CREATE TABLE xml_nodes (
    nodeid            INT8 DEFAULT nextval('xml_nodes_id_seq'),  -- unique node id (pk)
    nodeindex         INT8,          -- order of the node within its parent
    nodetype          VARCHAR(20),   -- DOCUMENT, COMMENT, PI, ELEMENT, ATTRIBUTE or TEXT
    nodename          VARCHAR(250),  -- name of the element or attribute
    nodeprefix        VARCHAR(50),   -- namespace prefix of the node
    nodedata          TEXT,          -- data for the node (for TEXT nodes, the content)
    parentnodeid      INT8,          -- parent of this node
    rootnodeid        INT8,          -- root node of the tree this node is in
    docid             VARCHAR(250),  -- document id
    date_created      DATE,
    date_updated      DATE,
    nodedatanumerical FLOAT8,        -- data for the node when it is a number
    nodedatadate      TIMESTAMP,     -- data for the node when it is a date
    CONSTRAINT xml_nodes_pk PRIMARY KEY (nodeid),
    -- both foreign keys are self-references to this table's primary key
    CONSTRAINT xml_nodes_root_fk
        FOREIGN KEY (rootnodeid) REFERENCES xml_nodes (nodeid),
    CONSTRAINT xml_nodes_parent_fk
        FOREIGN KEY (parentnodeid) REFERENCES xml_nodes (nodeid)
);

/*
 * Indexes on rootnodeid, parentnodeid, nodename and docid in xml_nodes
 */
CREATE INDEX xml_nodes_idx1 ON xml_nodes (rootnodeid);
CREATE INDEX xml_nodes_idx2 ON xml_nodes (parentnodeid);
CREATE INDEX xml_nodes_idx3 ON xml_nodes (nodename);
CREATE INDEX xml_nodes_idx4 ON xml_nodes (docid);
83 2276 jones
84 2519 sgarg
85 2422 sgarg
/*
 * Nodes of old document revisions and of deleted documents.
 * Same columns as xml_nodes, except that nodeid has no sequence default.
 */
CREATE TABLE xml_nodes_revisions (
    nodeid            INT8,          -- unique node id (pk)
    nodeindex         INT8,          -- order of the node within its parent
    nodetype          VARCHAR(20),   -- DOCUMENT, COMMENT, PI, ELEMENT, ATTRIBUTE or TEXT
    nodename          VARCHAR(250),  -- name of the element or attribute
    nodeprefix        VARCHAR(50),   -- namespace prefix of the node
    nodedata          TEXT,          -- data for the node (for TEXT nodes, the content)
    parentnodeid      INT8,          -- parent of this node
    rootnodeid        INT8,          -- root node of the tree this node is in
    docid             VARCHAR(250),  -- document id
    date_created      DATE,
    date_updated      DATE,
    nodedatanumerical FLOAT8,        -- data for the node when it is a number
    nodedatadate      TIMESTAMP,     -- data for the node when it is a date
    CONSTRAINT xml_nodes_revisions_pk PRIMARY KEY (nodeid),
    -- both foreign keys are self-references to this table's primary key
    CONSTRAINT xml_nodes_revisions_root_fk
        FOREIGN KEY (rootnodeid) REFERENCES xml_nodes_revisions (nodeid),
    CONSTRAINT xml_nodes_revisions_parent_fk
        FOREIGN KEY (parentnodeid) REFERENCES xml_nodes_revisions (nodeid)
);

/*
 * Indexes on rootnodeid, parentnodeid and nodename in xml_nodes_revisions
 */
CREATE INDEX xml_nodes_revisions_idx1 ON xml_nodes_revisions (rootnodeid);
CREATE INDEX xml_nodes_revisions_idx2 ON xml_nodes_revisions (parentnodeid);
CREATE INDEX xml_nodes_revisions_idx3 ON xml_nodes_revisions (nodename);
117
118
119
120
/*
 * XML Catalog -- all external sources for XML documents
 */
CREATE SEQUENCE xml_catalog_id_seq;

CREATE TABLE xml_catalog (
    catalog_id     INT8 DEFAULT nextval('xml_catalog_id_seq'),  -- id of this catalog entry
    entry_type     VARCHAR(500),   -- type of the entry (e.g., DTD, XSD, XSL)
    source_doctype VARCHAR(500),   -- source public_id for transforms
    target_doctype VARCHAR(500),   -- target public_id for transforms
    public_id      VARCHAR(500),   -- unique id for this type
    system_id      VARCHAR(1000),  -- local location of the object
    format_id      VARCHAR(1000),  -- format id from dataone
    CONSTRAINT xml_catalog_pk PRIMARY KEY (catalog_id),
    CONSTRAINT xml_catalog_uk
        UNIQUE (entry_type, source_doctype, target_doctype, public_id, format_id)
);
138
139 2422 sgarg
/*
 * Sequence used to obtain a unique id for accession numbers
 */
CREATE SEQUENCE xml_documents_id_seq;

/*
 * Documents -- one row per stored XML document
 */
CREATE TABLE xml_documents (
    docid           VARCHAR(250),    -- document id #
    rootnodeid      INT8,            -- root node of the DOM (xml_nodes)
    docname         VARCHAR(100),    -- usually the root element name
    doctype         VARCHAR(100),    -- public id indicating the document type
    user_owner      VARCHAR(100),    -- user who owns the document
    user_updated    VARCHAR(100),    -- user who updated the document
    server_location INT8,            -- server on which the document resides
    rev             INT8 DEFAULT 1,  -- revision number of the document
    date_created    DATE,
    date_updated    DATE,
    public_access   INT8,            -- flag for public access
    catalog_id      INT8,            -- reference to xml_catalog
    CONSTRAINT xml_documents_pk PRIMARY KEY (docid),
    CONSTRAINT xml_documents_rep_fk
        FOREIGN KEY (server_location) REFERENCES xml_replication (serverid),
    CONSTRAINT xml_documents_root_fk
        FOREIGN KEY (rootnodeid) REFERENCES xml_nodes (nodeid),
    CONSTRAINT xml_documents_catalog_fk
        FOREIGN KEY (catalog_id) REFERENCES xml_catalog (catalog_id)
);

/*
 * Indexes on xml_documents: <docid, doctype>, lower(user_owner),
 * rootnodeid and <docid, rev>. The index names skip idx4.
 */
CREATE INDEX xml_documents_idx1 ON xml_documents (docid, doctype);
CREATE INDEX xml_documents_idx2 ON xml_documents (lower(user_owner));
CREATE INDEX xml_documents_idx3 ON xml_documents (rootnodeid);
CREATE INDEX xml_documents_idx5 ON xml_documents (docid, rev);
175 2276 jones
176 2422 sgarg
/*
 * Revised Documents -- XML documents saved after an UPDATE or DELETE.
 * The root node points into xml_nodes_revisions rather than xml_nodes.
 */
CREATE SEQUENCE xml_revisions_id_seq;

CREATE TABLE xml_revisions (
    revisionid      INT8 DEFAULT nextval('xml_revisions_id_seq'),  -- the revision number we are saving
    docid           VARCHAR(250),  -- document id #
    rootnodeid      INT8,          -- root node of the DOM (xml_nodes_revisions)
    docname         VARCHAR(100),  -- usually the root element name
    doctype         VARCHAR(100),  -- public id indicating the document type
    user_owner      VARCHAR(100),
    user_updated    VARCHAR(100),
    server_location INT8,
    rev             INT8,
    date_created    DATE,
    date_updated    DATE,
    public_access   INT8,          -- flag for public access
    catalog_id      INT8,          -- reference to xml_catalog
    CONSTRAINT xml_revisions_pk PRIMARY KEY (revisionid),
    CONSTRAINT xml_revisions_rep_fk
        FOREIGN KEY (server_location) REFERENCES xml_replication (serverid),
    CONSTRAINT xml_revisions_root_fk
        FOREIGN KEY (rootnodeid) REFERENCES xml_nodes_revisions (nodeid),
    CONSTRAINT xml_revisions_catalog_fk
        FOREIGN KEY (catalog_id) REFERENCES xml_catalog (catalog_id)
);

CREATE INDEX xml_revisions_idx1 ON xml_revisions (docid);
206 2276 jones
207 2422 sgarg
/*
 * ACL -- access control entries for XML documents, by principal
 */
CREATE TABLE xml_access (
    guid           TEXT,          -- refers to system metadata (no FK constraint is declared here)
    accessfileid   TEXT,          -- id of the access file
    principal_name VARCHAR(100),  -- name of user, group, etc.
    permission     INT8,          -- "read", "write", "all"
    perm_type      VARCHAR(32),   -- "allowed" or "denied"
    perm_order     VARCHAR(32),   -- "allow first" or "deny first"
    begin_time     DATE,          -- time at which the permission begins
    end_time       DATE,          -- time at which the permission ends
    ticket_count   INT8,          -- ticket counter for the permission
    subtreeid      VARCHAR(32),
    startnodeid    INT8,
    endnodeid      INT8,
    -- when both times are set, the permission must begin before it ends
    CONSTRAINT xml_access_ck CHECK (begin_time < end_time)
);

CREATE INDEX xml_access_idx1 ON xml_access (lower(principal_name));
CREATE INDEX xml_access_idx2 ON xml_access (permission);
CREATE INDEX xml_access_idx3 ON xml_access (perm_type);
CREATE INDEX xml_access_idx4 ON xml_access (perm_order);
CREATE INDEX xml_access_idx5 ON xml_access (subtreeid);
CREATE INDEX xml_access_idx6 ON xml_access (guid);

/*
 * Retained, intentionally not executed (the table above already has guid):
 * ALTER TABLE xml_access ADD COLUMN guid text;
 */
234 2276 jones
235 2422 sgarg
/*
 * Index of Nodes -- precomputed paths through the tree, kept for
 * quick searching in structured searches
 */
CREATE TABLE xml_index (
    nodeid       INT8,          -- unique node id
    path         TEXT,          -- precomputed path through the tree
    docid        VARCHAR(250),  -- document id
    doctype      VARCHAR(100),  -- public id indicating the document type
    parentnodeid INT8,          -- parent of the node represented by this row
    CONSTRAINT xml_index_pk PRIMARY KEY (nodeid, path),
    CONSTRAINT xml_index_nodeid_fk
        FOREIGN KEY (nodeid) REFERENCES xml_nodes (nodeid),
    CONSTRAINT xml_index_docid_fk
        FOREIGN KEY (docid) REFERENCES xml_documents (docid)
);

/*
 * Indexes on path, docid and nodeid in xml_index
 */
CREATE INDEX xml_index_idx1 ON xml_index (path);
CREATE INDEX xml_index_idx2 ON xml_index (docid);
CREATE INDEX xml_index_idx3 ON xml_index (nodeid);
258 2276 jones
259
/*
 * Relations -- subject / relationship / object triples, each tied to the
 * package file (docid) that the relation came from
 */
CREATE SEQUENCE xml_relation_id_seq;

CREATE TABLE xml_relation (
    -- unique id; the primary key is declared inline and left unnamed
    relationid   INT8 DEFAULT nextval('xml_relation_id_seq') PRIMARY KEY,
    docid        VARCHAR(250),           -- docid of the package file the relation came from
    packagetype  VARCHAR(250),           -- type of the package
    subject      VARCHAR(512) NOT NULL,  -- subject of the relation
    subdoctype   VARCHAR(128),           -- doctype of the subject
    relationship VARCHAR(128) NOT NULL,  -- relationship type
    object       VARCHAR(512) NOT NULL,  -- object of the relation
    objdoctype   VARCHAR(128),           -- doctype of the object
    CONSTRAINT xml_relation_uk UNIQUE (docid, subject, relationship, object),
    CONSTRAINT xml_relation_docid_fk
        FOREIGN KEY (docid) REFERENCES xml_documents (docid)
);
275
276 2422 sgarg
/*
 * Stores all document identifiers in metacat. Every identifier pairs a
 * globally unique, unconstrained string (the GUID) with a local metacat
 * identifier made of the docid and revision fields. Each row maps one
 * global identifier to the local identifier (docid) used within metacat.
 */
CREATE TABLE identifier (
    guid  TEXT,          -- globally unique string identifier
    docid VARCHAR(250),  -- local document id #
    rev   INT8,          -- revision part of the local identifier
    CONSTRAINT identifier_pk PRIMARY KEY (guid)
);

-- NOTE(review): the primary key already provides a unique index on guid, so
-- identifier_guid looks redundant -- confirm nothing depends on it by name
-- before dropping it.
CREATE INDEX identifier_guid ON identifier (guid);
CREATE INDEX identifier_docid ON identifier (docid);
CREATE INDEX identifier_rev ON identifier (rev);
CREATE INDEX identifier_docid_rev ON identifier (docid, rev);
-- expression index on the concatenated "docid.rev" form
CREATE INDEX identifier_docid_rev_log ON identifier ((docid||'.'||rev));
294 2276 jones
295 2422 sgarg
/*
 * Stores the system metadata of objects, keyed by guid, with restraints
 * similar to those of the identifier table. The identifier table cannot be
 * used for this purpose because then you have to worry about whether you
 * insert the data first or the systemMetadata first.
 */
CREATE TABLE systemMetadata (
    guid                    TEXT,          -- globally unique string identifier of the described object
    series_id               TEXT,          -- series identifier
    serial_version          VARCHAR(256),  -- serial version of the object
    date_uploaded           TIMESTAMP,     -- date/time the document was first submitted
    rights_holder           VARCHAR(250),  -- user who has rights to the document, usually the first person to upload it
    checksum                VARCHAR(512),  -- checksum of the doc, computed with checksum_algorithm
    checksum_algorithm      VARCHAR(250),  -- algorithm used to calculate the checksum
    origin_member_node      VARCHAR(250),  -- member node where the document was first uploaded
    authoritive_member_node VARCHAR(250),  -- member node that currently controls the document
    date_modified           TIMESTAMP,     -- last date/time that the file was changed
    submitter               VARCHAR(256),  -- user who originally submitted the doc
    object_format           VARCHAR(256),  -- format of the object
    size                    VARCHAR(256),  -- size of the object
    archived                BOOLEAN,       -- whether this is an archived object
    replication_allowed     BOOLEAN,       -- replication allowed
    number_replicas         INT8,          -- number of replicas allowed
    obsoletes               TEXT,          -- identifier that this record obsoletes
    obsoleted_by            TEXT,          -- identifier of the record that replaces this record
    media_type              TEXT,          -- media type of this object
    file_name               TEXT,          -- suggested file name for this object
    CONSTRAINT systemMetadata_pk PRIMARY KEY (guid)
);
324 9224 tao
325 6100 leinfelder
/*
 * Properties of media types. They belong to the system metadata, but since
 * one media type can carry several properties they are kept in a separate
 * table. The guids in this table refer to the guids in systemMetadata.
 */
CREATE TABLE smMediaTypeProperties (
    guid  TEXT,  -- refers to guid in the system metadata table
    name  TEXT,  -- name of the property
    value TEXT,  -- value of the property
    CONSTRAINT smMediaTypeProperties_fk
        FOREIGN KEY (guid) REFERENCES systemMetadata (guid) DEFERRABLE
);
337
/*
338 6100 leinfelder
 * For devs to remove docid, rev
339
 * ALTER TABLE systemMetadata DROP COLUMN docid;
340
 * ALTER TABLE systemMetadata DROP COLUMN rev;
341 6107 leinfelder
 * ALTER TABLE systemMetadata ADD COLUMN replication_allowed boolean;
342
 * ALTER TABLE systemMetadata ADD COLUMN number_replicas INT8;
343 6100 leinfelder
 */
344 5333 berkley
345 9483 tao
/*
 * Replication policy entries per system metadata guid and member node.
 * policy_id defaults from policy_id_seq; no primary key is declared.
 */
CREATE SEQUENCE policy_id_seq;

CREATE TABLE smReplicationPolicy (
    policy_id   INT8 DEFAULT nextval('policy_id_seq'),
    guid        TEXT,          -- globally unique string identifier of the described object
    member_node VARCHAR(250),  -- replication member node
    policy      TEXT,          -- the policy (preferred, blocked, etc...TBD)
    CONSTRAINT smReplicationPolicy_fk
        FOREIGN KEY (guid) REFERENCES systemMetadata (guid) DEFERRABLE
);
354
355 7392 leinfelder
/*
 * Replication status entries per system metadata guid and member node
 */
CREATE TABLE smReplicationStatus (
    guid          TEXT,          -- globally unique string identifier of the described object
    member_node   VARCHAR(250),  -- replication member node
    status        VARCHAR(250),  -- replication status
    date_verified TIMESTAMP,     -- date on which replication was verified
    CONSTRAINT smReplicationStatus_fk
        FOREIGN KEY (guid) REFERENCES systemMetadata (guid) DEFERRABLE
);
363
364 6098 leinfelder
/*
 * accesssubtree -- access subtree info for documents
 */
CREATE TABLE xml_accesssubtree (
    docid        VARCHAR(250),    -- document id #
    rev          INT8 DEFAULT 1,  -- revision number of the document
    controllevel VARCHAR(50),     -- level being controlled: document or subtree
    subtreeid    VARCHAR(250),    -- subtree id
    startnodeid  INT8,            -- start node id of the access subtree
    endnodeid    INT8,            -- end node id of the access subtree
    CONSTRAINT xml_accesssubtree_docid_fk
        FOREIGN KEY (docid) REFERENCES xml_documents (docid)
);
377
378
/*
 * Returnfields -- combinations of returnfields that have been requested,
 * together with the number of times each one was requested
 */
CREATE SEQUENCE xml_returnfield_id_seq;

CREATE TABLE xml_returnfield (
    returnfield_id     INT8 DEFAULT nextval('xml_returnfield_id_seq'),  -- id of this returnfield entry
    returnfield_string VARCHAR(2000),  -- the returnfield string
    usage_count        INT8,           -- number of times this string has been requested
    CONSTRAINT xml_returnfield_pk PRIMARY KEY (returnfield_id)
);

CREATE INDEX xml_returnfield_idx1 ON xml_returnfield (returnfield_string);
390
391
/*
 * Queryresults -- query results stored for a given docid and
 * returnfield_id
 */
CREATE SEQUENCE xml_queryresult_id_seq;

CREATE TABLE xml_queryresult (
    queryresult_id     INT8 DEFAULT nextval('xml_queryresult_id_seq'),  -- id of this entry
    returnfield_id     INT8,          -- returnfield this entry corresponds to
    docid              VARCHAR(250),  -- docid of the document
    queryresult_string TEXT,          -- text generated for this docid and the given returnfield
    CONSTRAINT xml_queryresult_pk PRIMARY KEY (queryresult_id),
    CONSTRAINT xml_queryresult_searchid_fk
        FOREIGN KEY (returnfield_id) REFERENCES xml_returnfield (returnfield_id)
);

CREATE INDEX xml_queryresult_idx1 ON xml_queryresult (returnfield_id, docid);
408
409
/*
 * Logging -- log of metadata and data access events
 */
CREATE SEQUENCE access_log_id_seq;

CREATE TABLE access_log (
    entryid     INT8 DEFAULT nextval('access_log_id_seq'),  -- identifier of the log event
    ip_address  VARCHAR(512),  -- ip address initiating the event
    user_agent  VARCHAR(512),  -- user agent of the request
    principal   VARCHAR(512),  -- user initiating the event
    docid       VARCHAR(250),  -- document id #
    event       VARCHAR(512),  -- code symbolizing the event type
    date_logged TIMESTAMP,     -- datetime at which the event occurred
    CONSTRAINT access_log_pk PRIMARY KEY (entryid)
);

CREATE INDEX access_log_docid ON access_log (docid);
424 2276 jones
425 8335 leinfelder
426 7830 leinfelder
/*
 * index_event -- table used by the solr-based indexing.
 * No keys or constraints are declared on it.
 */
CREATE TABLE index_event (
    guid         TEXT,
    event_action VARCHAR(250),
    description  TEXT,
    event_date   TIMESTAMP
);
435 2514 sgarg
436 2422 sgarg
/*
 * Index of the paths specified by the administrator in metacat.properties
 */
CREATE SEQUENCE xml_path_index_id_seq;

CREATE TABLE xml_path_index (
    nodeid            INT8 DEFAULT nextval('xml_path_index_id_seq'),
    docid             VARCHAR(250),  -- document id
    path              TEXT,          -- precomputed path through the tree
    nodedata          TEXT,          -- data for the node (for TEXT nodes, the content)
    nodedatanumerical FLOAT8,        -- data for the node when it is a number
    nodedatadate      TIMESTAMP,     -- data for the node when it is a date
    parentnodeid      INT8,          -- parent of the node represented by this row
    CONSTRAINT xml_path_index_pk PRIMARY KEY (nodeid),
    CONSTRAINT xml_path_index_docid_fk
        FOREIGN KEY (docid) REFERENCES xml_documents (docid)
);

/*
 * Indexes on path, nodedata, nodedatanumerical, upper(nodedata),
 * nodedatadate and docid in xml_path_index
 */
CREATE INDEX xml_path_index_idx1 ON xml_path_index (path);
CREATE INDEX xml_path_index_idx2 ON xml_path_index (nodedata);
CREATE INDEX xml_path_index_idx3 ON xml_path_index (nodedatanumerical);
CREATE INDEX xml_path_index_idx4 ON xml_path_index (upper(nodedata));
CREATE INDEX xml_path_index_idx5 ON xml_path_index (nodedatadate);
CREATE INDEX xml_path_index_idx6 ON xml_path_index (docid);
465 2514 sgarg
466
/*
 * harvest_site_schedule -- harvest sites and their schedule info
 */
CREATE TABLE harvest_site_schedule (
    site_schedule_id INT8,          -- unique id
    documentlisturl  VARCHAR(255),  -- URL of the site harvest document list
    ldapdn           VARCHAR(255),  -- LDAP distinguished name of the site account
    datenextharvest  DATE,          -- scheduled date of the next harvest
    datelastharvest  DATE,          -- recorded date of the last harvest
    updatefrequency  INT8,          -- harvest update frequency
    unit             VARCHAR(50),   -- update unit: days, weeks or months
    contact_email    VARCHAR(50),   -- email address of the site contact person
    ldappwd          VARCHAR(20),   -- LDAP password of the site account
    CONSTRAINT harvest_site_schedule_pk PRIMARY KEY (site_schedule_id)
);
481
482 2422 sgarg
/*
 * harvest_log -- log entries for harvest operations
 */
CREATE TABLE harvest_log (
    harvest_log_id         INT8,           -- unique id
    harvest_date           DATE,           -- date of the current harvest
    status                 INT8,           -- non-zero indicates an error status
    message                VARCHAR(1000),  -- text message of this log entry
    harvest_operation_code VARCHAR(1000),  -- type of harvest operation
    site_schedule_id       INT8,           -- site schedule id, or 0 if no site
    CONSTRAINT harvest_log_pk PRIMARY KEY (harvest_log_id)
);
494
495 2422 sgarg
/*
 * harvest_detail_log -- detailed info about the documents that generated
 *                       errors during the harvest
 */
CREATE TABLE harvest_detail_log (
    detail_log_id  INT8,           -- unique id
    harvest_log_id INT8,           -- pointer to the related log entry
    scope          VARCHAR(50),    -- document scope
    identifier     INT8,           -- document identifier
    revision       INT8,           -- document revision
    document_url   VARCHAR(255),   -- document URL
    error_message  VARCHAR(1000),  -- text error message
    document_type  VARCHAR(100),   -- document type
    CONSTRAINT harvest_detail_log_pk PRIMARY KEY (detail_log_id),
    CONSTRAINT harvest_detail_log_fk
        FOREIGN KEY (harvest_log_id) REFERENCES harvest_log (harvest_log_id)
);
512
513 4080 daigle
/*
 * db_version -- version history of this database
 */
CREATE SEQUENCE db_version_id_seq;

CREATE TABLE db_version (
    db_version_id INT8 DEFAULT nextval('db_version_id_seq'),  -- identifier of the version
    version       VARCHAR(250),  -- version number
    status        INT8,          -- status of the version
    date_created  TIMESTAMP,     -- datetime at which the version was created
    CONSTRAINT db_version_pk PRIMARY KEY (db_version_id)
);
524 4975 daigle
525
/*
 * scheduled_job -- scheduled jobs.
 * Every column except end_time is required; name must be unique.
 */
CREATE SEQUENCE scheduled_job_id_seq;

CREATE TABLE scheduled_job (
    id             INT8          DEFAULT nextval('scheduled_job_id_seq') NOT NULL,
    date_created   TIMESTAMP     NOT NULL,
    date_updated   TIMESTAMP     NOT NULL,
    status         VARCHAR(64)   NOT NULL,
    name           VARCHAR(512)  NOT NULL,
    trigger_name   VARCHAR(512)  NOT NULL,
    group_name     VARCHAR(512)  NOT NULL,
    class_name     VARCHAR(1024) NOT NULL,
    start_time     TIMESTAMP     NOT NULL,
    end_time       TIMESTAMP,    -- the only nullable column
    interval_value INT           NOT NULL,
    interval_unit  VARCHAR(8)    NOT NULL,
    CONSTRAINT scheduled_job_pk PRIMARY KEY (id),
    CONSTRAINT scheduled_job_uk UNIQUE (name)
);
545
546
/*
 * scheduled_job_params -- key/value rows attached to a scheduled_job
 * through job_id. All columns are required.
 */
CREATE SEQUENCE scheduled_job_params_id_seq;

CREATE TABLE scheduled_job_params (
    id           INT8          DEFAULT nextval('scheduled_job_params_id_seq') NOT NULL,
    date_created TIMESTAMP     NOT NULL,
    date_updated TIMESTAMP     NOT NULL,
    status       VARCHAR(64)   NOT NULL,
    job_id       INT8          NOT NULL,  -- the scheduled_job row this entry belongs to
    key          VARCHAR(64)   NOT NULL,
    value        VARCHAR(1024) NOT NULL,
    CONSTRAINT scheduled_job_params_pk PRIMARY KEY (id),
    CONSTRAINT scheduled_job_params_fk
        FOREIGN KEY (job_id) REFERENCES scheduled_job (id)
);