/**
 *  '$RCSfile$'
 *  Copyright: 2004 Regents of the University of California and the
 *             National Center for Ecological Analysis and Synthesis
 *
 *   '$Author: berkley $'
 *     '$Date: 2011-02-04 12:39:21 -0800 (Fri, 04 Feb 2011) $'
 * '$Revision: 5917 $'
 *
 * This program is free software, you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY, without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program, if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */
24

    
25
/*
 * This SQL script does the same as the SQL script named
 * xmltables.sql, except that this script is to be used to
 * create the database tables on a PostgreSQL backend rather
 * than an Oracle backend.
 */
31

    
32
/*
 * Replication -- table to store servers that metacat is replicated to
 */
CREATE SEQUENCE xml_replication_id_seq;
CREATE TABLE xml_replication (
  serverid      INT8 DEFAULT nextval('xml_replication_id_seq'), -- unique server id (pk)
  server        VARCHAR(512),  -- server name; the seed row below uses 'localhost'
  last_checked  DATE,
  replicate     INT8,
  datareplicate INT8,
  hub           INT8,
  CONSTRAINT xml_replication_pk PRIMARY KEY (serverid)
);

-- Seed row for the local server; serverid is filled in by the sequence default.
-- The INT8 columns receive numeric literals rather than quoted strings.
INSERT INTO xml_replication (server, replicate, datareplicate, hub) VALUES ('localhost', 0, 0, 0);
47

    
48
/*
 * Nodes -- table to store XML Nodes (both elements and attributes)
 */
CREATE SEQUENCE xml_nodes_id_seq;
CREATE TABLE xml_nodes (
  nodeid            INT8 DEFAULT nextval('xml_nodes_id_seq'),
                                  -- the unique node id (pk)
  nodeindex         INT8,         -- order of nodes within parent
  nodetype          VARCHAR(20),  -- type (DOCUMENT, COMMENT, PI,
                                  -- ELEMENT, ATTRIBUTE, TEXT)
  nodename          VARCHAR(250), -- the name of an element or attribute
  nodeprefix        VARCHAR(50),  -- the namespace prefix of the node
  nodedata          TEXT,         -- the data for this node (e.g.,
                                  -- for TEXT it is the content)
  parentnodeid      INT8,         -- index of the parent of this node
  rootnodeid        INT8,         -- index of the root node of this tree
  docid             VARCHAR(250), -- index to the document id
  date_created      DATE,
  date_updated      DATE,
  nodedatanumerical FLOAT8,       -- the data for this node
                                  -- if it is a number
  CONSTRAINT xml_nodes_pk PRIMARY KEY (nodeid),
  -- Both foreign keys are self-references to this table's primary key.
  CONSTRAINT xml_nodes_root_fk
    FOREIGN KEY (rootnodeid) REFERENCES xml_nodes (nodeid),
  CONSTRAINT xml_nodes_parent_fk
    FOREIGN KEY (parentnodeid) REFERENCES xml_nodes (nodeid)
);
/*
 * Indexes of rootnodeid, parentnodeid, nodename, and docid in xml_nodes
 */
CREATE INDEX xml_nodes_idx1 ON xml_nodes (rootnodeid);
CREATE INDEX xml_nodes_idx2 ON xml_nodes (parentnodeid);
CREATE INDEX xml_nodes_idx3 ON xml_nodes (nodename);
CREATE INDEX xml_nodes_idx4 ON xml_nodes (docid);
82

    
83

    
84
/*
 * Table for storing the nodes of old document revisions and of deleted
 * documents. The columns mirror xml_nodes, except that nodeid has no
 * sequence default here.
 */
CREATE TABLE xml_nodes_revisions (
  nodeid            INT8,         -- the unique node id (pk)
  nodeindex         INT8,         -- order of nodes within parent
  nodetype          VARCHAR(20),  -- type (DOCUMENT, COMMENT, PI,
                                  -- ELEMENT, ATTRIBUTE, TEXT)
  nodename          VARCHAR(250), -- the name of an element or attribute
  nodeprefix        VARCHAR(50),  -- the namespace prefix of the node
  nodedata          TEXT,         -- the data for this node (e.g.,
                                  -- for TEXT it is the content)
  parentnodeid      INT8,         -- index of the parent of this node
  rootnodeid        INT8,         -- index of the root node of this tree
  docid             VARCHAR(250), -- index to the document id
  date_created      DATE,
  date_updated      DATE,
  nodedatanumerical FLOAT8,       -- the data for this node
                                  -- if it is a number
  CONSTRAINT xml_nodes_revisions_pk PRIMARY KEY (nodeid),
  -- Both foreign keys are self-references to this table's primary key.
  CONSTRAINT xml_nodes_revisions_root_fk
    FOREIGN KEY (rootnodeid) REFERENCES xml_nodes_revisions (nodeid),
  CONSTRAINT xml_nodes_revisions_parent_fk
    FOREIGN KEY (parentnodeid) REFERENCES xml_nodes_revisions (nodeid)
);

/*
 * Indexes of rootnodeid, parentnodeid, and nodename in xml_nodes_revisions
 */
CREATE INDEX xml_nodes_revisions_idx1 ON xml_nodes_revisions (rootnodeid);
CREATE INDEX xml_nodes_revisions_idx2 ON xml_nodes_revisions (parentnodeid);
CREATE INDEX xml_nodes_revisions_idx3 ON xml_nodes_revisions (nodename);
116
                                                                                                                                                             
117

    
118

    
119
/*
 * XML Catalog -- table to store all external sources for XML documents
 */
CREATE SEQUENCE xml_catalog_id_seq;
CREATE TABLE xml_catalog (
  catalog_id     INT8 DEFAULT nextval('xml_catalog_id_seq'),
                                -- the id for this catalog entry
  entry_type     VARCHAR(500),  -- the type of this catalog entry
                                -- (e.g., DTD, XSD, XSL)
  source_doctype VARCHAR(500),  -- the source public_id for transforms
  target_doctype VARCHAR(500),  -- the target public_id for transforms
  public_id      VARCHAR(500),  -- the unique id for this type
  system_id      VARCHAR(1000), -- the local location of the object
  CONSTRAINT xml_catalog_pk PRIMARY KEY (catalog_id),
  -- system_id is deliberately not part of the uniqueness rule below.
  CONSTRAINT xml_catalog_uk UNIQUE
    (entry_type, source_doctype, target_doctype, public_id)
);
136

    
137
/*
 * Sequence to get uniqueID for Accession #.
 * It is not used as a column default anywhere in this script.
 */
CREATE SEQUENCE xml_documents_id_seq;
/*
 * Documents -- table to store XML documents
 */
CREATE TABLE xml_documents (
  docid           VARCHAR(250), -- the document id #
  rootnodeid      INT8,         -- reference to root node of the DOM
  docname         VARCHAR(100), -- usually the root element name
  doctype         VARCHAR(100), -- public id indicating document type
  user_owner      VARCHAR(100), -- the user who owns the document
  user_updated    VARCHAR(100), -- the user who updated the document
  server_location INT8,         -- the server on which this document resides
  rev             INT8 DEFAULT 1, -- the revision number of the document
  date_created    DATE,
  date_updated    DATE,
  public_access   INT8,         -- flag for public access
  catalog_id      INT8,         -- reference to xml_catalog
  CONSTRAINT xml_documents_pk PRIMARY KEY (docid),
  CONSTRAINT xml_documents_rep_fk
    FOREIGN KEY (server_location) REFERENCES xml_replication (serverid),
  CONSTRAINT xml_documents_root_fk
    FOREIGN KEY (rootnodeid) REFERENCES xml_nodes (nodeid),
  CONSTRAINT xml_documents_catalog_fk
    FOREIGN KEY (catalog_id) REFERENCES xml_catalog (catalog_id)
);

/*
 * Indexes of <docid,doctype>, lower-cased user_owner, and rootnodeid
 * in xml_documents
 */
CREATE INDEX xml_documents_idx1 ON xml_documents (docid, doctype);
CREATE INDEX xml_documents_idx2 ON xml_documents (lower(user_owner));
CREATE INDEX xml_documents_idx3 ON xml_documents (rootnodeid);
172

    
173
/*
 * Revised Documents -- table to store XML documents saved after an UPDATE
 *                    or DELETE
 */
CREATE SEQUENCE xml_revisions_id_seq;
CREATE TABLE xml_revisions (
  revisionid      INT8 DEFAULT nextval('xml_revisions_id_seq'),
                                -- unique id of the saved revision row (pk)
  docid           VARCHAR(250), -- the document id #
  rootnodeid      INT8,         -- reference to root node of the DOM
  docname         VARCHAR(100), -- usually the root element name
  doctype         VARCHAR(100), -- public id indicating document type
  user_owner      VARCHAR(100),
  user_updated    VARCHAR(100),
  server_location INT8,
  rev             INT8,         -- no default here, unlike xml_documents.rev
  date_created    DATE,
  date_updated    DATE,
  public_access   INT8,         -- flag for public access
  catalog_id      INT8,         -- reference to xml_catalog
  CONSTRAINT xml_revisions_pk PRIMARY KEY (revisionid),
  CONSTRAINT xml_revisions_rep_fk
    FOREIGN KEY (server_location) REFERENCES xml_replication (serverid),
  -- The root node lives in the revisions node table, not in xml_nodes.
  CONSTRAINT xml_revisions_root_fk
    FOREIGN KEY (rootnodeid) REFERENCES xml_nodes_revisions (nodeid),
  CONSTRAINT xml_revisions_catalog_fk
    FOREIGN KEY (catalog_id) REFERENCES xml_catalog (catalog_id)
);

CREATE INDEX xml_revisions_idx1 ON xml_revisions (docid);
203

    
204
/*
 * ACL -- table to store ACL for XML documents by principals
 */
CREATE TABLE xml_access (
  docid          VARCHAR(250), -- the document id #
  accessfileid   VARCHAR(250), -- the document id # for the access file
  principal_name VARCHAR(100), -- name of user, group, etc.
  permission     INT8,         -- "read", "write", "all"
  perm_type      VARCHAR(32),  -- "allowed" or "denied"
  perm_order     VARCHAR(32),  -- "allow first" or "deny first"
  begin_time     DATE,         -- the time that permission begins
  end_time       DATE,         -- the time that permission ends
  ticket_count   INT8,         -- ticket counter for that permission
  subtreeid      VARCHAR(32),
  startnodeid    INT8,
  endnodeid      INT8,
  -- A CHECK passes when its condition is NULL, so rows with a NULL
  -- begin_time or end_time are accepted.
  CONSTRAINT xml_access_ck CHECK (begin_time < end_time),
  -- Only accessfileid is constrained; docid carries no foreign key here.
  CONSTRAINT xml_access_accessfileid_fk
    FOREIGN KEY (accessfileid) REFERENCES xml_documents (docid)
);
CREATE INDEX xml_access_idx1 ON xml_access (lower(principal_name));
CREATE INDEX xml_access_idx2 ON xml_access (permission);
CREATE INDEX xml_access_idx3 ON xml_access (perm_type);
CREATE INDEX xml_access_idx4 ON xml_access (perm_order);
CREATE INDEX xml_access_idx5 ON xml_access (subtreeid);
229

    
230
/*
 * Index of Nodes -- table to store precomputed paths through tree for
 * quick searching in structured searches
 */
CREATE TABLE xml_index (
  nodeid       INT8,         -- the unique node id
  path         TEXT,         -- precomputed path through tree
  docid        VARCHAR(250), -- index to the document id
  doctype      VARCHAR(100), -- public id indicating document type
  parentnodeid INT8,         -- id of the parent of the node represented
                             -- by this row
  -- Composite key: the same node may appear once per distinct path.
  CONSTRAINT xml_index_pk PRIMARY KEY (nodeid, path),
  CONSTRAINT xml_index_nodeid_fk
    FOREIGN KEY (nodeid) REFERENCES xml_nodes (nodeid),
  CONSTRAINT xml_index_docid_fk
    FOREIGN KEY (docid) REFERENCES xml_documents (docid)
);

/*
 * Indexes of path, docid, and nodeid in xml_index
 */
CREATE INDEX xml_index_idx1 ON xml_index (path);
CREATE INDEX xml_index_idx2 ON xml_index (docid);
-- NOTE(review): the primary key index already leads with nodeid, so this
-- index may be redundant -- confirm before dropping it.
CREATE INDEX xml_index_idx3 ON xml_index (nodeid);
253

    
254
/*
 * Relations -- table to store subject/relationship/object triples,
 * each tied to the package document it came from
 */
CREATE SEQUENCE xml_relation_id_seq;
CREATE TABLE xml_relation (
  relationid   INT8 DEFAULT nextval('xml_relation_id_seq') PRIMARY KEY,
                                      -- unique id
  docid        VARCHAR(250),          -- the docid of the package file
                                      -- that this relation came from
  packagetype  VARCHAR(250),          -- the type of the package
  subject      VARCHAR(512) NOT NULL, -- the subject of the relation
  subdoctype   VARCHAR(128),          -- the doctype of the subject
  relationship VARCHAR(128) NOT NULL, -- the relationship type
  object       VARCHAR(512) NOT NULL, -- the object of the relation
  objdoctype   VARCHAR(128),          -- the doctype of the object
  CONSTRAINT xml_relation_uk UNIQUE (docid, subject, relationship, object),
  CONSTRAINT xml_relation_docid_fk
    FOREIGN KEY (docid) REFERENCES xml_documents (docid)
);
270

    
271
/*
 * Table used to store all document identifiers in metacat.  Each identifier
 * has a globally unique, unconstrained string, which we will refer to as a
 * GUID, and a local metacat identifier, which consists of the docid
 * and revision fields. Each row maps one global identifier to the local
 * identifier (docid) used within metacat.
 */
CREATE TABLE identifier (
  guid  TEXT,         -- the globally unique string identifier
  docid VARCHAR(250), -- the local document id #
  rev   INT8,         -- the revision part of the local identifier
  CONSTRAINT identifier_pk PRIMARY KEY (guid)
);
284

    
285
/*
 * Table used to store all document identifiers for system metadata objects,
 * with constraints similar to those of the identifier table.  The identifier
 * table cannot be used for this purpose because then you have to worry about
 * whether you insert the data first or the systemMetadata first.
 *
 * The table and constraint names are unquoted, so PostgreSQL folds them to
 * lower case (systemmetadata, systemmetadata_pk).
 */
CREATE TABLE systemMetadata (
  guid                    TEXT,         -- the globally unique string identifier of the object
                                        -- that the system metadata describes
  docid                   VARCHAR(250), -- the local document id #
  rev                     INT8,         -- the revision part of the local identifier
  date_uploaded           TIMESTAMP,    -- the date/time the document was first submitted
  rights_holder           VARCHAR(250), -- the user who has rights to the document,
                                        -- usually the first person to upload it
  checksum                VARCHAR(512), -- the checksum of the doc using the given algorithm (see below)
  checksum_algorithm      VARCHAR(250), -- the algorithm used to calculate the checksum
  origin_member_node      VARCHAR(250), -- the member node where the document was first uploaded
  authoritive_member_node VARCHAR(250), -- the member node that currently controls the document
  date_modified           TIMESTAMP,    -- the last date/time that the file was changed
  submitter               VARCHAR(256), -- the user who originally submitted the doc
  object_format           VARCHAR(256), -- the format of the object
  size                    VARCHAR(256), -- the size of the object (stored as text, not a number)
  CONSTRAINT systemMetadata_pk PRIMARY KEY (guid)
);
307

    
308
/*
 * accesssubtree -- table to store access subtree info
 * (no primary key is declared on this table)
 */
CREATE TABLE xml_accesssubtree (
  docid        VARCHAR(250),   -- the document id #
  rev          INT8 DEFAULT 1, -- the revision number of the document
  controllevel VARCHAR(50),    -- the level it controls -- document or subtree
  subtreeid    VARCHAR(250),   -- the subtree id
  startnodeid  INT8,           -- the start node id of access subtree
  endnodeid    INT8,           -- the end node id of access subtree
  CONSTRAINT xml_accesssubtree_docid_fk
    FOREIGN KEY (docid) REFERENCES xml_documents (docid)
);
321

    
322
/*
 * Returnfields -- table to store combinations of returnfields requested
 *                 and the number of times each combination was requested
 */
CREATE SEQUENCE xml_returnfield_id_seq;
CREATE TABLE xml_returnfield (
  returnfield_id     INT8 DEFAULT nextval('xml_returnfield_id_seq'),
                                    -- the id for this returnfield entry
  returnfield_string VARCHAR(2000), -- the returnfield string
  usage_count        INT8,          -- the number of times this string has been requested
  CONSTRAINT xml_returnfield_pk PRIMARY KEY (returnfield_id)
);
CREATE INDEX xml_returnfield_idx1 ON xml_returnfield(returnfield_string);
334

    
335
/*
 * Queryresults -- table to store queryresults for a given docid
 * and returnfield_id
 */
CREATE SEQUENCE xml_queryresult_id_seq;
CREATE TABLE xml_queryresult (
  queryresult_id     INT8 DEFAULT nextval('xml_queryresult_id_seq'),
                                   -- id for this entry
  returnfield_id     INT8,         -- id for the returnfield corresponding to this entry
  docid              VARCHAR(250), -- docid of the document
  queryresult_string TEXT,         -- resultant text generated for this docid and given
                                   -- returnfield
  CONSTRAINT xml_queryresult_pk PRIMARY KEY (queryresult_id),
  CONSTRAINT xml_queryresult_searchid_fk
    FOREIGN KEY (returnfield_id) REFERENCES xml_returnfield (returnfield_id)
);

CREATE INDEX xml_queryresult_idx1 ON xml_queryresult (returnfield_id, docid);
352

    
353
/*
 * Logging -- table to store metadata and data access log
 */
CREATE SEQUENCE access_log_id_seq;
CREATE TABLE access_log (
  entryid     INT8 DEFAULT nextval('access_log_id_seq'), -- the identifier for the log event
  ip_address  VARCHAR(512), -- the ip address initiating the event
  principal   VARCHAR(512), -- the user initiating the event
  docid       VARCHAR(250), -- the document id # (no foreign key is declared on it)
  event       VARCHAR(512), -- the code symbolizing the event type
  date_logged TIMESTAMP,    -- the datetime on which the event occurred
  CONSTRAINT access_log_pk PRIMARY KEY (entryid)
);
366

    
367

    
368
/*
 * Table for indexing the paths specified by the administrator in
 * metacat.properties
 */

CREATE SEQUENCE xml_path_index_id_seq;
CREATE TABLE xml_path_index (
  nodeid            INT8 DEFAULT nextval('xml_path_index_id_seq'),
                                   -- row id (pk); generated from this table's own
                                   -- sequence and carries no foreign key to xml_nodes
  docid             VARCHAR(250),  -- the document id
  path              VARCHAR(1000), -- precomputed path through tree
  nodedata          TEXT,          -- the data for this node (e.g.,
                                   -- for TEXT it is the content)
  nodedatanumerical FLOAT8,        -- the data for this node
                                   -- if it is a number
  parentnodeid      INT8,          -- id of the parent of the node represented
                                   -- by this row
  CONSTRAINT xml_path_index_pk PRIMARY KEY (nodeid),
  CONSTRAINT xml_path_index_docid_fk
    FOREIGN KEY (docid) REFERENCES xml_documents (docid)
);

/*
 * Indexes of path, nodedata and nodedatanumerical in xml_path_index
 */
CREATE INDEX xml_path_index_idx1 ON xml_path_index (path);
-- NOTE(review): idx2 and idx4 are B-tree indexes over an unbounded TEXT
-- column; PostgreSQL limits the size of a B-tree index entry, so very long
-- nodedata values may be rejected on insert -- confirm against real data.
CREATE INDEX xml_path_index_idx2 ON xml_path_index (nodedata);
CREATE INDEX xml_path_index_idx3 ON xml_path_index (nodedatanumerical);
CREATE INDEX xml_path_index_idx4 ON xml_path_index (upper(nodedata));
395

    
396
/*
 * harvest_site_schedule -- table to store harvest sites and schedule info
 */
CREATE TABLE harvest_site_schedule (
  site_schedule_id INT8,         -- unique id (pk); no sequence default, so
                                 -- the writer must supply the value
  documentlisturl  VARCHAR(255), -- URL of the site harvest document list
  ldapdn           VARCHAR(255), -- LDAP distinguished name for site account
  datenextharvest  DATE,         -- scheduled date of next harvest
  datelastharvest  DATE,         -- recorded date of last harvest
  updatefrequency  INT8,         -- the harvest update frequency
  unit             VARCHAR(50),  -- update unit -- days, weeks or months
  contact_email    VARCHAR(50),  -- email address of the site contact person
  ldappwd          VARCHAR(20),  -- LDAP password for site account
  CONSTRAINT harvest_site_schedule_pk PRIMARY KEY (site_schedule_id)
);
411

    
412
/*
 * harvest_log -- table to log entries for harvest operations
 */
CREATE TABLE harvest_log (
  harvest_log_id         INT8,          -- unique id (pk); no sequence default
  harvest_date           DATE,          -- date of the current harvest
  status                 INT8,          -- non-zero indicates an error status
  message                VARCHAR(1000), -- text message for this log entry
  harvest_operation_code VARCHAR(30),   -- the type of harvest operation
  site_schedule_id       INT8,          -- site schedule id, or 0 if no site
                                        -- (no foreign key is declared on it)
  CONSTRAINT harvest_log_pk PRIMARY KEY (harvest_log_id)
);
424

    
425
/*
 * harvest_detail_log -- table to log detailed info about documents that
 *                       generated errors during the harvest
 */
CREATE TABLE harvest_detail_log (
  detail_log_id  INT8,          -- unique id (pk); no sequence default
  harvest_log_id INT8,          -- pointer to the related log entry
  scope          VARCHAR(50),   -- document scope
  identifier     INT8,          -- document identifier
  revision       INT8,          -- document revision
  document_url   VARCHAR(255),  -- document URL
  error_message  VARCHAR(1000), -- text error message
  document_type  VARCHAR(100),  -- document type
  CONSTRAINT harvest_detail_log_pk PRIMARY KEY (detail_log_id),
  CONSTRAINT harvest_detail_log_fk
    FOREIGN KEY (harvest_log_id) REFERENCES harvest_log (harvest_log_id)
);
442

    
443
/*
 * db_version -- table to store the version history of this database
 */
CREATE SEQUENCE db_version_id_seq;
CREATE TABLE db_version (
  db_version_id INT8 DEFAULT nextval('db_version_id_seq'), -- the identifier for the version
  version       VARCHAR(250), -- the version number
  status        INT8,         -- status of the version
  date_created  TIMESTAMP,    -- the datetime on which the version was created
  CONSTRAINT db_version_pk PRIMARY KEY (db_version_id)
);
454

    
455
/*
 * scheduled_job -- table to store scheduled jobs
 * Every column except end_time is NOT NULL; job names must be unique.
 */
CREATE SEQUENCE scheduled_job_id_seq;
CREATE TABLE scheduled_job (
  id             INT8 NOT NULL DEFAULT nextval('scheduled_job_id_seq'),
  date_created   TIMESTAMP NOT NULL,
  date_updated   TIMESTAMP NOT NULL,
  status         VARCHAR(64) NOT NULL,
  name           VARCHAR(512) NOT NULL,
  trigger_name   VARCHAR(512) NOT NULL,
  group_name     VARCHAR(512) NOT NULL,
  class_name     VARCHAR(1024) NOT NULL,
  start_time     TIMESTAMP NOT NULL,
  end_time       TIMESTAMP,            -- the only nullable column
  interval_value INT NOT NULL,
  interval_unit  VARCHAR(8) NOT NULL,
  CONSTRAINT scheduled_job_pk PRIMARY KEY (id),
  CONSTRAINT scheduled_job_uk UNIQUE (name)
);
475

    
476
/*
 * scheduled_job_params -- table to store key/value parameters of
 *                         scheduled jobs
 */
CREATE SEQUENCE scheduled_job_params_id_seq;
CREATE TABLE scheduled_job_params (
  id           INT8 NOT NULL DEFAULT nextval('scheduled_job_params_id_seq'),
  date_created TIMESTAMP NOT NULL,
  date_updated TIMESTAMP NOT NULL,
  status       VARCHAR(64) NOT NULL,
  job_id       INT8 NOT NULL,          -- the scheduled_job row this parameter belongs to
  key          VARCHAR(64) NOT NULL,
  value        VARCHAR(1024) NOT NULL,
  CONSTRAINT scheduled_job_params_pk PRIMARY KEY (id),
  CONSTRAINT scheduled_job_params_fk
    FOREIGN KEY (job_id) REFERENCES scheduled_job(id)
);
(49-49/50)