/*
 * Database upgrade script to version 2.0.0 (PostgreSQL syntax).
 *
 * In order, this script:
 *   1. creates the systemMetadata tables,
 *   2. replaces the old identifier table with a guid-keyed one,
 *   3. adds the nodedatadate and user_agent columns,
 *   4. registers the eml-2.1.1 schema in xml_catalog,
 *   5. generates guids for every docid.rev and migrates xml_access to use them,
 *   6. widens xml_path_index.path,
 *   7. registers the 2.0.0beta4 DTDs,
 *   8. records the new version in db_version.
 *
 * Statement order matters: later steps read data written by earlier ones.
 * Every "--" comment must stay on its own line or at the END of a line,
 * because a "--" comment extends to the end of the physical line.
 */

/*
 * System metadata, one row per described object
 */
CREATE TABLE systemMetadata (
    guid text,                            -- the globally unique string identifier of the object that the system metadata describes
    serial_version VARCHAR(256),          -- the serial version of the object
    date_uploaded TIMESTAMP,              -- the date/time the document was first submitted
    rights_holder VARCHAR(250),           -- the user who has rights to the document, usually the first person to upload it
    checksum VARCHAR(512),                -- the checksum of the doc using the given algorithm (see below)
    checksum_algorithm VARCHAR(250),      -- the algorithm used to calculate the checksum
    origin_member_node VARCHAR(250),      -- the member node where the document was first uploaded
    authoritive_member_node VARCHAR(250), -- the member node that currently controls the document
    date_modified TIMESTAMP,              -- the last date/time that the file was changed
    submitter VARCHAR(256),               -- the user who originally submitted the doc
    object_format VARCHAR(256),           -- the format of the object
    size VARCHAR(256),                    -- the size of the object
    archived boolean,                     -- specifies whether this is an archived object
    replication_allowed boolean,          -- replication allowed
    number_replicas INT8,                 -- the number of replicas allowed
    obsoletes text,                       -- the identifier that this record obsoletes
    obsoleted_by text,                    -- the identifier of the record that replaces this record
    CONSTRAINT systemMetadata_pk PRIMARY KEY (guid)
);

/*
 * Replication policy entries for a system metadata record.
 * The foreign key names no target column, so it references the
 * primary key of systemMetadata (guid).
 */
CREATE TABLE systemMetadataReplicationPolicy (
    guid text,                -- the globally unique string identifier of the object that the system metadata describes
    member_node VARCHAR(250), -- replication member node
    policy text,              -- the policy (preferred, blocked, etc...TBD)
    CONSTRAINT systemMetadataReplicationPolicy_fk
        FOREIGN KEY (guid) REFERENCES systemMetadata DEFERRABLE
);

/*
 * Replication status entries for a system metadata record.
 * The foreign key names no target column, so it references the
 * primary key of systemMetadata (guid).
 */
CREATE TABLE systemMetadataReplicationStatus (
    guid text,                -- the globally unique string identifier of the object that the system metadata describes
    member_node VARCHAR(250), -- replication member node
    status VARCHAR(250),      -- replication status
    date_verified TIMESTAMP,  -- the date replication was verified
    CONSTRAINT systemMetadataReplicationStatus_fk
        FOREIGN KEY (guid) REFERENCES systemMetadata DEFERRABLE
);

/*
 * Remove the old Identifier table (pre-2.0)
 */
DROP TABLE IF EXISTS identifier;

/*
 * Create the new one (DataONE features)
 */
CREATE TABLE identifier (
    guid text,          -- the globally unique string identifier
    docid VARCHAR(250), -- the local document id #
    rev INT8,           -- the revision part of the local identifier
    CONSTRAINT identifier_pk PRIMARY KEY (guid)
);

/*
 * add the nodedatadate column to the tables that need it
 */
ALTER TABLE xml_nodes ADD COLUMN nodedatadate TIMESTAMP;
ALTER TABLE xml_nodes_revisions ADD COLUMN nodedatadate TIMESTAMP;
ALTER TABLE xml_path_index ADD COLUMN nodedatadate TIMESTAMP;
CREATE INDEX xml_path_index_idx5 ON xml_path_index (nodedatadate);

/**
 * track the user-agent for the request
 */
ALTER TABLE access_log ADD COLUMN user_agent VARCHAR(512);

/*
 * Register the new schema
 */
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('Schema', 'eml://ecoinformatics.org/eml-2.1.1', '/schema/eml-2.1.1/eml.xsd');

/**
 * Generate GUIDs for docid.rev
 * UNION (not UNION ALL) is deliberate: it removes duplicate
 * (docid, rev, guid) rows, and guid is the primary key of identifier.
 */
INSERT INTO identifier (docid, rev, guid)
SELECT docid, rev, docid || '.' || rev
FROM xml_documents
UNION
SELECT docid, rev, docid || '.' || rev
FROM xml_revisions;
-- recorded output: INSERT 0 156644

/**
 * Add guid in xml_access table
 */
ALTER TABLE xml_access ADD COLUMN guid text;

/**
 * Expand accessfileid in xml_access table to hold guids
 */
ALTER TABLE xml_access ALTER COLUMN accessfileid TYPE text;

/**
 * Upgrade xml_access records to use GUID from identifier table
 * NOTE: This duplicates existing access rules for every revision of a document
 */
INSERT INTO xml_access (
    guid,
    principal_name,
    permission,
    perm_type,
    perm_order,
    docid,
    accessfileid,
    begin_time,
    end_time,
    ticket_count,
    subtreeid,
    startnodeid,
    endnodeid
)
SELECT
    id.guid,
    xa.principal_name,
    xa.permission,
    xa.perm_type,
    xa.perm_order,
    xa.docid,
    xa.accessfileid,
    xa.begin_time,
    xa.end_time,
    xa.ticket_count,
    xa.subtreeid,
    xa.startnodeid,
    xa.endnodeid
FROM identifier id
INNER JOIN xml_access xa
    ON id.docid = xa.docid;
-- recorded output: INSERT 0 311224

/**
 * Include inline data access rows -- they have a special guid: 'scope.docid.rev.index'
 * The existing docid value is copied into guid unchanged.
 * NOTE(review): the pattern matches ANY docid containing at least three dots,
 * including rows written by the previous INSERT if their docid has that
 * shape -- confirm no regular docid looks like this before running.
 */
INSERT INTO xml_access (
    guid,
    principal_name,
    permission,
    perm_type,
    perm_order,
    docid,
    accessfileid,
    begin_time,
    end_time,
    ticket_count,
    subtreeid,
    startnodeid,
    endnodeid
)
SELECT
    docid,
    principal_name,
    permission,
    perm_type,
    perm_order,
    docid,
    accessfileid,
    begin_time,
    end_time,
    ticket_count,
    subtreeid,
    startnodeid,
    endnodeid
FROM xml_access
WHERE docid LIKE '%.%.%.%';
-- recorded output: INSERT 0 18

/**
 * Update the accessfileid to use their guid
 * NOTE: uses the last revision's guid as the new value for accessfileid
 * uses a temporary table
 **/
CREATE TABLE max_identifier (guid text, docid VARCHAR(250), rev INT8);

/** insert the max rev identifier for each document **/
INSERT INTO max_identifier (docid, rev, guid)
SELECT docid, MAX(rev), docid || '.' || MAX(rev)
FROM identifier
GROUP BY docid;
-- recorded output: INSERT 0 57841

/** create some indexes to speed up the join **/
CREATE INDEX maxid_docid_index ON max_identifier (docid);
CREATE INDEX maxid_guid_index ON max_identifier (guid);
CREATE INDEX accessfileid_index ON xml_access (accessfileid);
CREATE INDEX xml_access_guid_index ON xml_access (guid);

-- Only rows that already carry a guid (the rows inserted above) are
-- rewritten; the original guid-less rows are deleted further down.
UPDATE xml_access xa
SET accessfileid = maxid.guid
FROM max_identifier maxid
WHERE xa.accessfileid = maxid.docid
    AND xa.guid IS NOT NULL;
-- recorded output: UPDATE 310427

-- The helper indexes and the helper table exist only for the UPDATE above.
DROP INDEX maxid_docid_index;
DROP INDEX maxid_guid_index;
DROP INDEX accessfileid_index;
DROP INDEX xml_access_guid_index;
DROP TABLE max_identifier;

/**
 * Remove old access rules
 * (rows that never received a guid, i.e. the pre-upgrade originals)
 */
DELETE FROM xml_access WHERE guid IS NULL;
-- recorded output: DELETE 105432

/**
 * clean up the xml_access table
 */
ALTER TABLE xml_access DROP COLUMN docid;

/**
 * expand xml_path_index 'path' column to hold larger strings
 */
ALTER TABLE xml_path_index ALTER COLUMN path TYPE text;

/**
 * include 2.0.0beta4 DTD
 */
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-access-2.0.0beta4//EN', '/dtd/eml-access-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-attribute-2.0.0beta4//EN', '/dtd/eml-attribute-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-constraint-2.0.0beta4//EN', '/dtd/eml-constraint-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-coverage-2.0.0beta4//EN', '/dtd/eml-coverage-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-dataset-2.0.0beta4//EN', '/dtd/eml-dataset-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-entity-2.0.0beta4//EN', '/dtd/eml-entity-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-literature-2.0.0beta4//EN', '/dtd/eml-literature-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-physical-2.0.0beta4//EN', '/dtd/eml-physical-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-project-2.0.0beta4//EN', '/dtd/eml-project-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-protocol-2.0.0beta4//EN', '/dtd/eml-protocol-2.0.0beta4.dtd');
INSERT INTO xml_catalog (entry_type, public_id, system_id)
VALUES ('DTD', '-//ecoinformatics.org//eml-software-2.0.0beta4//EN', '/dtd/eml-software-2.0.0beta4.dtd');

/*
 * update the database version
 * The UPDATE intentionally has no WHERE clause: every existing db_version
 * row gets status 0 before the 2.0.0 row is inserted with status 1
 * (presumably 1 marks the current version -- confirm against the reader
 * of db_version).
 */
UPDATE db_version SET status=0;
INSERT INTO db_version (version, status, date_created)
VALUES ('2.0.0', 1, CURRENT_DATE);