Thread: [Gmod-schema-cmts] SF.net SVN: gmod:[25108] schema/trunk/chado (Page 2)

SourceForge Headquarters 225 Broadway Suite 1600 San Diego, CA 92101 +1 (858) 454-5900

Revision: 25108
          http://gmod.svn.sourceforge.net/gmod/?rev=25108&view=rev
Author:   scottcain
Date:     2011-08-03 16:48:48 +0000 (Wed, 03 Aug 2011)

Log Message:
-----------
updating schema for a minor omission, updating the schema diffs

Modified Paths:
--------------
    schema/trunk/chado/Makefile.PL
    schema/trunk/chado/lib/Bio/Chado/Builder.pm
    schema/trunk/chado/modules/default_nofuncs.sql
    schema/trunk/chado/modules/default_schema.sql
    schema/trunk/chado/modules/stock/stock.sql

Added Paths:
-----------
    schema/trunk/chado/schemas/1.2/
    schema/trunk/chado/schemas/1.2/default_schema.sql
    schema/trunk/chado/schemas/1.2-1.0/
    schema/trunk/chado/schemas/1.2-1.1/
    schema/trunk/chado/schemas/1.2-1.11/
    schema/trunk/chado/schemas/1.2-1.11/diff
    schema/trunk/chado/schemas/1.2-1.11/diff.sql

Modified: schema/trunk/chado/Makefile.PL
===================================================================

--- schema/trunk/chado/Makefile.PL	2011-08-03 16:32:25 UTC (rev 25107)
+++ schema/trunk/chado/Makefile.PL	2011-08-03 16:48:48 UTC (rev 25108)
@@ -46,6 +46,8 @@
 use Template;
 use Module::Build;
 
+my $VERSION = 1.2;
+
 my %args    =  (
   DBDRIVER  => {
     default => 'PostgreSQL'
@@ -385,6 +387,7 @@
   "  LOCAL_TMP=$LOCAL_TMP",
   "  DBORGANISM=$DBORGANISM",
   "  DEFAULT=$DEFAULT",
+  "  VERSION=$VERSION",
 ),"\n\n";
 
 #
@@ -402,6 +405,7 @@
   $conf{'PREFIX'}   = $opts{'PREFIX'};
   $conf{'LIB'}      = $opts{'LIB'};
   $conf{'DEFAULT'}  = $DEFAULT;
+  $conf{'VERSION'}  = $VERSION;
 
   print CONF map { "$_=$conf{ $_ }\n" } keys %conf;
   close CONF or die "Can't write file '$build_config': $!\n";
@@ -502,7 +506,7 @@
 #      'INSTALLSITELIB' => '$(INSTALLSITEARCH)',
     'NAME'		            => 'chado',
 #    'NAME'                => 'gmod',
-    'VERSION'             => '1.2',
+    'VERSION'             => $VERSION,
     'PREREQ_PM'		        => { 
       #'SQL::Translator'   => 0.05,
       #'Class::DBI'        => 0.94,

Modified: schema/trunk/chado/lib/Bio/Chado/Builder.pm
===================================================================
--- schema/trunk/chado/lib/Bio/Chado/Builder.pm	2011-08-03 16:32:25 UTC (rev 25107)
+++ schema/trunk/chado/lib/Bio/Chado/Builder.pm	2011-08-03 16:48:48 UTC (rev 25108)
@@ -74,6 +74,7 @@
   my $db_port   = $conf->{'database'}{'db_port'}  || '';
   my $db_user   = $conf->{'database'}{'db_username'}  || '';
   my $build_dir = $conf->{'build'}{'working_dir'} || '';
+  my $schema_version = $conf->{'build'}{'version'};
   my $init_sql  = catfile( $build_dir, 'load', 'etc', 'initialize.sql' );
   my $sys_call  = "psql -h $db_host -p $db_port -U $db_user -f $init_sql $db_name";
 

Modified: schema/trunk/chado/modules/default_nofuncs.sql
===================================================================
--- schema/trunk/chado/modules/default_nofuncs.sql	2011-08-03 16:32:25 UTC (rev 25107)
+++ schema/trunk/chado/modules/default_nofuncs.sql	2011-08-03 16:48:48 UTC (rev 25108)
@@ -3314,7 +3314,7 @@
 	stock_relationship_cvterm_id SERIAL NOT NULL,
 	PRIMARY KEY (stock_relationship_cvterm_id),
-	stock_relatiohship_id integer NOT NULL,
-	--FOREIGN KEY (stock_relationship_id) references stock_relationship (stock_relationship_id) ON DELETE CASCADE INITIALLY DEFERRED,
+	stock_relationship_id integer NOT NULL, -- spelling must match the column named in the FOREIGN KEY on the next line
+	FOREIGN KEY (stock_relationship_id) references stock_relationship (stock_relationship_id) ON DELETE CASCADE INITIALLY DEFERRED,
 	cvterm_id integer NOT NULL,
 	FOREIGN KEY (cvterm_id) REFERENCES cvterm (cvterm_id) ON DELETE RESTRICT,
 	pub_id integer,

Modified: schema/trunk/chado/modules/default_schema.sql
===================================================================
--- schema/trunk/chado/modules/default_schema.sql	2011-08-03 16:32:25 UTC (rev 25107)
+++ schema/trunk/chado/modules/default_schema.sql	2011-08-03 16:48:48 UTC (rev 25108)
@@ -40403,7 +40403,7 @@
 	stock_relationship_cvterm_id SERIAL NOT NULL,
 	PRIMARY KEY (stock_relationship_cvterm_id),
-	stock_relatiohship_id integer NOT NULL,
-	--FOREIGN KEY (stock_relationship_id) references stock_relationship (stock_relationship_id) ON DELETE CASCADE INITIALLY DEFERRED,
+	stock_relationship_id integer NOT NULL, -- spelling must match the column named in the FOREIGN KEY on the next line
+	FOREIGN KEY (stock_relationship_id) references stock_relationship (stock_relationship_id) ON DELETE CASCADE INITIALLY DEFERRED,
 	cvterm_id integer NOT NULL,
 	FOREIGN KEY (cvterm_id) REFERENCES cvterm (cvterm_id) ON DELETE RESTRICT,
 	pub_id integer,

Modified: schema/trunk/chado/modules/stock/stock.sql
===================================================================
--- schema/trunk/chado/modules/stock/stock.sql	2011-08-03 16:32:25 UTC (rev 25107)
+++ schema/trunk/chado/modules/stock/stock.sql	2011-08-03 16:48:48 UTC (rev 25108)
@@ -145,7 +145,7 @@
 	stock_relationship_cvterm_id SERIAL NOT NULL,
 	PRIMARY KEY (stock_relationship_cvterm_id),
-	stock_relatiohship_id integer NOT NULL,
-	--FOREIGN KEY (stock_relationship_id) references stock_relationship (stock_relationship_id) ON DELETE CASCADE INITIALLY DEFERRED,
+	stock_relationship_id integer NOT NULL, -- spelling must match the column named in the FOREIGN KEY on the next line
+	FOREIGN KEY (stock_relationship_id) references stock_relationship (stock_relationship_id) ON DELETE CASCADE INITIALLY DEFERRED,
 	cvterm_id integer NOT NULL,
 	FOREIGN KEY (cvterm_id) REFERENCES cvterm (cvterm_id) ON DELETE RESTRICT,
 	pub_id integer,

Added: schema/trunk/chado/schemas/1.2/default_schema.sql
===================================================================
--- schema/trunk/chado/schemas/1.2/default_schema.sql	                        (rev 0)
+++ schema/trunk/chado/schemas/1.2/default_schema.sql	2011-08-03 16:48:48 UTC (rev 25108)
@@ -0,0 +1,41889 @@
+-- $Id: general.sql,v 1.31 2007-03-01 02:45:54 briano Exp $
+-- ==========================================
+-- Chado general module
+--
+-- ================================================
+-- TABLE: tableinfo
+-- ================================================
+
+create table tableinfo ( -- presumably one descriptive row per table or view, keyed by name - confirm
+    tableinfo_id serial not null,
+    primary key (tableinfo_id),
+    name varchar(30) not null,
+    primary_key_column varchar(30) null,
+    is_view int not null default 0, -- int flag; presumably 0=false/1=true - confirm
+    view_on_table_id int null, -- no FOREIGN KEY is declared for this id
+    superclass_table_id int null, -- no FOREIGN KEY is declared for this id
+    is_updateable int not null default 1, -- int flag, set to 1 unless stated otherwise
+    modification_date date not null default now(), -- date column, so only the day of now() is kept
+    constraint tableinfo_c1 unique (name) -- at most one row per name
+);
+
+COMMENT ON TABLE tableinfo IS NULL;
+
+-- ================================================
+-- TABLE: db
+-- ================================================
+
+create table db ( -- a database authority (e.g. FlyBase, GO), known by a short unique name
+    db_id serial not null,
+    primary key (db_id),
+    name varchar(255) not null,
+--    contact_id int,
+--    foreign key (contact_id) references contact (contact_id) on delete cascade INITIALLY DEFERRED,
+    description varchar(255) null,
+    urlprefix varchar(255) null,
+    url varchar(255) null,
+    constraint db_c1 unique (name) -- at most one row per authority name
+);
+
+COMMENT ON TABLE db IS 'A database authority. Typical databases in
+bioinformatics are FlyBase, GO, UniProt, NCBI, MGI, etc. The authority
+is generally known by this shortened form, which is unique within the
+bioinformatics and biomedical realm.  To Do - add support for URIs,
+URNs (e.g. LSIDs). We can do this by treating the URL as a URI -
+however, some applications may expect this to be resolvable - to be
+decided.';
+
+-- ================================================
+-- TABLE: dbxref
+-- ================================================
+
+create table dbxref ( -- an identifier written as <DB>:<ACCESSION> or <DB>:<ACCESSION>:<VERSION>
+    dbxref_id serial not null,
+    primary key (dbxref_id),
+    db_id int not null,
+    foreign key (db_id) references db (db_id) on delete cascade INITIALLY DEFERRED, -- deleting a db deletes its dbxrefs; the check runs at commit
+    accession varchar(255) not null,
+    version varchar(255) not null default '', -- empty string (never NULL) when no version is given, so dbxref_c1 still compares it
+    description text,
+    constraint dbxref_c1 unique (db_id,accession,version) -- the same accession may repeat within a db only under different versions
+);
+create index dbxref_idx1 on dbxref (db_id);
+create index dbxref_idx2 on dbxref (accession);
+create index dbxref_idx3 on dbxref (version);
+
+COMMENT ON TABLE dbxref IS 'A unique, global, public, stable identifier. Not necessarily an external reference - can reference data items inside the particular chado instance being used. Typically a row in a table can be uniquely identified with a primary identifier (called dbxref_id); a table may also have secondary identifiers (in a linking table <T>_dbxref). A dbxref is generally written as <DB>:<ACCESSION> or as <DB>:<ACCESSION>:<VERSION>.';
+
+COMMENT ON COLUMN dbxref.accession IS 'The local part of the identifier. Guaranteed by the db authority to be unique for that db.';
+
+CREATE VIEW db_dbxref_count AS -- one row per db.name with the number of dbxref rows that point at it
+  SELECT db.name,count(*) AS num_dbxrefs FROM db INNER JOIN dbxref USING (db_id) GROUP BY db.name; -- inner join: a db with no dbxrefs produces no row
+COMMENT ON VIEW db_dbxref_count IS 'per-db dbxref counts';
+
+CREATE OR REPLACE FUNCTION store_db (VARCHAR) -- arg: db name; looks the name up in db and inserts a new row when none is found
+  RETURNS INT AS -- db_id of the matching row, or currval of db_db_id_seq right after the insert
+'DECLARE
+   v_name             ALIAS FOR $1;
+
+   v_db_id            INTEGER;
+ BEGIN
+    SELECT INTO v_db_id db_id
+      FROM db
+      WHERE name=v_name;
+    IF NOT FOUND THEN
+      INSERT INTO db
+       (name)
+         VALUES
+       (v_name);
+       RETURN currval(''db_db_id_seq'');
+    END IF;
+    RETURN v_db_id;
+ END;
+' LANGUAGE 'plpgsql';
+  
+CREATE OR REPLACE FUNCTION store_dbxref (VARCHAR,VARCHAR) -- args: db name, accession; looks the pair up in dbxref and inserts a new row when none is found
+  RETURNS INT AS -- dbxref_id of the matching row, or currval of dbxref_dbxref_id_seq right after the insert
+'DECLARE
+   v_dbname                ALIAS FOR $1;
+   v_accession             ALIAS FOR $2; -- second argument (was $1, which stored the db name as the accession)
+
+   v_db_id                 INTEGER;
+   v_dbxref_id             INTEGER;
+ BEGIN
+    SELECT INTO v_db_id
+      store_db(v_dbname); -- resolves the db by name, inserting it when missing
+    SELECT INTO v_dbxref_id dbxref_id
+      FROM dbxref
+      WHERE db_id=v_db_id       AND
+            accession=v_accession; -- version is not part of the lookup
+    IF NOT FOUND THEN
+      INSERT INTO dbxref
+       (db_id,accession)
+         VALUES
+       (v_db_id,v_accession); -- version falls back to its column default
+       RETURN currval(''dbxref_dbxref_id_seq''); -- id generated by the insert above
+    END IF;
+    RETURN v_dbxref_id;
+ END;
+' LANGUAGE 'plpgsql';
+  
+-- $Id: cv.sql,v 1.37 2007-02-28 15:08:48 briano Exp $
+-- ==========================================
+-- Chado cv module
+--
+-- =================================================================
+-- Dependencies:
+--
+-- :import dbxref from general
+-- =================================================================
+
+-- ================================================
+-- TABLE: cv
+-- ================================================
+create table cv ( -- a controlled vocabulary or ontology; cvterm rows point back to it through cv_id
+    cv_id serial not null,
+    primary key (cv_id),
+    name varchar(255) not null,
+   definition text,
+   constraint cv_c1 unique (name) -- the name alone identifies a cv
+);
+
+COMMENT ON TABLE cv IS 'A controlled vocabulary or ontology. A cv is
+composed of cvterms (AKA terms, classes, types, universals - relations
+and properties are also stored in cvterm) and the relationships
+between them.';
+
+COMMENT ON COLUMN cv.name IS 'The name of the ontology. This
+corresponds to the obo-format -namespace-. cv names uniquely identify
+the cv. In OBO file format, the cv.name is known as the namespace.';
+
+COMMENT ON COLUMN cv.definition IS 'A text description of the criteria for
+membership of this ontology.';
+
+-- ================================================
+-- TABLE: cvterm
+-- ================================================
+create table cvterm ( -- a term (or relation/property) inside one cv, with a primary dbxref
+    cvterm_id serial not null,
+    primary key (cvterm_id),
+    cv_id int not null,
+    foreign key (cv_id) references cv (cv_id) on delete cascade INITIALLY DEFERRED, -- deleting a cv deletes its terms
+    name varchar(1024) not null,
+    definition text,
+    dbxref_id int not null, -- NOTE(review): NOT NULL here conflicts with "on delete set null" on the next line - confirm the intended delete behaviour
+    foreign key (dbxref_id) references dbxref (dbxref_id) on delete set null INITIALLY DEFERRED,
+    is_obsolete int not null default 0, -- int used as boolean: 0=false, 1=true
+    is_relationshiptype int not null default 0, -- int used as boolean: 0=false, 1=true
+    constraint cvterm_c1 unique (name,cv_id,is_obsolete), -- a name may appear once obsolete and once non-obsolete within a cv
+    constraint cvterm_c2 unique (dbxref_id) -- one cvterm per primary dbxref
+);
+create index cvterm_idx1 on cvterm (cv_id);
+create index cvterm_idx2 on cvterm (name);
+create index cvterm_idx3 on cvterm (dbxref_id);
+
+COMMENT ON TABLE cvterm IS 'A term, class, universal or type within an
+ontology or controlled vocabulary.  This table is also used for
+relations and properties. cvterms constitute nodes in the graph
+defined by the collection of cvterms and cvterm_relationships.';
+
+COMMENT ON COLUMN cvterm.cv_id IS 'The cv or ontology or namespace to which
+this cvterm belongs.';
+
+COMMENT ON COLUMN cvterm.name IS 'A concise human-readable name or
+label for the cvterm. Uniquely identifies a cvterm within a cv.';
+
+COMMENT ON COLUMN cvterm.definition IS 'A human-readable text
+definition.';
+
+COMMENT ON COLUMN cvterm.dbxref_id IS 'Primary identifier dbxref - The
+unique global OBO identifier for this cvterm.  Note that a cvterm may
+have multiple secondary dbxrefs - see also table: cvterm_dbxref.';
+
+COMMENT ON COLUMN cvterm.is_obsolete IS 'Boolean 0=false,1=true; see
+GO documentation for details of obsoletion. Note that two terms with
+different primary dbxrefs may exist if one is obsolete.';
+
+COMMENT ON COLUMN cvterm.is_relationshiptype IS 'Boolean
+0=false,1=true relations or relationship types (also known as Typedefs
+in OBO format, or as properties or slots) form a cv/ontology in
+themselves. We use this flag to indicate whether this cvterm is an
+actual term/class/universal or a relation. Relations may be drawn from
+the OBO Relations ontology, but are not exclusively drawn from there.';
+
+COMMENT ON INDEX cvterm_c1 IS 'A name can mean different things in
+different contexts; for example "chromosome" in SO and GO. A name
+should be unique within an ontology or cv. A name may exist twice in a
+cv, in both obsolete and non-obsolete forms - these will be for
+different cvterms with different OBO identifiers; so GO documentation
+for more details on obsoletion. Note that occasionally multiple
+obsolete terms with the same name will exist in the same cv. If this
+is a possibility for the ontology under consideration (e.g. GO) then the
+ID should be appended to the name to ensure uniqueness.';
+
+COMMENT ON INDEX cvterm_c2 IS 'The OBO identifier is globally unique.';
+
+-- ================================================
+-- TABLE: cvterm_relationship
+-- ================================================
+create table cvterm_relationship ( -- one typed edge between two cvterms: subject -type-> object
+    cvterm_relationship_id serial not null,
+    primary key (cvterm_relationship_id),
+    type_id int not null, -- the relation itself is a cvterm
+    foreign key (type_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    subject_id int not null, -- typically the child node
+    foreign key (subject_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    object_id int not null, -- typically the parent node
+    foreign key (object_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    constraint cvterm_relationship_c1 unique (subject_id,object_id,type_id) -- no duplicate edge of the same type
+);
+create index cvterm_relationship_idx1 on cvterm_relationship (type_id);
+create index cvterm_relationship_idx2 on cvterm_relationship (subject_id);
+create index cvterm_relationship_idx3 on cvterm_relationship (object_id);
+
+COMMENT ON TABLE cvterm_relationship IS 'A relationship linking two
+cvterms. Each cvterm_relationship constitutes an edge in the graph
+defined by the collection of cvterms and cvterm_relationships. The
+meaning of the cvterm_relationship depends on the definition of the
+cvterm R refered to by type_id. However, in general the definitions
+are such that the statement "all SUBJs REL some OBJ" is true. The
+cvterm_relationship statement is about the subject, not the
+object. For example "insect wing part_of thorax".';
+
+COMMENT ON COLUMN cvterm_relationship.subject_id IS 'The subject of
+the subj-predicate-obj sentence. The cvterm_relationship is about the
+subject. In a graph, this typically corresponds to the child node.';
+
+COMMENT ON COLUMN cvterm_relationship.object_id IS 'The object of the
+subj-predicate-obj sentence. The cvterm_relationship refers to the
+object. In a graph, this typically corresponds to the parent node.';
+
+COMMENT ON COLUMN cvterm_relationship.type_id IS 'The nature of the
+relationship between subject and object. Note that relations are also
+housed in the cvterm table, typically from the OBO relationship
+ontology, although other relationship types are allowed.';
+
+-- ================================================
+-- TABLE: cvtermpath
+-- ================================================
+create table cvtermpath ( -- stored closure rows over cvterm_relationship, one per (subject, object, type, distance)
+    cvtermpath_id serial not null,
+    primary key (cvtermpath_id),
+    type_id int, -- nullable: NULL means a closure over all relationship types
+    foreign key (type_id) references cvterm (cvterm_id) on delete set null INITIALLY DEFERRED,
+    subject_id int not null,
+    foreign key (subject_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    object_id int not null,
+    foreign key (object_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    cv_id int not null,
+    foreign key (cv_id) references cv (cv_id) on delete cascade INITIALLY DEFERRED,
+    pathdistance int, -- steps from subject to object, counted from zero
+    constraint cvtermpath_c1 unique (subject_id,object_id,type_id,pathdistance) -- cv_id is not part of the key
+);
+create index cvtermpath_idx1 on cvtermpath (type_id);
+create index cvtermpath_idx2 on cvtermpath (subject_id);
+create index cvtermpath_idx3 on cvtermpath (object_id);
+create index cvtermpath_idx4 on cvtermpath (cv_id);
+
+COMMENT ON TABLE cvtermpath IS 'The reflexive transitive closure of
+the cvterm_relationship relation.';
+
+COMMENT ON COLUMN cvtermpath.type_id IS 'The relationship type that
+this is a closure over. If null, then this is a closure over ALL
+relationship types. If non-null, then this references a relationship
+cvterm - note that the closure will apply to both this relationship
+AND the OBO_REL:is_a (subclass) relationship.';
+
+COMMENT ON COLUMN cvtermpath.cv_id IS 'Closures will mostly be within
+one cv. If the closure of a relationship traverses a cv, then this
+refers to the cv of the object_id cvterm.';
+
+COMMENT ON COLUMN cvtermpath.pathdistance IS 'The number of steps
+required to get from the subject cvterm to the object cvterm, counting
+from zero (reflexive relationship).';
+
+-- ================================================
+-- TABLE: cvtermsynonym
+-- ================================================
+create table cvtermsynonym ( -- alternative names for a cvterm, in addition to cvterm.name
+    cvtermsynonym_id serial not null,
+    primary key (cvtermsynonym_id),
+    cvterm_id int not null,
+    foreign key (cvterm_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    synonym varchar(1024) not null,
+    type_id int, -- optional kind of synonym, itself a cvterm
+    foreign key (type_id) references cvterm (cvterm_id) on delete cascade  INITIALLY DEFERRED, -- deleting the type term deletes the synonym rows that use it
+    constraint cvtermsynonym_c1 unique (cvterm_id,synonym) -- type_id is not part of the key
+);
+create index cvtermsynonym_idx1 on cvtermsynonym (cvterm_id);
+
+COMMENT ON TABLE cvtermsynonym IS 'A cvterm actually represents a
+distinct class or concept. A concept can be refered to by different
+phrases or names. In addition to the primary name (cvterm.name) there
+can be a number of alternative aliases or synonyms. For example, "T
+cell" as a synonym for "T lymphocyte".';
+
+COMMENT ON COLUMN cvtermsynonym.type_id IS 'A synonym can be exact,
+narrower, or broader than.';
+
+
+-- ================================================
+-- TABLE: cvterm_dbxref
+-- ================================================
+create table cvterm_dbxref ( -- links a cvterm to secondary dbxrefs, beyond its primary cvterm.dbxref_id
+    cvterm_dbxref_id serial not null,
+    primary key (cvterm_dbxref_id),
+    cvterm_id int not null,
+    foreign key (cvterm_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    dbxref_id int not null,
+    foreign key (dbxref_id) references dbxref (dbxref_id) on delete cascade INITIALLY DEFERRED,
+    is_for_definition int not null default 0, -- int flag; non-zero marks the dbxref as provenance for the definition
+    constraint cvterm_dbxref_c1 unique (cvterm_id,dbxref_id) -- a given dbxref is linked to a term at most once
+);
+create index cvterm_dbxref_idx1 on cvterm_dbxref (cvterm_id);
+create index cvterm_dbxref_idx2 on cvterm_dbxref (dbxref_id);
+
+COMMENT ON TABLE cvterm_dbxref IS 'In addition to the primary
+identifier (cvterm.dbxref_id) a cvterm can have zero or more secondary
+identifiers/dbxrefs, which may refer to records in external
+databases. The exact semantics of cvterm_dbxref are not fixed. For
+example: the dbxref could be a pubmed ID that is pertinent to the
+cvterm, or it could be an equivalent or similar term in another
+ontology. For example, GO cvterms are typically linked to InterPro
+IDs, even though the nature of the relationship between them is
+largely one of statistical association. The dbxref may be have data
+records attached in the same database instance, or it could be a
+"hanging" dbxref pointing to some external database. NOTE: If the
+desired objective is to link two cvterms together, and the nature of
+the relation is known and holds for all instances of the subject
+cvterm then consider instead using cvterm_relationship together with a
+well-defined relation.';
+
+COMMENT ON COLUMN cvterm_dbxref.is_for_definition IS 'A
+cvterm.definition should be supported by one or more references. If
+this column is true, the dbxref is not for a term in an external database -
+it is a dbxref for provenance information for the definition.';
+
+
+-- ================================================
+-- TABLE: cvtermprop
+-- ================================================
+create table cvtermprop ( -- typed property values attached to a cvterm
+    cvtermprop_id serial not null, 
+    primary key (cvtermprop_id), 
+    cvterm_id int not null, 
+    foreign key (cvterm_id) references cvterm (cvterm_id) on delete cascade, -- not declared INITIALLY DEFERRED, unlike the other cv-module tables
+    type_id int not null, 
+    foreign key (type_id) references cvterm (cvterm_id) on delete cascade, -- the property name is itself a cvterm
+    value text not null default '', 
+    rank int not null default 0,
+
+    unique(cvterm_id, type_id, value, rank) -- unnamed constraint; value is part of the key here
+);
+create index cvtermprop_idx1 on cvtermprop (cvterm_id);
+create index cvtermprop_idx2 on cvtermprop (type_id);
+
+COMMENT ON TABLE cvtermprop IS 'Additional extensible properties can be attached to a cvterm using this table. Corresponds to -AnnotationProperty- in W3C OWL format.';
+
+COMMENT ON COLUMN cvtermprop.type_id IS 'The name of the property or slot is a cvterm. The meaning of the property is defined in that cvterm.';
+
+COMMENT ON COLUMN cvtermprop.value IS 'The value of the property, represented as text. Numeric values are converted to their text representation.';
+
+COMMENT ON COLUMN cvtermprop.rank IS 'Property-Value ordering. Any
+cvterm can have multiple values for any particular property type -
+these are ordered in a list using rank, counting from zero. For
+properties that are single-valued rather than multi-valued, the
+default 0 value should be used.';
+
+
+-- ================================================
+-- TABLE: dbxrefprop
+-- ================================================
+create table dbxrefprop ( -- typed property values attached to a dbxref
+    dbxrefprop_id serial not null,
+    primary key (dbxrefprop_id),
+    dbxref_id int not null,
+    foreign key (dbxref_id) references dbxref (dbxref_id) INITIALLY DEFERRED, -- no ON DELETE action is declared
+    type_id int not null,
+    foreign key (type_id) references cvterm (cvterm_id) INITIALLY DEFERRED, -- no ON DELETE action is declared
+    value text not null default '',
+    rank int not null default 0,
+    constraint dbxrefprop_c1 unique (dbxref_id,type_id,rank) -- value is not part of the key
+);
+create index dbxrefprop_idx1 on dbxrefprop (dbxref_id);
+create index dbxrefprop_idx2 on dbxrefprop (type_id);
+
+COMMENT ON TABLE dbxrefprop IS 'Metadata about a dbxref. Note that this is not defined in the dbxref module, as it depends on the cvterm table. This table has a structure analagous to cvtermprop.';
+
+
+-- ================================================
+-- TABLE: cvprop
+-- ================================================
+create table cvprop ( -- typed property values attached to a cv, e.g. the cv version
+    cvprop_id serial not null,
+    primary key (cvprop_id),
+    cv_id int not null,
+    foreign key (cv_id) references cv (cv_id) INITIALLY DEFERRED, -- no ON DELETE action is declared
+    type_id int not null,
+    foreign key (type_id) references cvterm (cvterm_id) INITIALLY DEFERRED, -- no ON DELETE action is declared
+    value text, -- nullable, unlike cvtermprop.value and dbxrefprop.value
+    rank int not null default 0,
+    constraint cvprop_c1 unique (cv_id,type_id,rank) -- value is not part of the key
+);
+
+COMMENT ON TABLE cvprop IS 'Additional extensible properties can be attached to a cv using this table.  A notable example would be the cv version';
+
+COMMENT ON COLUMN cvprop.type_id IS 'The name of the property or slot is a cvterm. The meaning of the property is defined in that cvterm.';
+COMMENT ON COLUMN cvprop.value IS 'The value of the property, represented as text. Numeric values are converted to their text representation.';
+
+COMMENT ON COLUMN cvprop.rank IS 'Property-Value ordering. Any
+cv can have multiple values for any particular property type -
+these are ordered in a list using rank, counting from zero. For
+properties that are single-valued rather than multi-valued, the
+default 0 value should be used.';
+
+-- ================================================
+-- TABLE: chadoprop
+-- ================================================
+create table chadoprop ( -- properties of the database itself (e.g. schema version); there is no owner column
+    chadoprop_id serial not null,
+    primary key (chadoprop_id),
+    type_id int not null,
+    foreign key (type_id) references cvterm (cvterm_id) INITIALLY DEFERRED, -- no ON DELETE action is declared
+    value text,
+    rank int not null default 0,
+    constraint chadoprop_c1 unique (type_id,rank) -- one value per property type and rank
+);
+
+COMMENT ON TABLE chadoprop IS 'This table is different from other prop tables in the database, as it is for storing information about the database itself, like schema version';
+
+COMMENT ON COLUMN chadoprop.type_id IS 'The name of the property or slot is a cvterm. The meaning of the property is defined in that cvterm.';
+COMMENT ON COLUMN chadoprop.value IS 'The value of the property, represented as text. Numeric values are converted to their text representation.';
+
+COMMENT ON COLUMN chadoprop.rank IS 'Property-Value ordering. Any
+cv can have multiple values for any particular property type -
+these are ordered in a list using rank, counting from zero. For
+properties that are single-valued rather than multi-valued, the
+default 0 value should be used.';
+
+CREATE OR REPLACE VIEW cv_root AS -- non-obsolete cvterms that never appear as the subject of a cvterm_relationship
+ SELECT 
+  cv_id,
+  cvterm_id AS root_cvterm_id
+ FROM cvterm
+ WHERE 
+  cvterm_id NOT IN ( SELECT subject_id FROM cvterm_relationship)    AND
+  is_obsolete=0; -- obsolete terms are never reported as roots
+
+COMMENT ON VIEW cv_root IS 'the roots of a cv are the set of terms
+which have no parents (terms that are not the subject of a
+relation). Most cvs will have a single root, some may have >1. All
+will have at least 1';
+
+CREATE OR REPLACE VIEW cv_leaf AS -- cvterms that never appear as the object of a cvterm_relationship
+ SELECT 
+  cv_id,
+  cvterm_id
+ FROM cvterm
+ WHERE 
+  cvterm_id NOT IN ( SELECT object_id FROM cvterm_relationship); -- unlike cv_root there is no is_obsolete filter here
+
+COMMENT ON VIEW cv_leaf IS 'the leaves of a cv are the set of terms
+which have no children (terms that are not the object of a
+relation). All cvs will have at least 1 leaf';
+
+CREATE OR REPLACE VIEW common_ancestor_cvterm AS -- pairs of cvtermpath subjects that share the same object
+ SELECT
+  p1.subject_id          AS cvterm1_id,
+  p2.subject_id          AS cvterm2_id,
+  p1.object_id           AS ancestor_cvterm_id,
+  p1.pathdistance        AS pathdistance1,
+  p2.pathdistance        AS pathdistance2,
+  p1.pathdistance + p2.pathdistance
+                         AS total_pathdistance
+ FROM
+  cvtermpath AS p1,
+  cvtermpath AS p2
+ WHERE 
+  p1.object_id = p2.object_id; -- self-join with no p1/p2 exclusion, so each path is also paired with itself and both orderings appear
+
+COMMENT ON VIEW common_ancestor_cvterm IS 'The common ancestor of any
+two terms is the intersection of both terms ancestors. Two terms can
+have multiple common ancestors. Use total_pathdistance to get the
+least common ancestor';
+
+CREATE OR REPLACE VIEW common_descendant_cvterm AS -- pairs of cvtermpath objects that share the same subject
+ SELECT
+  p1.object_id           AS cvterm1_id,
+  p2.object_id           AS cvterm2_id,
+  p1.subject_id          AS ancestor_cvterm_id, -- NOTE(review): this is the shared subject (the common descendant) despite the alias - renaming would change the view interface
+  p1.pathdistance        AS pathdistance1,
+  p2.pathdistance        AS pathdistance2,
+  p1.pathdistance + p2.pathdistance
+                         AS total_pathdistance
+ FROM
+  cvtermpath AS p1,
+  cvtermpath AS p2
+ WHERE 
+  p1.subject_id = p2.subject_id; -- self-join with no p1/p2 exclusion, so each path is also paired with itself and both orderings appear
+
+COMMENT ON VIEW common_descendant_cvterm IS 'The common descendant of
+any two terms is the intersection of both terms descendants. Two terms
+can have multiple common descendants. Use total_pathdistance to get
+the least common ancestor';
+
+CREATE OR REPLACE VIEW stats_paths_to_root AS -- per subject term: count and avg/min/max pathdistance of cvtermpath rows whose object is a cv_root term
+ SELECT 
+  subject_id                            AS cvterm_id, 
+  count(DISTINCT cvtermpath_id)         AS total_paths,
+  avg(pathdistance)                     AS avg_distance,
+  min(pathdistance)                     AS min_distance,
+  max(pathdistance)                     AS max_distance
+ FROM cvtermpath INNER JOIN cv_root ON (object_id=root_cvterm_id) -- keeps only paths that end at a root
+ GROUP BY cvterm_id; -- groups on the output alias, i.e. on subject_id
+
+COMMENT ON VIEW stats_paths_to_root IS 'per-cvterm statistics on its
+placement in the DAG relative to the root. There may be multiple paths
+from any term to the root. This gives the total number of paths, and
+the average minimum and maximum distances. Here distance is defined by
+cvtermpath.pathdistance';
+CREATE VIEW cv_cvterm_count AS -- one row per cv.name with its number of non-obsolete cvterms
+  SELECT cv.name,count(*) AS num_terms_excl_obs FROM cv INNER JOIN cvterm USING (cv_id) WHERE is_obsolete=0 GROUP BY cv.name; -- a cv with no non-obsolete terms produces no row
+COMMENT ON VIEW cv_cvterm_count IS 'per-cv terms counts (excludes obsoletes)';
+
+CREATE VIEW cv_cvterm_count_with_obs AS -- one row per cv.name with its number of cvterms, obsolete ones included
+  SELECT cv.name,count(*) AS num_terms_incl_obs FROM cv INNER JOIN cvterm USING (cv_id) GROUP BY cv.name; -- a cv with no terms produces no row
+COMMENT ON VIEW cv_cvterm_count_with_obs IS 'per-cv terms counts (includes obsoletes)';
+
+CREATE VIEW cv_link_count AS -- number of cvterm_relationship rows per (cv of the subject, relation name, cv of the relation)
+ SELECT cv.name AS cv_name,
+        relation.name AS relation_name,
+        relation_cv.name AS relation_cv_name,
+        count(*) AS num_links
+ FROM cv 
+  INNER JOIN cvterm ON (cvterm.cv_id=cv.cv_id) 
+  INNER JOIN cvterm_relationship ON (cvterm.cvterm_id=subject_id) -- a link is attributed to the cv of its subject term
+  INNER JOIN cvterm AS relation ON (type_id=relation.cvterm_id) -- resolves the relationship type to its cvterm
+  INNER JOIN cv AS relation_cv ON (relation.cv_id=relation_cv.cv_id) 
+ GROUP BY cv.name,relation.name,relation_cv.name;
+
+COMMENT ON VIEW cv_link_count IS 'per-cv summary of number of
+links (cvterm_relationships) broken down by
+relationship_type. num_links is the total # of links of the specified
+type in which the subject_id of the link is in the named cv';
+
+CREATE VIEW cv_path_count AS -- number of cvtermpath rows per (cv of the subject, relation name, cv of the relation)
+ SELECT cv.name AS cv_name,
+        relation.name AS relation_name,
+        relation_cv.name AS relation_cv_name,
+        count(*) AS num_paths
+ FROM cv 
+  INNER JOIN cvterm ON (cvterm.cv_id=cv.cv_id) 
+  INNER JOIN cvtermpath ON (cvterm.cvterm_id=subject_id) -- a path is attributed to the cv of its subject term
+  INNER JOIN cvterm AS relation ON (type_id=relation.cvterm_id) -- inner join: cvtermpath rows with a NULL type_id are not counted
+  INNER JOIN cv AS relation_cv ON (relation.cv_id=relation_cv.cv_id) 
+ GROUP BY cv.name,relation.name,relation_cv.name;
+
+COMMENT ON VIEW cv_path_count IS 'per-cv summary of number of
+paths (cvtermpaths) broken down by relationship_type. num_paths is the
+total # of paths of the specified type in which the subject_id of the
+path is in the named cv. See also: cv_distinct_relations';
+
+CREATE OR REPLACE FUNCTION _get_all_subject_ids(integer) RETURNS SETOF cvtermpath AS -- arg: object cvterm_id; emits every cvterm_relationship row with that object_id, then recurses on each row's subject_id (reads cvterm_relationship only; no cycle guard is visible)
+'
+DECLARE
+    root alias for $1;
+    cterm cvtermpath%ROWTYPE;
+    cterm2 cvtermpath%ROWTYPE;
+BEGIN
+
+    FOR cterm IN SELECT * FROM cvterm_relationship WHERE object_id = root LOOP
+        RETURN NEXT cterm;
+        FOR cterm2 IN SELECT * FROM _get_all_subject_ids(cterm.subject_id) LOOP
+            RETURN NEXT cterm2;
+        END LOOP;
+    END LOOP;
+    RETURN;
+END;   
+'
+LANGUAGE 'plpgsql';
+
+---arg: parent term id (compared with object_id)
+---return: all child term ids and their parent term ids with relationship type id, as cvtermpath rows
+CREATE OR REPLACE FUNCTION get_all_subject_ids(integer) RETURNS SETOF cvtermpath AS -- if cvtermpath holds a row for this object with pathdistance <= 0, returns its stored rows with pathdistance > 0; otherwise falls back to _get_all_subject_ids
+'
+DECLARE
+    root alias for $1;
+    cterm cvtermpath%ROWTYPE;
+    exist_c int;
+BEGIN
+
+    SELECT INTO exist_c count(*) FROM cvtermpath WHERE object_id = root and pathdistance <= 0;
+    IF (exist_c > 0) THEN
+        FOR cterm IN SELECT * FROM cvtermpath WHERE object_id = root and pathdistance > 0 LOOP
+            RETURN NEXT cterm;
+        END LOOP;
+    ELSE
+        FOR cterm IN SELECT * FROM _get_all_subject_ids(root) LOOP
+            RETURN NEXT cterm;
+        END LOOP;
+    END IF;
+    RETURN;
+END;   
+'
+LANGUAGE 'plpgsql';
+
+CREATE OR REPLACE FUNCTION get_graph_below(integer) RETURNS SETOF cvtermpath AS -- arg: object cvterm_id; emits each cvterm_relationship row with that object_id, each followed by get_all_subject_ids() of its subject_id
+'
+DECLARE
+    root alias for $1;
+    cterm cvtermpath%ROWTYPE;
+    cterm2 cvtermpath%ROWTYPE;
+
+BEGIN
+
+    FOR cterm IN SELECT * FROM cvterm_relationship WHERE object_id = root LOOP
+        RETURN NEXT cterm;
+        FOR cterm2 IN SELECT * FROM get_all_subject_ids(cterm.subject_id) LOOP
+            RETURN NEXT cterm2;
+        END LOOP;
+    END LOOP;
+    RETURN;
+END;   
+'
+LANGUAGE 'plpgsql';
+
+
+--- arg: leaf term id
+--- return: each cvterm_relationship edge directly above the leaf, each one
+---         followed by the rows get_all_object_ids reports for that parent
+CREATE OR REPLACE FUNCTION get_graph_above(integer) RETURNS SETOF cvtermpath AS
+'
+DECLARE
+    bottom_term ALIAS FOR $1;
+    direct_edge cvtermpath%ROWTYPE;
+    nested_row cvtermpath%ROWTYPE;
+BEGIN
+    FOR direct_edge IN
+        SELECT * FROM cvterm_relationship WHERE subject_id = bottom_term
+    LOOP
+        RETURN NEXT direct_edge;
+        FOR nested_row IN
+            SELECT * FROM get_all_object_ids(direct_edge.object_id)
+        LOOP
+            RETURN NEXT nested_row;
+        END LOOP;
+    END LOOP;
+    RETURN;
+END;
+'
+LANGUAGE 'plpgsql';
+
+--- Recursive helper used by get_all_object_ids.
+--- arg: child (subject) term id
+--- return: one row per cvterm_relationship edge found above the given term;
+---         each direct parent edge is emitted before the edges above it
+CREATE OR REPLACE FUNCTION _get_all_object_ids(integer) RETURNS SETOF cvtermpath AS
+'
+DECLARE
+    child_term ALIAS FOR $1;
+    direct_edge cvtermpath%ROWTYPE;
+    nested_row cvtermpath%ROWTYPE;
+BEGIN
+    FOR direct_edge IN
+        SELECT * FROM cvterm_relationship WHERE subject_id = child_term
+    LOOP
+        RETURN NEXT direct_edge;
+        FOR nested_row IN
+            SELECT * FROM _get_all_object_ids(direct_edge.object_id)
+        LOOP
+            RETURN NEXT nested_row;
+        END LOOP;
+    END LOOP;
+    RETURN;
+END;
+'
+LANGUAGE 'plpgsql';
+
+---arg: child term id
+---return: all parent term ids and their children term ids with relationship type id
+CREATE OR REPLACE FUNCTION get_all_object_ids(integer) RETURNS SETOF cvtermpath AS
+'
+DECLARE
+    child_term ALIAS FOR $1;
+    path_row cvtermpath%ROWTYPE;
+BEGIN
+    -- The probe looks for a cvtermpath row with pathdistance <= 0 whose
+    -- object_id is the given term; when one exists the stored paths are used,
+    -- otherwise cvterm_relationship is walked recursively.
+    IF EXISTS (SELECT 1
+                 FROM cvtermpath
+                WHERE object_id = child_term
+                  AND pathdistance <= 0) THEN
+        FOR path_row IN
+            SELECT * FROM cvtermpath
+             WHERE subject_id = child_term
+               AND pathdistance > 0
+        LOOP
+            RETURN NEXT path_row;
+        END LOOP;
+    ELSE
+        FOR path_row IN
+            SELECT * FROM _get_all_object_ids(child_term)
+        LOOP
+            RETURN NEXT path_row;
+        END LOOP;
+    END IF;
+    RETURN;
+END;
+'
+LANGUAGE 'plpgsql';
+
+---arg: sql statement, which must be in the form of select cvterm_id from ...
+---return: the rows produced by the statement plus, for each of them, one row
+---        per child (subject id) reported by get_all_subject_ids
+CREATE OR REPLACE FUNCTION get_it_sub_cvterm_ids(text) RETURNS SETOF cvterm AS
+'
+DECLARE
+    term_query ALIAS FOR $1;
+    seed_term cvterm%ROWTYPE;
+    sub_term cvterm%ROWTYPE;
+BEGIN
+    -- NOTE(review): the argument is executed as SQL text as-is; callers must
+    -- not pass untrusted input.
+    FOR seed_term IN EXECUTE term_query LOOP
+        RETURN NEXT seed_term;
+        -- only the cvterm_id column is supplied for the child rows
+        FOR sub_term IN
+            SELECT subject_id AS cvterm_id
+              FROM get_all_subject_ids(seed_term.cvterm_id)
+        LOOP
+            RETURN NEXT sub_term;
+        END LOOP;
+    END LOOP;
+    RETURN;
+END;
+'
+LANGUAGE 'plpgsql';
+--- example: select * from fill_cvtermpath(7); where 7 is cv_id for an ontology
+--- fill path from the node to its children and their children
+--- args: origin term id, child term id, cv id, relationship type id, depth
+--- return: always 1
+CREATE OR REPLACE FUNCTION _fill_cvtermpath4node(INTEGER, INTEGER, INTEGER, INTEGER, INTEGER) RETURNS INTEGER AS
+'
+DECLARE
+    origin ALIAS FOR $1;
+    child_id ALIAS FOR $2;
+    cvid ALIAS FOR $3;
+    typeid ALIAS FOR $4;
+    depth ALIAS FOR $5;
+    rel cvterm_relationship%ROWTYPE;
+BEGIN
+
+    --- RAISE NOTICE ''depth=% root=%'', depth,child_id;
+    --- type_id is not part of the duplicate check: it may be null and is not
+    --- very meaningful in cvtermpath when pathdistance > 1
+    IF NOT EXISTS (SELECT 1
+                     FROM cvtermpath
+                    WHERE cv_id = cvid
+                      AND object_id = origin
+                      AND subject_id = child_id
+                      AND pathdistance = depth) THEN
+        INSERT INTO cvtermpath (object_id, subject_id, cv_id, type_id, pathdistance)
+        VALUES (origin, child_id, cvid, typeid, depth);
+    END IF;
+
+    -- descend into every child of the current node, one level deeper
+    FOR rel IN
+        SELECT * FROM cvterm_relationship WHERE object_id = child_id
+    LOOP
+        PERFORM _fill_cvtermpath4node(origin, rel.subject_id, cvid, rel.type_id, depth + 1);
+    END LOOP;
+    RETURN 1;
+END;
+'
+LANGUAGE 'plpgsql';
+
+
+--- Fills cvtermpath for one term and, recursively, for every term below it.
+--- args: root term id, cv id
+--- return: always 1
+CREATE OR REPLACE FUNCTION _fill_cvtermpath4root(INTEGER, INTEGER) RETURNS INTEGER AS
+'
+DECLARE
+    rootid alias for $1;
+    cvid alias for $2;
+    ttype int;
+    cterm cvterm_relationship%ROWTYPE;
+
+BEGIN
+
+    -- Relationship type recorded on the zero-distance (term to itself) path.
+    -- NOTE(review): the lookup is not restricted to a cv, so if several
+    -- cvterms are named isa / is_a an arbitrary one is used; confirm.
+    SELECT INTO ttype cvterm_id FROM cvterm WHERE (name = ''isa'' OR name = ''is_a'');
+    PERFORM _fill_cvtermpath4node(rootid, rootid, cvid, ttype, 0);
+    -- every child of this term is then treated as a root of its own subtree
+    FOR cterm IN SELECT * FROM cvterm_relationship WHERE object_id = rootid LOOP
+        PERFORM _fill_cvtermpath4root(cterm.subject_id, cvid);
+        -- RAISE NOTICE ''DONE for term, %'', cterm.subject_id;
+    END LOOP;
+    RETURN 1;
+END;
+'
+LANGUAGE 'plpgsql';
+
+--- Rebuilds the cvtermpath rows of one cv from cvterm_relationship.
+--- arg: cv id
+--- return: always 1
+CREATE OR REPLACE FUNCTION fill_cvtermpath(INTEGER) RETURNS INTEGER AS
+'
+DECLARE
+    cvid ALIAS FOR $1;
+    root_term cvterm%ROWTYPE;
+BEGIN
+    -- start from a clean slate for this cv
+    DELETE FROM cvtermpath WHERE cv_id = cvid;
+
+    -- roots: terms of the cv that are the object of at least one relationship
+    -- and the subject of none
+    FOR root_term IN
+        SELECT DISTINCT t.* from cvterm t LEFT JOIN cvterm_relationship r ON (t.cvterm_id = r.subject_id) INNER JOIN cvterm_relationship r2 ON (t.cvterm_id = r2.object_id) WHERE t.cv_id = cvid AND r.subject_id is null
+    LOOP
+        PERFORM _fill_cvtermpath4root(root_term.cvterm_id, root_term.cv_id);
+    END LOOP;
+    RETURN 1;
+END;
+'
+LANGUAGE 'plpgsql';
+
+--- Name-based wrapper: resolves the cv name to its cv_id and delegates to
+--- fill_cvtermpath(INTEGER).
+--- arg: cv name
+--- return: whatever fill_cvtermpath(INTEGER) returns
+CREATE OR REPLACE FUNCTION fill_cvtermpath(cv.name%TYPE) RETURNS INTEGER AS
+'
+DECLARE
+    cvname ALIAS FOR $1;
+    target_cv int;
+BEGIN
+    SELECT cv.cv_id INTO target_cv
+      FROM cv
+     WHERE cv.name = cvname;
+
+    RETURN fill_cvtermpath(target_cv);
+END;
+'
+LANGUAGE 'plpgsql';
+
+--- Cycle-detecting counterpart of _fill_cvtermpath4node; it records paths in
+--- the temporary table tmpcvtermpath rather than in cvtermpath.
+--- args: origin term id, child term id, cv id, relationship type id, depth
+--- return: a positive cvterm id when a cycle is detected, otherwise 0
+CREATE OR REPLACE FUNCTION _fill_cvtermpath4node2detect_cycle(INTEGER, INTEGER, INTEGER, INTEGER, INTEGER) RETURNS INTEGER AS
+'
+DECLARE
+    origin alias for $1;
+    child_id alias for $2;
+    cvid alias for $3;
+    typeid alias for $4;
+    depth alias for $5;
+    cterm cvterm_relationship%ROWTYPE;
+    exist_c int;
+    ccount  int;
+    ecount  int;
+    rtn     int;
+BEGIN
+
+    -- Below the starting depth, a pair of recorded paths running in both
+    -- directions between origin and child means origin lies on a cycle.
+    -- The literal pieces carry explicit spaces around AND so the generated
+    -- statement never glues a number to a keyword.
+    EXECUTE ''SELECT * FROM tmpcvtermpath p1, tmpcvtermpath p2 WHERE p1.subject_id=p2.object_id AND p1.object_id=p2.subject_id AND p1.object_id = '' || origin || '' AND p2.subject_id = '' || child_id || '' AND '' || depth || '' > 0'';
+    GET DIAGNOSTICS ccount = ROW_COUNT;
+    IF (ccount > 0) THEN
+        --RAISE EXCEPTION ''FOUND CYCLE: node % on cycle path'',origin;
+        RETURN origin;
+    END IF;
+
+    -- This origin/child pair was already recorded (and they differ):
+    -- re-examine the child as a root before going on.
+    EXECUTE ''SELECT * FROM tmpcvtermpath WHERE cv_id = '' || cvid || '' AND object_id = '' || origin || '' AND subject_id = '' || child_id || '' AND '' || origin || ''<>'' || child_id;
+    GET DIAGNOSTICS ecount = ROW_COUNT;
+    IF (ecount > 0) THEN
+        --RAISE NOTICE ''FOUND TWICE (node), will check root obj % subj %'',origin, child_id;
+        SELECT INTO rtn _fill_cvtermpath4root2detect_cycle(child_id, cvid);
+        IF (rtn > 0) THEN
+            RETURN rtn;
+        END IF;
+    END IF;
+
+    -- Record the path at this depth unless it is already there.
+    EXECUTE ''SELECT * FROM tmpcvtermpath WHERE cv_id = '' || cvid || '' AND object_id = '' || origin || '' AND subject_id = '' || child_id || '' AND pathdistance = '' || depth;
+    GET DIAGNOSTICS exist_c = ROW_COUNT;
+    IF (exist_c = 0) THEN
+        -- typeid may be null; concatenating a null would null out the whole
+        -- statement, so the SQL keyword NULL is spliced in instead.
+        EXECUTE ''INSERT INTO tmpcvtermpath (object_id, subject_id, cv_id, type_id, pathdistance) VALUES('' || origin || '', '' || child_id || '', '' || cvid || '', '' || COALESCE(typeid::text, ''NULL'') || '', '' || depth || '')'';
+    END IF;
+
+    -- Descend into the children of the current node; stop at the first cycle.
+    FOR cterm IN SELECT * FROM cvterm_relationship WHERE object_id = child_id LOOP
+        --RAISE NOTICE ''DOING for node, % %'', origin, cterm.subject_id;
+        SELECT INTO rtn _fill_cvtermpath4node2detect_cycle(origin, cterm.subject_id, cvid, cterm.type_id, depth+1);
+        IF (rtn > 0) THEN
+            RETURN rtn;
+        END IF;
+    END LOOP;
+    RETURN 0;
+END;
+'
+LANGUAGE 'plpgsql';
+
+
+--- Cycle-detecting counterpart of _fill_cvtermpath4root; works together with
+--- _fill_cvtermpath4node2detect_cycle on the temporary table tmpcvtermpath.
+--- args: root term id, cv id
+--- return: a positive cvterm id when a cycle is detected, otherwise 0
+CREATE OR REPLACE FUNCTION _fill_cvtermpath4root2detect_cycle(INTEGER, INTEGER) RETURNS INTEGER AS
+'
+DECLARE
+    rootid alias for $1;
+    cvid alias for $2;
+    ttype int;
+    ccount int;
+    cterm cvterm_relationship%ROWTYPE;
+    rtn     int;
+BEGIN
+
+    -- Relationship type recorded on the zero-distance path.
+    -- NOTE(review): the lookup is not restricted to a cv; confirm that an
+    -- arbitrary isa / is_a term is acceptable here.
+    SELECT INTO ttype cvterm_id FROM cvterm WHERE (name = ''isa'' OR name = ''is_a'');
+    SELECT INTO rtn _fill_cvtermpath4node2detect_cycle(rootid, rootid, cvid, ttype, 0);
+    IF (rtn > 0) THEN
+        RETURN rtn;
+    END IF;
+    FOR cterm IN SELECT * FROM cvterm_relationship WHERE object_id = rootid LOOP
+        -- Are paths between this root and the child already recorded in both
+        -- directions?
+        EXECUTE ''SELECT * FROM tmpcvtermpath p1, tmpcvtermpath p2 WHERE p1.subject_id=p2.object_id AND p1.object_id=p2.subject_id AND p1.object_id='' || rootid || '' AND p1.subject_id='' || cterm.subject_id;
+        GET DIAGNOSTICS ccount = ROW_COUNT;
+        IF (ccount > 0) THEN
+            --RAISE NOTICE ''FOUND TWICE (root), will check root obj % subj %'',rootid,cterm.subject_id;
+            SELECT INTO rtn _fill_cvtermpath4node2detect_cycle(rootid, cterm.subject_id, cvid, ttype, 0);
+            IF (rtn > 0) THEN
+                RETURN rtn;
+            END IF;
+        ELSE
+            -- not seen yet: treat the child as the root of its own subtree
+            SELECT INTO rtn _fill_cvtermpath4root2detect_cycle(cterm.subject_id, cvid);
+            IF (rtn > 0) THEN
+                RETURN rtn;
+            END IF;
+        END IF;
+    END LOOP;
+    RETURN 0;
+END;
+'
+LANGUAGE 'plpgsql';
+
+--- Looks for a cycle reachable from one given term.
+--- args: cv id, root term id
+--- return: a positive cvterm id when a cycle is detected, otherwise 0
+CREATE OR REPLACE FUNCTION get_cycle_cvterm_id(INTEGER, INTEGER) RETURNS INTEGER AS
+'
+DECLARE
+    cvid ALIAS FOR $1;
+    rootid ALIAS FOR $2;
+    cycle_term int;
+BEGIN
+    -- scratch table used by the detect_cycle helpers
+    CREATE TEMP TABLE tmpcvtermpath(object_id int, subject_id int, cv_id int, type_id int, pathdistance int);
+    CREATE INDEX tmp_cvtpath1 ON tmpcvtermpath(object_id, subject_id);
+
+    cycle_term := _fill_cvtermpath4root2detect_cycle(rootid, cvid);
+
+    -- the scratch table is dropped whatever the outcome
+    DROP TABLE tmpcvtermpath;
+
+    IF (cycle_term > 0) THEN
+        RETURN cycle_term;
+    END IF;
+    RETURN 0;
+END;
+'
+LANGUAGE 'plpgsql';
+
+--- Runs the two-argument get_cycle_cvterm_id for every term of a cv.
+--- arg: cv id
+--- return: the positive results of those calls, one row each
+CREATE OR REPLACE FUNCTION get_cycle_cvterm_ids(INTEGER) RETURNS SETOF INTEGER AS
+'
+DECLARE
+    cvid ALIAS FOR $1;
+    start_term cvterm%ROWTYPE;
+    cycle_term int;
+BEGIN
+    FOR start_term IN
+        SELECT DISTINCT t.* from cvterm t WHERE cv_id = cvid
+    LOOP
+        cycle_term := get_cycle_cvterm_id(cvid, start_term.cvterm_id);
+        IF (cycle_term > 0) THEN
+            RETURN NEXT cycle_term;
+        END IF;
+    END LOOP;
+    RETURN;
+END;
+'
+LANGUAGE 'plpgsql';
+
+--- Looks for a cycle starting from the root terms of a cv.
+--- arg: cv id
+--- return: the first positive cvterm id reported by the detect_cycle helpers,
+---         or 0 when none is reported
+CREATE OR REPLACE FUNCTION get_cycle_cvterm_id(INTEGER) RETURNS INTEGER AS
+'
+DECLARE
+    cvid ALIAS FOR $1;
+    root_term cvterm%ROWTYPE;
+    probe int;
+    cycle_term int := 0;
+BEGIN
+    -- scratch table used by the detect_cycle helpers
+    CREATE TEMP TABLE tmpcvtermpath(object_id int, subject_id int, cv_id int, type_id int, pathdistance int);
+    CREATE INDEX tmp_cvtpath1 ON tmpcvtermpath(object_id, subject_id);
+
+    -- roots: terms of the cv that are the object of at least one relationship
+    -- and the subject of none
+    FOR root_term IN
+        SELECT DISTINCT t.* from cvterm t LEFT JOIN cvterm_relationship r ON (t.cvterm_id = r.subject_id) INNER JOIN cvterm_relationship r2 ON (t.cvterm_id = r2.object_id) WHERE t.cv_id = cvid AND r.subject_id is null
+    LOOP
+        probe := _fill_cvtermpath4root2detect_cycle(root_term.cvterm_id, root_term.cv_id);
+        IF (probe > 0) THEN
+            cycle_term := probe;
+            EXIT;
+        END IF;
+    END LOOP;
+
+    DROP TABLE tmpcvtermpath;
+    RETURN cycle_term;
+END;
+'
+LANGUAGE 'plpgsql';
+
+--- Name-based wrapper: resolves the cv name to its cv_id and delegates to
+--- get_cycle_cvterm_id(INTEGER).
+--- arg: cv name
+--- return: whatever get_cycle_cvterm_id(INTEGER) returns
+CREATE OR REPLACE FUNCTION get_cycle_cvterm_id(cv.name%TYPE) RETURNS INTEGER AS
+'
+DECLARE
+    cvname ALIAS FOR $1;
+    target_cv int;
+BEGIN
+    SELECT cv.cv_id INTO target_cv
+      FROM cv
+     WHERE cv.name = cvname;
+
+    RETURN get_cycle_cvterm_id(target_cv);
+END;
+'
+LANGUAGE 'plpgsql';
+-- $Id: pub.sql,v 1.27 2007-02-19 20:50:44 briano Exp $
+-- ==========================================
+-- Chado pub module
+--
+-- =================================================================
+-- Dependencies:
+--
+-- :import cvterm from cv
+-- :import dbxref from general
+-- =================================================================
+
+-- ================================================
+-- TABLE: pub
+-- ================================================
+
+create table pub (
+    -- surrogate primary key
+    pub_id serial not null,
+    primary key (pub_id),
+    title text,
+    volumetitle text,
+    volume varchar(255),
+    series_name varchar(255),
+    issue varchar(255),
+    pyear varchar(255),
+    pages varchar(255),
+    miniref varchar(255),
+    -- natural key; uniqueness is enforced by constraint pub_c1 below
+    uniquename text not null,
+    -- publication type; deleting the referenced cvterm cascades to this row
+    type_id int not null,
+    foreign key (type_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    is_obsolete boolean default 'false',
+    publisher varchar(255),
+    pubplace varchar(255),
+    constraint pub_c1 unique (uniquename)
+);
+-- index on the foreign key column type_id
+CREATE INDEX pub_idx1 ON pub (type_id);
+
+COMMENT ON TABLE pub IS 'A documented provenance artefact - publications,
+documents, personal communication.';
+COMMENT ON COLUMN pub.title IS 'Descriptive general heading.';
+COMMENT ON COLUMN pub.volumetitle IS 'Title of part if one of a series.';
+COMMENT ON COLUMN pub.series_name IS 'Full name of (journal) series.';
+COMMENT ON COLUMN pub.pages IS 'Page number range[s], e.g. 457--459, viii + 664pp, lv--lvii.';
+COMMENT ON COLUMN pub.type_id IS  'The type of the publication (book, journal, poem, graffiti, etc). Uses pub cv.';
+
+-- ================================================
+-- TABLE: pub_relationship
+-- ================================================
+
+create table pub_relationship (
+    -- surrogate primary key
+    pub_relationship_id serial not null,
+    primary key (pub_relationship_id),
+    -- both ends of the relationship are pubs; deleting either pub cascades
+    subject_id int not null,
+    foreign key (subject_id) references pub (pub_id) on delete cascade INITIALLY DEFERRED,
+    object_id int not null,
+    foreign key (object_id) references pub (pub_id) on delete cascade INITIALLY DEFERRED,
+    -- kind of relationship, as a cvterm
+    type_id int not null,
+    foreign key (type_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+
+    -- a given (subject, object, type) triple may be stored only once
+    constraint pub_relationship_c1 unique (subject_id,object_id,type_id)
+);
+-- one index per foreign key column
+create index pub_relationship_idx1 on pub_relationship (subject_id);
+create index pub_relationship_idx2 on pub_relationship (object_id);
+create index pub_relationship_idx3 on pub_relationship (type_id);
+
+COMMENT ON TABLE pub_relationship IS 'Handle relationships between
+publications, e.g. when one publication makes others obsolete, when one
+publication contains errata with respect to other publication(s), or
+when one publication also appears in another pub.';
+
+-- ================================================
+-- TABLE: pub_dbxref
+-- ================================================
+
+create table pub_dbxref (
+    -- surrogate primary key
+    pub_dbxref_id serial not null,
+    primary key (pub_dbxref_id),
+    -- link row: deleting either the pub or the dbxref cascades to it
+    pub_id int not null,
+    foreign key (pub_id) references pub (pub_id) on delete cascade INITIALLY DEFERRED,
+    dbxref_id int not null,
+    foreign key (dbxref_id) references dbxref (dbxref_id) on delete cascade INITIALLY DEFERRED,
+    is_current boolean not null default 'true',
+    -- a pub may be linked to a given dbxref only once
+    constraint pub_dbxref_c1 unique (pub_id,dbxref_id)
+);
+-- one index per foreign key column
+create index pub_dbxref_idx1 on pub_dbxref (pub_id);
+create index pub_dbxref_idx2 on pub_dbxref (dbxref_id);
+
+COMMENT ON TABLE pub_dbxref IS 'Handle links to repositories,
+e.g. Pubmed, Biosis, zoorec, OCLC, Medline, ISSN, coden...';
+
+
+-- ================================================
+-- TABLE: pubauthor
+-- ================================================
+
+create table pubauthor (
+    -- surrogate primary key
+    pubauthor_id serial not null,
+    primary key (pubauthor_id),
+    -- owning publication; deleting the pub cascades to its authors
+    pub_id int not null,
+    foreign key (pub_id) references pub (pub_id) on delete cascade INITIALLY DEFERRED,
+    -- position of the author within the author list of the pub
+    rank int not null,
+    editor boolean default 'false',
+    surname varchar(100) not null,
+    givennames varchar(100),
+    suffix varchar(100),
+
+    -- only one author per position within a pub
+    constraint pubauthor_c1 unique (pub_id, rank)
+);
+-- index on the foreign key column pub_id
+create index pubauthor_idx2 on pubauthor (pub_id);
+
+COMMENT ON TABLE pubauthor IS 'An author for a publication. Note the denormalisation (hence lack of _ in table name) - this is deliberate as it is in general too hard to assign IDs to authors.';
+COMMENT ON COLUMN pubauthor.givennames IS 'First name, initials';
+COMMENT ON COLUMN pubauthor.suffix IS 'Jr., Sr., etc';
+COMMENT ON COLUMN pubauthor.rank IS 'Order of author in author list for this pub - order is important.';
+COMMENT ON COLUMN pubauthor.editor IS 'Indicates whether the author is an editor for linked publication. Note: this is a boolean field but does not follow the normal chado convention for naming booleans.';
+
+
+-- ================================================
+-- TABLE: pubprop
+-- ================================================
+
+create table pubprop (
+    -- surrogate primary key
+    pubprop_id serial not null,
+    primary key (pubprop_id),
+    -- owning publication; deleting the pub cascades to its properties
+    pub_id int not null,
+    foreign key (pub_id) references pub (pub_id) on delete cascade INITIALLY DEFERRED,
+    -- property name, as a cvterm
+    type_id int not null,
+    foreign key (type_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    value text not null,
+    -- NOTE(review): rank is nullable and has no default here, whereas
+    -- organismprop declares "rank int not null default 0". Rows with a NULL
+    -- rank are not treated as duplicates by the unique constraint below;
+    -- confirm this is intended.
+    rank integer,
+
+    constraint pubprop_c1 unique (pub_id,type_id,rank)
+);
+-- one index per foreign key column
+create index pubprop_idx1 on pubprop (pub_id);
+create index pubprop_idx2 on pubprop (type_id);
+
+COMMENT ON TABLE pubprop IS 'Property-value pairs for a pub. Follows standard chado pattern.';
+-- $Id: organism.sql,v 1.19 2007-04-01 18:45:41 briano Exp $
+-- ==========================================
+-- Chado organism module
+--
+-- ============
+-- DEPENDENCIES
+-- ============
+-- :import cvterm from cv
+-- :import dbxref from general
+-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+
+-- ================================================
+-- TABLE: organism
+-- ================================================
+
+create table organism (
+	-- surrogate primary key
+	organism_id serial not null,
+	primary key (organism_id),
+	abbreviation varchar(255) null,
+	-- genus and species are mandatory and together form the natural key
+	genus varchar(255) not null,
+	species varchar(255) not null,
+	common_name varchar(255) null,
+	comment text null,
+	constraint organism_c1 unique (genus,species)
+);
+
+COMMENT ON TABLE organism IS 'The organismal taxonomic
+classification. Note that phylogenies are represented using the
+phylogeny module, and taxonomies can be represented using the cvterm
+module or the phylogeny module.';
+
+COMMENT ON COLUMN organism.species IS 'A type of organism is always
+uniquely identified by genus and species. When mapping from the NCBI
+taxonomy names.dmp file, this column must be used where it
+is present, as the common_name column is not always unique (e.g. environmental
+samples). If a particular strain or subspecies is to be represented,
+this is appended onto the species name. Follows standard NCBI taxonomy
+pattern.';
+
+-- ================================================
+-- TABLE: organism_dbxref
+-- ================================================
+
+create table organism_dbxref (
+    -- surrogate primary key
+    organism_dbxref_id serial not null,
+    primary key (organism_dbxref_id),
+    -- link row: deleting either the organism or the dbxref cascades to it
+    organism_id int not null,
+    foreign key (organism_id) references organism (organism_id) on delete cascade INITIALLY DEFERRED,
+    dbxref_id int not null,
+    foreign key (dbxref_id) references dbxref (dbxref_id) on delete cascade INITIALLY DEFERRED,
+    -- an organism may be linked to a given dbxref only once
+    constraint organism_dbxref_c1 unique (organism_id,dbxref_id)
+);
+-- one index per foreign key column
+create index organism_dbxref_idx1 on organism_dbxref (organism_id);
+create index organism_dbxref_idx2 on organism_dbxref (dbxref_id);
+
+-- ================================================
+-- TABLE: organismprop
+-- ================================================
+
+create table organismprop (
+    -- surrogate primary key
+    organismprop_id serial not null,
+    primary key (organismprop_id),
+    -- owning organism; deleting the organism cascades to its properties
+    organism_id int not null,
+    foreign key (organism_id) references organism (organism_id) on delete cascade INITIALLY DEFERRED,
+    -- property name, as a cvterm
+    type_id int not null,
+    foreign key (type_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    value text null,
+    -- distinguishes several values of the same property; defaults to 0
+    rank int not null default 0,
+    constraint organismprop_c1 unique (organism_id,type_id,rank)
+);
+-- one index per foreign key column
+create index organismprop_idx1 on organismprop (organism_id);
+create index organismprop_idx2 on organismprop (type_id);
+
+COMMENT ON TABLE organismprop IS 'Tag-value properties - follows standard chado model.';
+
+
+--- args: genus, species
+--- return: organism_id of the organism row with that genus and species
+CREATE OR REPLACE FUNCTION get_organism_id(VARCHAR,VARCHAR) RETURNS INT
+ AS '
+  SELECT o.organism_id
+    FROM organism AS o
+   WHERE o.genus = $1
+     AND o.species = $2
+ ' LANGUAGE 'sql';
+
+--- arg: full name in the form genus, one space, species
+--- return: organism_id of the matching organism row; no row (NULL) when the
+---         argument contains no space
+CREATE OR REPLACE FUNCTION get_organism_id(VARCHAR) RETURNS INT
+ AS ' 
+SELECT organism_id
+  FROM organism
+  -- split_part yields the text before the first space without computing a
+  -- substring length, so an argument without a space no longer raises
+  -- a negative-substring-length error; it simply matches nothing
+  WHERE position('' '' IN $1) > 0
+    AND genus=split_part($1,'' '',1)
+    AND species=substring($1,position('' '' IN $1)+1)
+ ' LANGUAGE 'sql';
+
+--- arg: abbreviated name: the first character is compared with the first
+---      letter of genus, the text after the first space with species
+--- return: organism_id of a matching organism row
+CREATE OR REPLACE FUNCTION get_organism_id_abbrev(VARCHAR) RETURNS INT
+ AS '
+  SELECT o.organism_id
+    FROM organism AS o
+   WHERE substr(o.genus,1,1) = substring($1,1,1)
+     AND o.species = substring($1,position('' '' IN $1)+1)
+ ' LANGUAGE 'sql';
+
+--- Inserts an organism, or updates the common name of an existing one.
+--- args: genus, species, common name
+--- return: organism_id of the inserted or updated row
+CREATE OR REPLACE FUNCTION store_organism (VARCHAR,VARCHAR,VARCHAR) 
+  RETURNS INT AS 
+'DECLARE
+   new_genus          ALIAS FOR $1;
+   new_species        ALIAS FOR $2;
+   new_common_name    ALIAS FOR $3;
+
+   existing_id        INTEGER;
+ BEGIN
+    SELECT INTO existing_id organism_id
+      FROM organism
+     WHERE genus = new_genus
+       AND species = new_species;
+
+    -- known organism: only the common name is refreshed
+    IF FOUND THEN
+      UPDATE organism
+         SET common_name = new_common_name
+       WHERE organism_id = existing_id;
+      RETURN existing_id;
+    END IF;
+
+    -- unknown organism: insert it and report the id the sequence just issued
+    INSERT INTO organism (genus, species, common_name)
+    VALUES (new_genus, new_species, new_common_name);
+    RETURN currval(''organism_organism_id_seq'');
+ END;
+' LANGUAGE 'plpgsql';
+  
+-- $Id: sequence.sql,v 1.69 2009-05-14 02:44:23 scottcain Exp $
+-- ==========================================
+-- Chado sequence module
+--
+-- =================================================================
+-- Dependencies:
+--
+-- :import cvterm from cv
+-- :import pub from pub
+-- :import organism from organism
+-- :import dbxref from general
+-- =================================================================
+
+-- ================================================
+-- TABLE: feature
+-- ================================================
+
+create table feature (
+    -- surrogate primary key
+    feature_id serial not null,
+    primary key (feature_id),
+    -- optional; set to null (not cascaded) when the dbxref is deleted
+    dbxref_id int,
+    foreign key (dbxref_id) references dbxref (dbxref_id) on delete set null INITIALLY DEFERRED,
+    -- mandatory; deleting the organism cascades to its features
+    organism_id int not null,
+    foreign key (organism_id) references organism (organism_id) on delete cascade INITIALLY DEFERRED,
+    name varchar(255),
+    uniquename text not null,
+    residues text,
+    seqlen int,
+    md5checksum char(32),
+    -- feature type, as a cvterm
+    type_id int not null,
+    foreign key (type_id) references cvterm (cvterm_id) on delete cascade INITIALLY DEFERRED,
+    is_analysis boolean not null default 'false',
+    is_obsolete boolean not null default 'false',
+    -- both timestamps default to the time of insertion
+    timeaccessioned timestamp not null default current_timestamp,
+    timelastmodified timestamp not null default current_timestamp,
+    -- uniquename only has to be unique per organism and feature type
+    constraint feature_c1 unique (organism_id,uniquename,type_id)
+);
+-- standalone sequence; it is not attached to any column in this statement
+create sequence feature_uniquename_seq;
+create index feature_name_ind1 on feature(name);
+create index feature_idx1 on feature (dbxref_id);
+create index feature_idx2 on feature (organism_id);
+create index feature_idx3 on feature (type_id);
+create index feature_idx4 on feature (uniquename);
+-- expression index for case-insensitive lookups by name
+create index feature_idx5 on feature (lower(name));
+
+-- store residues out of line and uncompressed
+ALTER TABLE feature ALTER residues SET STORAGE EXTERNAL;
+
+COMMENT ON TABLE feature IS 'A feature is a biological sequence or a
+section of a biological sequence, or a collection of such
+sections. Examples include genes, exons, transcripts, regulatory
+regions, polypeptides, protein domains, chromosome sequences, sequence
+variations, cross-genome match regions such as hits and HSPs and so
+on; see the Sequence Ontology for more. The combination of
+organism_id, uniquename and type_id should be unique.';
+
+COMMENT ON COLUMN feature.dbxref_id IS 'An optional primary public stable
+identifier for this feature. Secondary identifiers and external
+dbxrefs go in the table feature_dbxref.';
+
+COMMENT ON COLUMN feature.organism_id IS 'The organism to which this feature
+belongs. This column is mandatory.';
+
+COMMENT ON COLUMN feature.name IS 'The optional human-readable common name for
+a feature, for display purposes.';
+
+COMMENT ON COLUMN feature.uniquename IS 'The unique name for a feature; may
+not necessarily be particularly human-readable, although this is
+preferred. This name must be unique for this type of feature within
+this organism.';
+
+COMMENT ON COLUMN feature.residues IS 'A sequence of alphabetic characters
+representing biological residues (nucleic acids, amino acids). This
+column does not need to be manifested for all features; it is optional
+for features such as exons where the residues can be derived from the
+featureloc. It is recommended that the value for this column be
+manifested for features which may have non-contiguous sublocations (e.g.
+transcripts), since derivation at query time is non-trivial. For
+expressed sequence, the DNA sequence should be used rather than the
+RNA sequence. The default storage method for the residues column is
+EXTERNAL, which will store it uncompressed to make substring operations
+faster.';
+
+COMMENT ON COLUMN feature.seqlen IS 'The length of the residue feature. See
+column:residues. This column is partially redundant with the residues
+column, and also with featureloc. This column is required because the
+location may be unknown and the residue sequence may not be
+manifested, yet it may be desirable to store and query the length of
+the feature. The seqlen should always be manifested where the length
+of the sequence is known.';
+
+COMMENT ON COLUMN feature.md5checksum IS 'The 32-character checksum of the sequence,
+calculated using the MD5 algorithm. This is practically guaranteed to
+be unique for any feature. This column thus acts as a unique
+identifier on the mathematical sequence.';
+
+COMMENT ON COLUMN feature.type_id IS 'A required reference to a table:cvterm
+giving the feature type. This will typically be a Sequence Ontology
+identifier. This column is thus used to subclass the feature table.';
+
+COMMENT ON COLUMN feature.is_analysis IS 'Boolean indicating whether this
+feature is annotated or the result of an automated analysis. Analysis
+results also use the companalysis module. Note that the dividing line
+between analysis and annotation may be fuzzy, this should be determined on
+a per-project basis in a consistent manner. One requirement is that
+there should only be one non-analysis version of each wild-type gene
+feature in a genome, whereas the same gene feature can be predicted
+multiple times in different analyses.';
+
+COMMENT ON COLUMN feature.is_obsolete IS 'Boolean indicating whether this
+feature has been obsoleted. Some chado instances may choose to simply
+remove the feature altogether, others may choose to keep an obsolete
+row in the table.';
+
+COMMENT ON COLUMN feature.timeaccessioned IS 'For handling object
+accession or modification timestamps (as opposed to database auditing data,
+handled elsewhere). The expectation is that these fields would be
+available to software interacting with chado.';
+
+COMMENT ON COLUMN feature.timelastmodified IS 'For handling object
+accession or modification timestamps (as opposed to database auditing data,
+handled elsewhere). The expectation is that these fields would be
+available to software interacting with chado.';
+
+--- COMMENT ON INDEX feature_c1 IS 'Any feature can be globally identified
+--- by the combination of organism, uniquename and feature type';
+
+-- ================================================
+-- TABLE: featureloc
+-- ================================================
+
+create table featureloc (
+    -- surrogate primary key
+    featureloc_id serial not null,
+    primary key (featureloc_id),
+    -- the feature being located; deleting it cascades to its locations
+    feature_id int not null,
+    foreign key (feature_id) references feature (feature_id) on delete cascade INITIALLY DEFERRED,
+    -- the feature the location is relative to; optional, and set to null
+    -- (not cascaded) when that feature is deleted
+    srcfeature_id int,
+    foreign key (srcfeature_id) references feature (feature_id) on delete set null INITIALLY DEFERRED,
+    fmin int,
+    is_fmin_partial boolean not null default 'false',
+    fmax int,
+    is_fmax_partial boolean not null default 'false',
+    strand smallint,
+    phase int,
+    residue_info text,
+    locgroup int not null default 0,
+    rank int not null default 0,
+    -- one location per (feature, locgroup, rank)
+    constraint featureloc_c1 unique (feature_id,locgroup,rank),
+    -- fmin may equal fmax but never exceed it
+    constraint featureloc_c2 check (fmin <= fmax)
+);
+create index featureloc_idx1 on featureloc (feature_id);
+create index featureloc_idx2 on featureloc (srcfeature_id);
+-- composite index over the source feature and both coordinates
+create index featureloc_idx3 on featureloc (srcfeature_id,fmin,fmax);
+
+COMMENT ON TABLE featureloc IS 'The location of a feature relative to
+another feature. Important: interbase coordinates are used. This is
+vital as it allows us to represent zero-length features e.g. splice
+sites, insertion points without an awkward fuzzy system. Features
+typically...
 
[truncated message content]

Thread: [Gmod-schema-cmts] SF.net SVN: gmod:[25108] schema/trunk/chado (Page 2)

gmod-schema-cmts