123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517 |
- <?php
- function tripal_chado_add_tripal_gff_temp_table() {
- $schema = [
- 'table' => 'tripal_gff_temp',
- 'fields' => [
- 'feature_id' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'organism_id' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'uniquename' => [
- 'type' => 'text',
- 'not null' => TRUE,
- ],
- 'type_name' => [
- 'type' => 'varchar',
- 'length' => '1024',
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'tripal_gff_temp_idx0' => ['feature_id'],
- 'tripal_gff_temp_idx0' => ['organism_id'],
- 'tripal_gff_temp_idx1' => ['uniquename'],
- ],
- 'unique keys' => [
- 'tripal_gff_temp_uq0' => ['feature_id'],
- 'tripal_gff_temp_uq1' => ['uniquename', 'organism_id', 'type_name'],
- ],
- ];
- chado_create_custom_table('tripal_gff_temp', $schema, TRUE, NULL, FALSE);
- }
- /**
- *
- */
- function tripal_chado_add_tripal_gffcds_temp_table() {
- $schema = [
- 'table' => 'tripal_gffcds_temp',
- 'fields' => [
- 'feature_id' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'parent_id' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'phase' => [
- 'type' => 'int',
- 'not null' => FALSE,
- ],
- 'strand' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'fmin' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'fmax' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'tripal_gff_temp_idx0' => ['feature_id'],
- 'tripal_gff_temp_idx0' => ['parent_id'],
- ],
- ];
- chado_create_custom_table('tripal_gffcds_temp', $schema, TRUE, NULL, FALSE);
- }
- /**
- *
- */
- function tripal_chado_add_tripal_gffprotein_temp_table() {
- $schema = [
- 'table' => 'tripal_gffprotein_temp',
- 'fields' => [
- 'feature_id' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'parent_id' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'fmin' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'fmax' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'tripal_gff_temp_idx0' => ['feature_id'],
- 'tripal_gff_temp_idx0' => ['parent_id'],
- ],
- 'unique keys' => [
- 'tripal_gff_temp_uq0' => ['feature_id'],
- ],
- ];
- chado_create_custom_table('tripal_gffprotein_temp', $schema, TRUE, NULL, FALSE);
- }
- /**
- * Creates a temporary table to store obo details while loading an obo file
- *
- */
- function tripal_chado_add_tripal_obo_temp_table() {
- // the tripal_obo_temp table is used for temporary housing of records when loading OBO files
- // we create it here using plain SQL because we want it to be in the chado schema but we
- // do not want to use the Tripal Custom Table API because we don't want it to appear in the
- // list of custom tables. It needs to be available for the Tripal Chado API so we create it
- // here and then define it in the tripal_cv/api/tripal_cv.schema.api.inc
- if (!chado_table_exists('tripal_obo_temp')) {
- $sql = "
- CREATE TABLE {tripal_obo_temp} (
- id character varying(255) NOT NULL,
- stanza text NOT NULL,
- type character varying(50) NOT NULL,
- CONSTRAINT tripal_obo_temp_uq0 UNIQUE (id)
- );
- ";
- chado_query($sql);
- $sql = "CREATE INDEX tripal_obo_temp_idx0 ON {tripal_obo_temp} USING btree (id)";
- chado_query($sql);
- $sql = "CREATE INDEX tripal_obo_temp_idx1 ON {tripal_obo_temp} USING btree (type)";
- chado_query($sql);
- }
- }
- /**
- * Creates a materialized view that stores the type & number of stocks per
- * organism
- *
- * @ingroup tripal_stock
- */
- function tripal_chado_add_organism_stock_count_mview() {
- $view_name = 'organism_stock_count';
- $comment = 'Stores the type and number of stocks per organism';
- $schema = [
- 'description' => $comment,
- 'table' => $view_name,
- 'fields' => [
- 'organism_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'genus' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => TRUE,
- ],
- 'species' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => TRUE,
- ],
- 'common_name' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => FALSE,
- ],
- 'num_stocks' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'cvterm_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'stock_type' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'organism_stock_count_idx1' => ['organism_id'],
- 'organism_stock_count_idx2' => ['cvterm_id'],
- 'organism_stock_count_idx3' => ['stock_type'],
- ],
- ];
- $sql = "
- SELECT
- O.organism_id, O.genus, O.species, O.common_name,
- count(S.stock_id) as num_stocks,
- CVT.cvterm_id, CVT.name as stock_type
- FROM organism O
- INNER JOIN stock S ON O.Organism_id = S.organism_id
- INNER JOIN cvterm CVT ON S.type_id = CVT.cvterm_id
- GROUP BY
- O.Organism_id, O.genus, O.species, O.common_name, CVT.cvterm_id, CVT.name
- ";
- chado_add_mview($view_name, 'tripal_stock', $schema, $sql, $comment, FALSE);
- }
- /**
- * Adds a materialized view keeping track of the type of features associated
- * with each library
- *
- * @ingroup tripal_library
- */
- function tripal_chado_add_library_feature_count_mview() {
- $view_name = 'library_feature_count';
- $comment = 'Provides count of feature by type that are associated with all libraries';
- $schema = [
- 'table' => $view_name,
- 'description' => $comment,
- 'fields' => [
- 'library_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'name' => [
- 'type' => 'varchar',
- 'length' => 255,
- 'not null' => TRUE,
- ],
- 'num_features' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'feature_type' => [
- 'type' => 'varchar',
- 'length' => 255,
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'library_feature_count_idx1' => ['library_id'],
- ],
- ];
- $sql = "
- SELECT
- L.library_id, L.name,
- count(F.feature_id) as num_features,
- CVT.name as feature_type
- FROM library L
- INNER JOIN library_feature LF ON LF.library_id = L.library_id
- INNER JOIN feature F ON LF.feature_id = F.feature_id
- INNER JOIN cvterm CVT ON F.type_id = CVT.cvterm_id
- GROUP BY L.library_id, L.name, CVT.name
- ";
- chado_add_mview($view_name, 'tripal_library', $schema, $sql, $comment, FALSE);
- }
- /**
- *
- */
- /**
- * Creates a materialized view that stores the type & number of features per
- * organism
- *
- * @ingroup tripal_feature
- */
- function tripal_chado_add_organism_feature_count_mview() {
- $view_name = 'organism_feature_count';
- $comment = 'Stores the type and number of features per organism';
- $schema = [
- 'description' => $comment,
- 'table' => $view_name,
- 'fields' => [
- 'organism_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'genus' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => TRUE,
- ],
- 'species' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => TRUE,
- ],
- 'common_name' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => FALSE,
- ],
- 'num_features' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'cvterm_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'feature_type' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'organism_feature_count_idx1' => ['organism_id'],
- 'organism_feature_count_idx2' => ['cvterm_id'],
- 'organism_feature_count_idx3' => ['feature_type'],
- ],
- ];
- $sql = "
- SELECT
- O.organism_id, O.genus, O.species, O.common_name,
- count(F.feature_id) as num_features,
- CVT.cvterm_id, CVT.name as feature_type
- FROM organism O
- INNER JOIN feature F ON O.Organism_id = F.organism_id
- INNER JOIN cvterm CVT ON F.type_id = CVT.cvterm_id
- GROUP BY
- O.Organism_id, O.genus, O.species, O.common_name, CVT.cvterm_id, CVT.name
- ";
- chado_add_mview($view_name, 'tripal_feature', $schema, $sql, $comment, FALSE);
- }
- /**
- * Creates a view showing the link between an organism & it's analysis through
- * associated features.
- *
- */
- function tripal_chado_add_analysis_organism_mview() {
- $view_name = 'analysis_organism';
- $comment = t('This view is for associating an organism (via it\'s associated features) to an analysis.');
- // this is the SQL used to identify the organism to which an analsysis
- // has been used. This is obtained though the analysisfeature -> feature -> organism
- // joins
- $sql = "
- SELECT DISTINCT A.analysis_id, O.organism_id
- FROM analysis A
- INNER JOIN analysisfeature AF ON A.analysis_id = AF.analysis_id
- INNER JOIN feature F ON AF.feature_id = F.feature_id
- INNER JOIN organism O ON O.organism_id = F.organism_id
- ";
- // the schema array for describing this view
- $schema = [
- 'table' => $view_name,
- 'description' => $comment,
- 'fields' => [
- 'analysis_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'organism_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'networkmod_qtl_indx0' => ['analysis_id'],
- 'networkmod_qtl_indx1' => ['organism_id'],
- ],
- 'foreign keys' => [
- 'analysis' => [
- 'table' => 'analysis',
- 'columns' => [
- 'analysis_id' => 'analysis_id',
- ],
- ],
- 'organism' => [
- 'table' => 'organism',
- 'columns' => [
- 'organism_id' => 'organism_id',
- ],
- ],
- ],
- ];
- // add the view
- chado_add_mview($view_name, 'tripal_analysis', $schema, $sql, $comment, FALSE);
- }
- /**
- * Add a materialized view that maps cv to db records.
- *
- * This is needed for viewing cv trees
- *
- */
- function tripal_chado_add_db2cv_mview_mview() {
- $mv_name = 'db2cv_mview';
- $comment = 'A table for quick lookup of the vocabularies and the databases they are associated with.';
- $schema = [
- 'table' => $mv_name,
- 'description' => $comment,
- 'fields' => [
- 'cv_id' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'cvname' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => TRUE,
- ],
- 'db_id' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'dbname' => [
- 'type' => 'varchar',
- 'length' => '255',
- 'not null' => TRUE,
- ],
- 'num_terms' => [
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'cv_id_idx' => ['cv_id'],
- 'cvname_idx' => ['cvname'],
- 'db_id_idx' => ['db_id'],
- 'dbname_idx' => ['db_id'],
- ],
- ];
- $sql = "
- SELECT DISTINCT CV.cv_id, CV.name as cvname, DB.db_id, DB.name as dbname,
- COUNT(CVT.cvterm_id) as num_terms
- FROM cv CV
- INNER JOIN cvterm CVT on CVT.cv_id = CV.cv_id
- INNER JOIN dbxref DBX on DBX.dbxref_id = CVT.dbxref_id
- INNER JOIN db DB on DB.db_id = DBX.db_id
- WHERE CVT.is_relationshiptype = 0 and CVT.is_obsolete = 0
- GROUP BY CV.cv_id, CV.name, DB.db_id, DB.name
- ORDER BY DB.name
- ";
- // Create the MView
- chado_add_mview($mv_name, 'tripal_chado', $schema, $sql, $comment, FALSE);
- }
- /**
- * Add a materialized view of root terms for all chado cvs.
- *
- * This is needed for viewing cv trees
- *
- */
- function tripal_chado_add_cv_root_mview_mview() {
- $mv_name = 'cv_root_mview';
- $comment = 'A list of the root terms for all controlled vocabularies. This is needed for viewing CV trees';
- $schema = [
- 'table' => $mv_name,
- 'description' => $comment,
- 'fields' => [
- 'name' => [
- 'type' => 'varchar',
- 'length' => 255,
- 'not null' => TRUE,
- ],
- 'cvterm_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'cv_id' => [
- 'size' => 'big',
- 'type' => 'int',
- 'not null' => TRUE,
- ],
- 'cv_name' => [
- 'type' => 'varchar',
- 'length' => 255,
- 'not null' => TRUE,
- ],
- ],
- 'indexes' => [
- 'cv_root_mview_indx1' => ['cvterm_id'],
- 'cv_root_mview_indx2' => ['cv_id'],
- ],
- ];
- $sql = "
- SELECT DISTINCT CVT.name, CVT.cvterm_id, CV.cv_id, CV.name
- FROM cvterm CVT
- LEFT JOIN cvterm_relationship CVTR ON CVT.cvterm_id = CVTR.subject_id
- INNER JOIN cvterm_relationship CVTR2 ON CVT.cvterm_id = CVTR2.object_id
- INNER JOIN cv CV on CV.cv_id = CVT.cv_id
- WHERE CVTR.subject_id is NULL and
- CVT.is_relationshiptype = 0 and CVT.is_obsolete = 0
- ";
- // Create the MView
- chado_add_mview($mv_name, 'tripal_chado', $schema, $sql, $comment, FALSE);
- }
|