'tripal_gff_temp', 'fields' => [ 'feature_id' => [ 'type' => 'int', 'not null' => TRUE, ], 'organism_id' => [ 'type' => 'int', 'not null' => TRUE, ], 'uniquename' => [ 'type' => 'text', 'not null' => TRUE, ], 'type_name' => [ 'type' => 'varchar', 'length' => '1024', 'not null' => TRUE, ], ], 'indexes' => [ 'tripal_gff_temp_idx0' => ['feature_id'], 'tripal_gff_temp_idx0' => ['organism_id'], 'tripal_gff_temp_idx1' => ['uniquename'], ], 'unique keys' => [ 'tripal_gff_temp_uq0' => ['feature_id'], 'tripal_gff_temp_uq1' => ['uniquename', 'organism_id', 'type_name'], ], ]; chado_create_custom_table('tripal_gff_temp', $schema, TRUE, NULL, FALSE); } /** * */ function tripal_chado_add_tripal_gffcds_temp_table() { $schema = [ 'table' => 'tripal_gffcds_temp', 'fields' => [ 'feature_id' => [ 'type' => 'int', 'not null' => TRUE, ], 'parent_id' => [ 'type' => 'int', 'not null' => TRUE, ], 'phase' => [ 'type' => 'int', 'not null' => FALSE, ], 'strand' => [ 'type' => 'int', 'not null' => TRUE, ], 'fmin' => [ 'type' => 'int', 'not null' => TRUE, ], 'fmax' => [ 'type' => 'int', 'not null' => TRUE, ], ], 'indexes' => [ 'tripal_gff_temp_idx0' => ['feature_id'], 'tripal_gff_temp_idx0' => ['parent_id'], ], ]; chado_create_custom_table('tripal_gffcds_temp', $schema, TRUE, NULL, FALSE); } /** * */ function tripal_chado_add_tripal_gffprotein_temp_table() { $schema = [ 'table' => 'tripal_gffprotein_temp', 'fields' => [ 'feature_id' => [ 'type' => 'int', 'not null' => TRUE, ], 'parent_id' => [ 'type' => 'int', 'not null' => TRUE, ], 'fmin' => [ 'type' => 'int', 'not null' => TRUE, ], 'fmax' => [ 'type' => 'int', 'not null' => TRUE, ], ], 'indexes' => [ 'tripal_gff_temp_idx0' => ['feature_id'], 'tripal_gff_temp_idx0' => ['parent_id'], ], 'unique keys' => [ 'tripal_gff_temp_uq0' => ['feature_id'], ], ]; chado_create_custom_table('tripal_gffprotein_temp', $schema, TRUE, NULL, FALSE); } /** * Creates a temporary table to store obo details while loading an obo file * */ function tripal_chado_add_tripal_obo_temp_table() { // the tripal_obo_temp table is used for temporary housing of records when loading OBO files // we create it here using plain SQL because we want it to be in the chado schema but we // do not want to use the Tripal Custom Table API because we don't want it to appear in the // list of custom tables. It needs to be available for the Tripal Chado API so we create it // here and then define it in the tripal_cv/api/tripal_cv.schema.api.inc if (!chado_table_exists('tripal_obo_temp')) { $sql = " CREATE TABLE {tripal_obo_temp} ( id character varying(255) NOT NULL, stanza text NOT NULL, type character varying(50) NOT NULL, CONSTRAINT tripal_obo_temp_uq0 UNIQUE (id) ); "; chado_query($sql); $sql = "CREATE INDEX tripal_obo_temp_idx0 ON {tripal_obo_temp} USING btree (id)"; chado_query($sql); $sql = "CREATE INDEX tripal_obo_temp_idx1 ON {tripal_obo_temp} USING btree (type)"; chado_query($sql); } } /** * Creates a materialized view that stores the type & number of stocks per * organism * * @ingroup tripal_stock */ function tripal_chado_add_organism_stock_count_mview() { $view_name = 'organism_stock_count'; $comment = 'Stores the type and number of stocks per organism'; $schema = [ 'description' => $comment, 'table' => $view_name, 'fields' => [ 'organism_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], 'genus' => [ 'type' => 'varchar', 'length' => '255', 'not null' => TRUE, ], 'species' => [ 'type' => 'varchar', 'length' => '255', 'not null' => TRUE, ], 'common_name' => [ 'type' => 'varchar', 'length' => '255', 'not null' => FALSE, ], 'num_stocks' => [ 'type' => 'int', 'not null' => TRUE, ], 'cvterm_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], 'stock_type' => [ 'type' => 'varchar', 'length' => '255', 'not null' => TRUE, ], ], 'indexes' => [ 'organism_stock_count_idx1' => ['organism_id'], 'organism_stock_count_idx2' => ['cvterm_id'], 'organism_stock_count_idx3' => ['stock_type'], ], ]; $sql = " SELECT O.organism_id, O.genus, O.species, O.common_name, count(S.stock_id) as num_stocks, CVT.cvterm_id, CVT.name as stock_type FROM organism O INNER JOIN stock S ON O.Organism_id = S.organism_id INNER JOIN cvterm CVT ON S.type_id = CVT.cvterm_id GROUP BY O.Organism_id, O.genus, O.species, O.common_name, CVT.cvterm_id, CVT.name "; chado_add_mview($view_name, 'tripal_stock', $schema, $sql, $comment, FALSE); } /** * Adds a materialized view keeping track of the type of features associated * with each library * * @ingroup tripal_library */ function tripal_chado_add_library_feature_count_mview() { $view_name = 'library_feature_count'; $comment = 'Provides count of feature by type that are associated with all libraries'; $schema = [ 'table' => $view_name, 'description' => $comment, 'fields' => [ 'library_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], 'name' => [ 'type' => 'varchar', 'length' => 255, 'not null' => TRUE, ], 'num_features' => [ 'type' => 'int', 'not null' => TRUE, ], 'feature_type' => [ 'type' => 'varchar', 'length' => 255, 'not null' => TRUE, ], ], 'indexes' => [ 'library_feature_count_idx1' => ['library_id'], ], ]; $sql = " SELECT L.library_id, L.name, count(F.feature_id) as num_features, CVT.name as feature_type FROM library L INNER JOIN library_feature LF ON LF.library_id = L.library_id INNER JOIN feature F ON LF.feature_id = F.feature_id INNER JOIN cvterm CVT ON F.type_id = CVT.cvterm_id GROUP BY L.library_id, L.name, CVT.name "; chado_add_mview($view_name, 'tripal_library', $schema, $sql, $comment, FALSE); } /** * */ /** * Creates a materialized view that stores the type & number of features per * organism * * @ingroup tripal_feature */ function tripal_chado_add_organism_feature_count_mview() { $view_name = 'organism_feature_count'; $comment = 'Stores the type and number of features per organism'; $schema = [ 'description' => $comment, 'table' => $view_name, 'fields' => [ 'organism_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], 'genus' => [ 'type' => 'varchar', 'length' => '255', 'not null' => TRUE, ], 'species' => [ 'type' => 'varchar', 'length' => '255', 'not null' => TRUE, ], 'common_name' => [ 'type' => 'varchar', 'length' => '255', 'not null' => FALSE, ], 'num_features' => [ 'type' => 'int', 'not null' => TRUE, ], 'cvterm_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], 'feature_type' => [ 'type' => 'varchar', 'length' => '255', 'not null' => TRUE, ], ], 'indexes' => [ 'organism_feature_count_idx1' => ['organism_id'], 'organism_feature_count_idx2' => ['cvterm_id'], 'organism_feature_count_idx3' => ['feature_type'], ], ]; $sql = " SELECT O.organism_id, O.genus, O.species, O.common_name, count(F.feature_id) as num_features, CVT.cvterm_id, CVT.name as feature_type FROM organism O INNER JOIN feature F ON O.Organism_id = F.organism_id INNER JOIN cvterm CVT ON F.type_id = CVT.cvterm_id GROUP BY O.Organism_id, O.genus, O.species, O.common_name, CVT.cvterm_id, CVT.name "; chado_add_mview($view_name, 'tripal_feature', $schema, $sql, $comment, FALSE); } /** * Creates a view showing the link between an organism & it's analysis through * associated features. * */ function tripal_chado_add_analysis_organism_mview() { $view_name = 'analysis_organism'; $comment = t('This view is for associating an organism (via it\'s associated features) to an analysis.'); // this is the SQL used to identify the organism to which an analsysis // has been used. This is obtained though the analysisfeature -> feature -> organism // joins $sql = " SELECT DISTINCT A.analysis_id, O.organism_id FROM analysis A INNER JOIN analysisfeature AF ON A.analysis_id = AF.analysis_id INNER JOIN feature F ON AF.feature_id = F.feature_id INNER JOIN organism O ON O.organism_id = F.organism_id "; // the schema array for describing this view $schema = [ 'table' => $view_name, 'description' => $comment, 'fields' => [ 'analysis_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], 'organism_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], ], 'indexes' => [ 'networkmod_qtl_indx0' => ['analysis_id'], 'networkmod_qtl_indx1' => ['organism_id'], ], 'foreign keys' => [ 'analysis' => [ 'table' => 'analysis', 'columns' => [ 'analysis_id' => 'analysis_id', ], ], 'organism' => [ 'table' => 'organism', 'columns' => [ 'organism_id' => 'organism_id', ], ], ], ]; // add the view chado_add_mview($view_name, 'tripal_analysis', $schema, $sql, $comment, FALSE); } /** * Add a materialized view that maps cv to db records. * * This is needed for viewing cv trees * */ function tripal_chado_add_db2cv_mview_mview() { $mv_name = 'db2cv_mview'; $comment = 'A table for quick lookup of the vocabularies and the databases they are associated with.'; $schema = [ 'table' => $mv_name, 'description' => $comment, 'fields' => [ 'cv_id' => [ 'type' => 'int', 'not null' => TRUE, ], 'cvname' => [ 'type' => 'varchar', 'length' => '255', 'not null' => TRUE, ], 'db_id' => [ 'type' => 'int', 'not null' => TRUE, ], 'dbname' => [ 'type' => 'varchar', 'length' => '255', 'not null' => TRUE, ], 'num_terms' => [ 'type' => 'int', 'not null' => TRUE, ], ], 'indexes' => [ 'cv_id_idx' => ['cv_id'], 'cvname_idx' => ['cvname'], 'db_id_idx' => ['db_id'], 'dbname_idx' => ['db_id'], ], ]; $sql = " SELECT DISTINCT CV.cv_id, CV.name as cvname, DB.db_id, DB.name as dbname, COUNT(CVT.cvterm_id) as num_terms FROM cv CV INNER JOIN cvterm CVT on CVT.cv_id = CV.cv_id INNER JOIN dbxref DBX on DBX.dbxref_id = CVT.dbxref_id INNER JOIN db DB on DB.db_id = DBX.db_id WHERE CVT.is_relationshiptype = 0 and CVT.is_obsolete = 0 GROUP BY CV.cv_id, CV.name, DB.db_id, DB.name ORDER BY DB.name "; // Create the MView chado_add_mview($mv_name, 'tripal_chado', $schema, $sql, $comment, FALSE); } /** * Add a materialized view of root terms for all chado cvs. * * This is needed for viewing cv trees * */ function tripal_chado_add_cv_root_mview_mview() { $mv_name = 'cv_root_mview'; $comment = 'A list of the root terms for all controlled vocabularies. This is needed for viewing CV trees'; $schema = [ 'table' => $mv_name, 'description' => $comment, 'fields' => [ 'name' => [ 'type' => 'varchar', 'length' => 255, 'not null' => TRUE, ], 'cvterm_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], 'cv_id' => [ 'size' => 'big', 'type' => 'int', 'not null' => TRUE, ], 'cv_name' => [ 'type' => 'varchar', 'length' => 255, 'not null' => TRUE, ], ], 'indexes' => [ 'cv_root_mview_indx1' => ['cvterm_id'], 'cv_root_mview_indx2' => ['cv_id'], ], ]; $sql = " SELECT DISTINCT CVT.name, CVT.cvterm_id, CV.cv_id, CV.name FROM cvterm CVT LEFT JOIN cvterm_relationship CVTR ON CVT.cvterm_id = CVTR.subject_id INNER JOIN cvterm_relationship CVTR2 ON CVT.cvterm_id = CVTR2.object_id INNER JOIN cv CV on CV.cv_id = CVT.cv_id WHERE CVTR.subject_id is NULL and CVT.is_relationshiptype = 0 and CVT.is_obsolete = 0 "; // Create the MView chado_add_mview($mv_name, 'tripal_chado', $schema, $sql, $comment, FALSE); }