print_r($identifiers, TRUE) ) ); } elseif (empty($identifiers)) { tripal_report_error( 'tripal_chado_api', TRIPAL_ERROR, "tripal_get_cv: You did not pass in anything to identify the cv you want. The identifier is expected to be an array with the key matching a column name in the cv table (ie: cv_id or name). You passed in %identifier.", array( '%identifier'=> print_r($identifiers, TRUE) ) ); } // Try to get the cv $cv = chado_generate_var( 'cv', $identifiers, $options ); // Ensure the cv is singular. If it's an array then it is not singular if (is_array($cv)) { tripal_report_error( 'tripal_chado_api', TRIPAL_ERROR, "tripal_get_cv: The identifiers you passed in were not unique. You passed in %identifier.", array( '%identifier'=> print_r($identifiers, TRUE) ) ); } // Report an error if $cv is FALSE since then chado_generate_var has failed elseif ($cv === FALSE) { tripal_report_error( 'tripal_chado_api', TRIPAL_ERROR, "tripal_get_cv: chado_generate_var() failed to return a cv based on the identifiers you passed in. You should check that your identifiers are correct, as well as, look for a chado_generate_var error for additional clues. You passed in %identifier.", array( '%identifier'=> print_r($identifiers, TRUE) ) ); } // Else, as far we know, everything is fine so give them their cv :) else { return $cv; } } /** * Create an options array to be used in a form element which provides a * list of all chado cvs * * @return * An array(cv_id => name) for each cv in the chado cv table * * @ingroup tripal_chado_api */ function tripal_get_cv_select_options() { $results = chado_select_record('cv', array('cv_id', 'name'), array(), array('order_by' => array('name' => 'ASC'))); $options = array(); $options[] = 'Select a Vocabulary'; foreach ($results as $r) { $options[$r->cv_id] = $r->name; } return $options; } /** * Retrieves a chado controlled vocabulary term variable * * @param $identifier * An array apropriate for use with the chado_generate_var for uniquely * identifying a cvterm record. Alternativley, there are also some specially * handled keys. They are: * - id: an ID for the term of the for [dbname]:[accession], where [dbname] * is the short name of the vocabulary and accession is the unique ID. * - cv_id: an integer indicating the cv_id or an array with 'name' => the * name of the cv. * - synonym: an array with 'name' => the name of the synonym of the cvterm * you want returned; 'cv_id' => the cv_id of the synonym; 'cv_name' => * the name of the cv of the synonym * - property: An array/object describing the property to select records * for. It should at least have either a type_name (if unique across cvs) * or type_id. Other supported keys include: cv_id/cv_name (of the type), * value and rank * @param $options * An array of options. Supported keys include: * - Any keys supported by chado_generate_var(). See that function * definition for additional details. * * NOTE: the $identifier parameter can really be any array similar to $values * passed into chado_select_record(). It should fully specify the cvterm * record to be returned. * * @return * If unique values were passed in as an identifier then an object describing * the cvterm will be returned (will be a chado variable from * chado_generate_var()). Otherwise, FALSE will be returned. * * @ingroup tripal_cv_api */ function tripal_get_cvterm($identifiers, $options = array()) { // Set Defaults if (!isset($options['include_fk'])) { // Tells chado_generate_var to only get the cv $options['include_fk'] = array('cv_id' => TRUE); } // Error Checking of parameters if (!is_array($identifiers)) { tripal_report_error('tripal_cv_api', TRIPAL_ERROR, "tripal_get_cvterm: The identifier passed in is expected to be an array with the key matching a column name in the cvterm table (ie: cvterm_id or name). You passed in %identifier.", array('%identifier'=> print_r($identifiers, TRUE)) ); } elseif (empty($identifiers)) { tripal_report_error('tripal_cv_api', TRIPAL_ERROR, "tripal_get_cvterm: You did not pass in anything to identify the cvterm you want. The identifier is expected to be an array with the key matching a column name in the cvterm table (ie: cvterm_id or name). You passed in %identifier.", array('%identifier'=> print_r($identifiers, TRUE)) ); } // If synonym was passed in, then process this first before calling chado_generate_var() if (isset($identifiers['synonym'])) { $synonym = $identifiers['synonym']['name']; $values = array('synonym' => $synonym); if (isset($identifiers['synonym']['cv_id'])) { $values['cvterm_id'] = array('cv_id' => $identifiers['synonym']['cv_id']); } if (isset($identifiers['synonym']['cv_name'])) { $values['cvterm_id'] = array('cv_id' => array('name' => $identifiers['synonym']['cv_name'])); } $options = array( 'case_insensitive_columns' => array('name') ); $result = chado_select_record('cvtermsynonym', array('cvterm_id'), $values, $options); // if the synonym doens't exist or more than one record is returned then return false if (count($result) == 0) { return FALSE; } if (count($result) > 1) { return FALSE; } $identifiers = array('cvterm_id' => $result[0]->cvterm_id); } // If one of the identifiers is property then use chado_get_record_with_property() if (isset($identifiers['property'])) { $property = $identifiers['property']; unset($identifiers['property']); $cvterm = chado_get_record_with_property( array('table' => 'cvterm', 'base_records' => $identifiers), array('type_name' => $property), $options ); } if (isset($identifiers['id'])) { list($db_name, $accession) = preg_split('/:/', $identifiers['id']); $cvterm = chado_generate_var('cvterm',array( 'dbxref_id' => array( 'db_id' => array( 'name' => $db_name, ), 'accession' => $accession, ) )); } // Else we have a simple case and we can just use chado_generate_var to get the cvterm else { // Try to get the cvterm $cvterm = chado_generate_var('cvterm', $identifiers, $options); } // Ensure the cvterm is singular. If it's an array then it is not singular if (is_array($cvterm)) { tripal_report_error( 'tripal_cv_api', TRIPAL_ERROR, "tripal_get_cvterm: The identifiers you passed in were not unique. You passed in %identifier.", array( '%identifier'=> print_r($identifiers, TRUE) ) ); } // Report an error if $cvterm is FALSE since then chado_generate_var has failed elseif ($cvterm === FALSE) { tripal_report_error( 'tripal_cv_api', TRIPAL_ERROR, "tripal_get_cvterm: chado_generate_var() failed to return a cvterm based on the identifiers you passed in. You should check that your identifiers are correct, as well as, look for a chado_generate_var error for additional clues. You passed in %identifier.", array( '%identifier'=> print_r($identifiers, TRUE) ) ); } // Else, as far we know, everything is fine so give them their cvterm :) else { return $cvterm; } } /** * Create an options array to be used in a form element * which provides a list of all chado cvterms * * @param $cv_id * The chado cv_id; only cvterms with the supplied cv_id will be returned * @param $rel_type * Set to TRUE if the terms returned should only be relationship types in * the vocabulary. This is useful for creating drop-downs of terms * used for relationship linker tables. * * @return * An associative array with the cvterm_id's as keys. The first * element in the array has a key of '0' and a value of 'Select a Type' * * @ingroup tripal_chado_api */ function tripal_get_cvterm_select_options($cv_id, $rel_type = FALSE) { $columns = array('cvterm_id', 'name'); $values = array('cv_id' => $cv_id); if ($rel_type) { $values['is_relationshiptype'] = 1; } $s_options = array('order_by' => array('name' => 'ASC')); $cvterms = chado_select_record('cvterm', $columns, $values, $s_options); $options = array(); $options[0] = 'Select a Type'; foreach ($cvterms as $cvterm) { $options[$cvterm->cvterm_id] = $cvterm->name; } return $options; } /** * Updates the cvtermpath table of Chado for the specified CV. * * @param $cv_id * The chado cv_id; * @param $job_id * This function is intended to be used with the Tripal Jobs API. * When this function is called as a job the $job_id is automatically * passed to this function. * @return * TRUE on success FALSE on failure * * @ingroup tripal_chado_api */ function tripal_update_cvtermpath($cv_id, $job_id = NULL) { // TODO: need better error checking in this function // first get the controlled vocabulary name: $sql = "SELECT * FROM {cv} WHERE cv_id = :cv_id"; $cv = chado_query($sql, array(':cv_id' => $cv_id))->fetchObject(); print "\nUpdating cvtermpath for $cv->name...\n"; // We need to set the chado schema as active because some of the // functions call other functions which would not be in scope. $previous = chado_set_active('chado'); try { $sql = "SELECT * FROM fill_cvtermpath(:name)"; db_query($sql, array(':name' => $cv->name)); chado_set_active($previous); } catch (Exception $e) { chado_set_active($previous); $error = $e->getMessage(); tripal_report_error('tripal_chado', TRIPAL_ERROR, "Could not fill cvtermpath table: @error", array('@error' => $error)); return FALSE; } return TRUE; } /** * Duplicate of fill_cvtermpath() stored procedure in Chado. * * Identifies all of the root terms of the controlled vocabulary. These * root terms are then processed by calling the * tripal_update_cvtermpath_root_loop() function on each one. * * @param $cvid * The controlled vocabulary ID from the cv table of Chado (i.e. cv.cv_id). * @param $job_id */ function tripal_update_cvtermpath_bak($cv_id, $job_id = NULL){ // TODO: there's a function to determine the current Chado instance. // we should use that. $prev_db = chado_set_active('chado'); try { $result = db_query(' SELECT DISTINCT t.* FROM cvterm t LEFT JOIN cvterm_relationship r ON (t.cvterm_id = r.subject_id) INNER JOIN cvterm_relationship r2 ON (t.cvterm_id = r2.object_id) WHERE t.cv_id = :cvid AND r.subject_id is null', array(':cvid' => $cv_id) ); // Iterate through each root level term. $record = $result->fetchAll(); $roots = array(); foreach ($record as $item){ tripal_update_cvtermpath_root_loop($item->cvterm_id, $item->cv_id, $roots); } } catch (Exception $e) { // If there's an exception we have to set the database back. So, do that // and then rethrow the error. chado_set_active($prev_db); throw $e; } chado_set_active($prev_db); } /** * Duplicate of _fill_cvtermpath4root() stored procedure in Chado. * * This function process a "branch" of the ontology. Initially, the * "root" starts at the top of the tree. But, as the cvtermpath is populated * the "root" becomes terms deeper in the tree. * * @param $rootid * The term ID from the cvterm table of Chado (i.e. cvterm.cvterm_id). * @param $cvid * The controlled vocabulary ID from the cv table of Chado (i.e. cv.cv_id). */ function tripal_update_cvtermpath_root_loop($rootid, $cvid, &$roots){ // Get's the cvterm record for this "root". $ttype = db_select('cvterm', 'cv') ->fields('cv', array('cvterm_id')); $db_or = db_or(); $db_or->condition('cv.name', "isa", '='); $db_or->condition('cv.name', "is_a", '='); $ttype->condition($db_or); $result = $ttype->execute()->fetchObject(); $term_id = $rootid . '|' . $rootid . '|' . $cvid . '|' . $result->cvterm_id; // If the child_id matches any other id in the array then we've hit a loop. foreach ($roots as $element_id) { if ($element_id == $term_id) { return; } } // Then add that new entry to the $tree_path. $roots[] = $term_id; // Descends through the branch starting at this "root" term. $visited = array(); $depth = 0; tripal_update_cvtermpath_loop($rootid, $rootid, $cvid, $result->cvterm_id, $depth, 0, $visited); // Get's the children terms of this "root" term and then recursively calls // this function making each child root. $cterm = db_query( 'SELECT * FROM cvterm_relationship WHERE object_id = :rootid ', array(':rootid' => $rootid) ); while($cterm_result = $cterm->fetchAssoc()) { tripal_update_cvtermpath_root_loop($cterm_result['subject_id'], $cvid, $roots); } } /** * * @param $origin * The root terms cvterm_id. * @param $child_id * The cvterm_id of the current child term. The child term is a descendent * of the origin. * @param $cv_id * The controlled vocabulary ID from the cv table of Chado (i.e. cv.cv_id). * @param $type_id * The relationship type between the origin term and the child. * @param $depth * The depth of the recursion. * @param $increment_of_depth. * An integer ?? * @param $tree_path. * The array of every term between the current child and the origin. Each * element in the array is an associative array with the keys: * -build_id: an string identifier for the child that combines the origin, * child cvterm_id,cv_id, and the type_id. * -depth: the depth that a child was inserted into the cvtermpath table. * @return multitype: */ $loop_data; function tripal_update_cvtermpath_loop($origin, $child_id, $cv_id, $type_id, $depth, $increment_of_depth, $tree_path){ // An array of global $loop_data; // Check to see if a row with these values already exists. chado_set_active('chado'); $count = db_query( 'SELECT * FROM cvtermpath WHERE cv_id = :cvid AND object_id = :origin AND subject_id = :child_id AND pathdistance = :depth ', array(':cvid' => $cv_id, ':origin' => $origin, ':child_id' => $child_id, ':depth' => $depth) ); $count_total = $count->rowCount(); // If we've already seen this term then just return, we don't want // to insert it again. if ($count_total > 0) { return $loop_data; } // Build the ID. $term_id = $origin . '|' . $child_id . '|' . $cv_id . '|' . $type_id; // Now check if the most recent entry already exists in the array. if ($increment_of_depth != 0 && empty($loop_data)) { // Search the $tree_path for the new $child_id in the build_id column. foreach ($tree_path as $parent) { // If this child is the same as a parent term that has already been // processed then we have a potential loop. if ($parent['build_id'] == $term_id) { // The loop checker function below. $result_of_loop_checker = tripal_update_cvtermpath_loop_checker($origin, $child_id, $cv_id, $type_id, $depth, $increment_of_depth, 0, $parent, array(), $depth); if (!empty($result_of_loop_checker)) { $loop_data = $result_of_loop_checker; //Find the depth of the loop start by finding it in the array_of_children foreach($tree_path as $children => $child){ if($child['build_id'] == $loop_data['build_id']){ $loop_location = $child['depth']; } } $array_loop_data = (array)$loop_data; $array_loop_data['depth'] = $loop_location; $loop_data = $array_loop_data; break; } } if (!empty($loop_data)) { return $loop_data; } } } // We have not detected a loop, so it's safe to insert the term. $query = db_insert('cvtermpath') ->fields([ 'object_id' => $origin, 'subject_id' => $child_id, 'cv_id' => $cv_id, 'type_id' => $type_id, 'pathdistance' => $depth, ]); $rows = $query->execute(); // Then add that new entry to the $tree_path. $tree_path[$increment_of_depth] = [ 'build_id' => $term_id, 'depth' => $depth ]; // Get all of the relationships of this child term, and recursively // call the tripal_update_cvtermpath_loop() function to continue // descending down the tree. $query = db_select('cvterm_relationship', 'cvtr') ->fields('cvtr') ->condition('cvtr.object_id', $child_id, '=') ->execute(); $cterm_relationships = $query->fetchAll(); foreach ($cterm_relationships as $item) { if (!empty($loop_data)) { if ($loop_data['depth'] < $depth) { break; } elseif ($loop_data['depth'] > $depth) { $loop_data = NULL; break; } } else { $increment_of_depth++; tripal_update_cvtermpath_loop($origin, $item->subject_id, $cv_id, $item->type_id, $depth + 1, $increment_of_depth, $tree_path); } } } /** * @param $origin * @param $child_id * @param $cv_id * @param $type_id * @param $depth * @param $increment_of_depth * @param $distance_between_parent_child * @param $possible_start_of_loop * @param $array_of_possible_loop * @param $depth_at_start_of_loop * * @return bool */ function tripal_update_cvtermpath_loop_checker($origin, $child_id, $cv_id, $type_id, $depth, $increment_of_depth, $distance_between_parent_child, $possible_start_of_loop, $array_of_possible_loop, $depth_at_start_of_loop){ // Find the child terms of the current term via the relationship taboe. chado_set_active('chado'); $query = db_select('cvterm_relationship', 'cvtr') ->fields('cvtr') ->condition('cvtr.object_id', $child_id, '=') ->execute(); $cterm_relationships = $query->fetchAll(); // Iterate through the child terms via the relationships. foreach ($cterm_relationships as $item){ // Search the $tree_path for the new $child_id in the build_id column. foreach ($array_of_possible_loop as $parent) { if ($parent['build_id'] === $possible_start_of_loop['build_id']) { // If the search returns something check for a possible loop. if (!empty($parent)) { $result = tripal_update_cvtermpath_loop_checker_traverse($origin, $child_id, $cv_id, $type_id, $depth, $increment_of_depth, $possible_start_of_loop, $array_of_possible_loop, array(), 0); if(!empty($result)){ break 2; } } } } $increment_of_depth++; $distance_between_parent_child++; $child_id = $origin . '|' . $item->subject_id . '|' . $cv_id . '|' . $item->type_id; $array_of_possible_loop[$distance_between_parent_child] = ['build_id' => $child_id]; $result = tripal_update_cvtermpath_loop_checker($origin, $item->subject_id, $cv_id, $item->type_id, $depth + 1, $increment_of_depth, $distance_between_parent_child, $possible_start_of_loop, $array_of_possible_loop, $depth_at_start_of_loop); if($result !== FALSE){ return $result; } } if (!empty($result)) { return $result; } else { return FALSE; } } function tripal_update_cvtermpath_loop_checker_traverse($origin, $child_id, $cv_id, $type_id, $depth, $increment_of_depth, $possible_start_of_loop, $array_of_possible_loop, $traverse_of_loop, $increment) { //watchdog('debug', '
$increment: '. print_r($increment, TRUE) .''); /*if ($increment > 10) { die(); }*/ chado_set_active('chado'); $query = db_select('cvterm_relationship', 'cvtr') ->fields('cvtr') ->condition('cvtr.object_id', $child_id, '=') ->execute(); $cterm = $query->fetchAll(); foreach ($cterm as $item) { if ($array_of_possible_loop === $traverse_of_loop) { watchdog('debug', 'LOOP'); //Report the loop. $loop_found = end($array_of_possible_loop); break; } elseif ($array_of_possible_loop != $traverse_of_loop) { $increment_of_depth++; $increment++; $child_id = $origin . '|' . $item->subject_id . '|' . $cv_id . '|' . $item->type_id; $traverse_of_loop[$increment] = ['build_id' => $child_id]; $result = tripal_update_cvtermpath_loop_checker_traverse($origin, $item->subject_id, $cv_id, $item->type_id, $depth + 1, $increment_of_depth, $possible_start_of_loop, $array_of_possible_loop, $traverse_of_loop, $increment); if ($result !== FALSE) { return $result; } } } if ($loop_found) { return $loop_found; } else { return FALSE; } } /* * * @param $origin * @param $subject_id * @param $cv_idxkcd * @param $type_id * @param $depth * @return multitype: function tripal_update_cvtermpath_loop($origin, $child_id, $cv_id, $type_id, $depth){ // Variables and arrays needed for loop checking. $tree_path; $array_of_possible_loop; $possible_start_of_loop; $distance_between_parent_child; $increment_of_depth; chado_set_active('chado'); $count = db_query( 'SELECT * FROM cvtermpath WHERE cv_id = :cvid AND object_id = :origin AND subject_id = :child_id AND pathdistance = :depth ', array(':cvid' => $cv_id, ':origin' => $origin, ':child_id' => $child_id, ':depth' => $depth) ); $count_total = $count->rowCount(); //Loop check chado_set_active('chado'); $loop = db_query( 'SELECT * FROM cvtermpath WHERE cv_id = :cvid AND object_id = :origin AND subject_id = :child_id AND type_id = :type_id ', array(':cvid' => $cv_id, ':origin' => $origin, ':child_id' => $child_id, ':type_id' => $type_id,) ); $loop_check = $loop->rowCount(); //watchdog('debug', '
tripal_ds_preprocess_TripalEntity $rows ' . print_r($rows, TRUE) . ''); /*if(!empty($rows)){ foreach($rows as $row){ tripal_update_cvtermpath_loop_check($origin, $child_id, $cv_id, $type_id, $depth, $row->cvtermpath_id, 0); } } else {*/ //If no loop proceed. /*try{ if($count_total == 0) { chado_set_active('chado'); $query = db_insert('cvtermpath') ->fields(array( 'object_id' => $origin, 'subject_id' => $child_id, 'cv_id' => $cv_id, 'type_id' => $type_id, 'pathdistance' => $depth, )); $rows = $query->execute(); } if ($loop_check == 0) { chado_set_active('chado'); $query = db_select('cvterm_relationship', 'cvtr') ->fields('cvtr') ->condition('cvtr.object_id', $child_id, '=') ->execute(); $cterm = $query->fetchAll(); foreach ($cterm as $item) { //watchdog('debug', '
tripal_ds_preprocess_TripalEntity $item ' . print_r($item, TRUE) . ''); tripal_update_cvtermpath_loop($origin, $item->subject_id, $cv_id, $item->type_id, $depth + 1); }; //} } } catch(Exception $e){ watchdog_exception('tripal_ds', $e); return FALSE; } return 1; } */ /** * * @param $origin * @param $subject_id * @param $cv_id * @param $type_id * @param $depth * @return multitype: function tripal_update_cvtermpath_loop_check($origin, $child_id, $cv_id, $type_id, $depth, $cvtermpath_id, $loop_count, $loop_check, $object_id){ //Store the //Check if the passed parameters match any of the items in the loop_check array. if(!empty($loop_check)){ foreach($loop_check as $item){ if ($item['type_id'] = $type_id){ if($item['subject_id'] = $child_id){ if($item['object_id'] = $object_id){ //Loop found, roll back all rows until $cvtermpath_id-1 (last correct entry) // and step into the next loop } } } } } $loop_count + 1; chado_set_active('chado'); $count = db_query( 'SELECT * FROM cvtermpath WHERE cv_id = :cvid AND object_id = :origin AND subject_id = :child_id AND pathdistance = :depth ', array(':cvid' => $cv_id, ':origin' => $origin, ':child_id' => $child_id, ':depth' => $depth) ); $count_total = $count->rowCount(); if ($count_total == 0) { chado_set_active('chado'); $query = db_insert('cvtermpath') ->fields(array( 'object_id' => $origin, 'subject_id' => $child_id, 'cv_id' => $cv_id, 'type_id' => $type_id, 'pathdistance' => $depth, )); $rows = $query->execute(); $cterm = array(); $query = db_select('cvterm_relationship', 'cvtr') ->fields('cvtr') ->condition('cvtr.object_id', $child_id, '=' ) ->execute(); $cterm = $query->fetchAll(); foreach ($cterm as $item) { $loop_check[$loop_count]= $item; tripal_update_cvtermpath_loop_check($origin, $item->subject_id, $cv_id, $item->type_id, $depth + 1, $loop_count, $loop_check, $item->object_id); }; } return 1; } */ /** * Adds a controlled vocabular to the CV table of Chado. * * @param $name * The name of the controlled vocabulary. These are typically all lower case * with no special characters other than an undrescore (for spaces). * @param $comment * A description or definition of the vocabulary. * * @return * An object populated with fields from the newly added database. * * @ingroup tripal_chado_api */ function tripal_insert_cv($name, $definition) { // insert/update values $ins_values = array( 'name' => $name, 'definition' => $definition ); // see if the CV default exists already in the database $sel_values = array('name' => $name); $results = chado_select_record('cv', array('*'), $sel_values); // if it does not exists then add it if (count($results) == 0) { $success = chado_insert_record('cv', $ins_values); if (!$success) { tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to create the CV record", NULL); return FALSE; } $results = chado_select_record('cv', array('*'), $sel_values); } // if it already exists then do an update else { $success = chado_update_record('cv', $sel_values, $ins_values); if (!$success) { tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to update the CV record", NULL); return FALSE; } $results = chado_select_record('cv', array('*'), $sel_values); } // return the cv object return $results[0]; } /** * Add's a controlled vocabulary term to Chado. * * This function will add a cvterm record (and a dbxref record if appropriate * values are provided). If the parent vocabulary does not exist then * that also is added to the cv table. If the cvterm is a relationship term * then the 'is_relationship' value should be set. All * terms must also have a corresponding database. This is specified in the * term's ID just before the colon (e.g. GO:003824). If the database does not * exist in the DB table then it will be added automatically. The accession * (the value just after the colon in the term's ID) will be added to the * dbxref table. If the CVterm already exists and $update is set (default) * then the cvterm is updated. If the CVTerm already exists and $update is * not set, then no changes are made and the CVTerm object is returned. * * @param $term * An associative array with the following keys: * - id: the term accession. must be of the form