| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432 | 
							- <?php
 
- /**
 
-  * Publishes content in Chado as a new TripalEntity entity.
 
-  *
 
-  * @param $values
 
-  *   A key/value associative array that supports the following keys:
 
-  *   - bundle_name:  The name of the the TripalBundle (e.g. bio_data-12345).
 
-  * @param $job_id
 
-  *   (Optional) The numeric job ID as provided by the Tripal jobs system. There
 
-  *   is no need to specify this argument if this function is being called
 
-  *   outside of the jobs systems.
 
-  *
 
-  * @return boolean
 
-  *   TRUE if all of the records of the given bundle type were published, and
 
-  *   FALSE if a failure occured.
 
-  */
 
- function tripal_chado_publish_records($values, $job_id = NULL) {
 
-   // We want the job object in order to report progress.
 
-   if (is_object($job_id)) {
 
-     $job = $job_id;
 
-   }
 
-   if (is_numeric($job_id)) {
 
-     $job = new TripalJob();
 
-     $job->load($job_id);
 
-   }
 
-   $report_progress = FALSE;
 
-   if (is_object($job)) {
 
-     $report_progress = TRUE;
 
-   }
 
-   // Make sure we have the required options: bundle_name.
 
-   if (!array_key_exists('bundle_name', $values) or !$values['bundle_name']) {
 
-     tripal_report_error('tripal_chado', TRIPAL_ERROR,
 
-       "Could not publish record: @error",
 
-       array('@error' => 'The bundle name must be provided'));
 
-     return FALSE;
 
-   }
 
-   // Get the incoming arguments from the $values array.
 
-   $bundle_name = $values['bundle_name'];
 
-   $filters = array_key_exists('filters', $values) ? $values['filters'] : array();
 
-   $sync_node = array_key_exists('sync_node', $values) ? $values['sync_node'] : '';
 
-   // Load the bundle entity so we can get information about which Chado
 
-   // table/field this entity belongs to.
 
-   $bundle = tripal_load_bundle_entity(array('name' => $bundle_name));
 
-   if (!$bundle) {
 
-     tripal_report_error('tripal_chado', TRIPAL_ERROR,
 
-         "Unknown bundle. Could not publish record: @error",
 
-         array('@error' => 'The bundle name must be provided'));
 
-     return FALSE;
 
-   }
 
-   $chado_entity_table = chado_get_bundle_entity_table($bundle);
 
-   // Get the mapping of the bio data type to the Chado table.
 
-   $chado_bundle = db_select('chado_bundle', 'cb')
 
-     ->fields('cb')
 
-     ->condition('bundle_id', $bundle->id)
 
-     ->execute()
 
-     ->fetchObject();
 
-   if(!$chado_bundle) {
 
-     tripal_report_error('tripal_chado', TRIPAL_ERROR,
 
-         "Cannot find mapping of bundle to Chado tables. Could not publish record.");
 
-     return FALSE;
 
-   }
 
-   $table = $chado_bundle->data_table;
 
-   $type_column = $chado_bundle->type_column;
 
-   $type_linker_table = $chado_bundle->type_linker_table;
 
-   $cvterm_id  = $chado_bundle->type_id;
 
-   $type_value = $chado_bundle->type_value;
 
-   // Get the table information for the Chado table.
 
-   $table_schema = chado_get_schema($table);
 
-   $pkey_field = $table_schema['primary key'][0];
 
-   // Construct the SQL for identifying which records should be published.
 
-   $args = array();
 
-   $select = "SELECT T.$pkey_field as record_id ";
 
-   $from = "
 
-     FROM {" . $table . "} T
 
-       LEFT JOIN [" . $chado_entity_table . "] CE on CE.record_id = T.$pkey_field
 
-   ";
 
-   // For migration of Tripal v2 nodes to entities we want to include the
 
-   // coresponding chado linker table.
 
-   if ($sync_node && db_table_exists('chado_' . $table)) {
 
-     $select = "SELECT T.$pkey_field as record_id, CT.nid ";
 
-     $from .= " INNER JOIN [chado_" . $table . "] CT ON CT.$pkey_field = T.$pkey_field";
 
-   }
 
-   $where = " WHERE CE.record_id IS NULL ";
 
-   // Handle records that are mapped to property tables.
 
-   if ($type_linker_table and $type_column and $type_value) {
 
-     $propschema = chado_get_schema($type_linker_table);
 
-     $fkeys = $propschema['foreign keys'][$table]['columns'];
 
-     foreach ($fkeys as $leftkey => $rightkey) {
 
-       if ($rightkey == $pkey_field) {
 
-         $from .= " INNER JOIN {" . $type_linker_table . "} LT ON T.$pkey_field = LT.$leftkey ";
 
-       }
 
-     }
 
-     $where .= "AND LT.$type_column = :cvterm_id and LT.value = :prop_value";
 
-     $args[':cvterm_id'] = $cvterm_id;
 
-     $args[':prop_value'] = $type_value;
 
-   }
 
-   // Handle records that are mapped to cvterm linking tables.
 
-   if ($type_linker_table and $type_column and !$type_value) {
 
-     $cvtschema = chado_get_schema($type_linker_table);
 
-     $fkeys = $cvtschema['foreign keys'][$table]['columns'];
 
-     foreach ($fkeys as $leftkey => $rightkey) {
 
-       if ($rightkey == $pkey_field) {
 
-         $from .= " INNER JOIN {" . $type_linker_table . "} LT ON T.$pkey_field = LT.$leftkey ";
 
-       }
 
-     }
 
-     $where .= "AND LT.$type_column = :cvterm_id";
 
-     $args[':cvterm_id'] = $cvterm_id;
 
-   }
 
-   // Handle records that are mapped via a type_id column in the base table.
 
-   if (!$type_linker_table and $type_column) {
 
-     $where .= "AND T.$type_column = :cvterm_id";
 
-     $args[':cvterm_id'] = $cvterm_id;
 
-   }
 
-   // Handle the case where records are in the cvterm table and mapped via a single
 
-   // vocab.  Here we use the type_value for the cv_id.
 
-   if ($table == 'cvterm' and $type_value) {
 
-     $where .= "AND T.cv_id = :cv_id";
 
-     $args[':cv_id'] = $type_value;
 
-   }
 
-   // Handle the case where records are in the cvterm table but we want to
 
-   // use all of the child terms.
 
-   if ($table == 'cvterm' and !$type_value) {
 
-     $where .= "AND T.cvterm_id IN (
 
-        SELECT CVTP.subject_id
 
-        FROM {cvtermpath} CVTP
 
-        WHERE CVTP.object_id = :cvterm_id)
 
-      ";
 
-     $args[':cvterm_id'] = $cvterm_id;
 
-   }
 
-   // Now add in any additional filters
 
-   $fields = field_info_field_map();
 
-   foreach ($fields as $field_name => $details) {
 
-     if (array_key_exists('TripalEntity', $details['bundles']) and
 
-         in_array($bundle_name, $details['bundles']['TripalEntity']) and
 
-         in_array($field_name, array_keys($filters))){
 
-       $instance = field_info_instance('TripalEntity', $field_name, $bundle_name);
 
-       $chado_table = $instance['settings']['chado_table'];
 
-       $chado_column = $instance['settings']['chado_column'];
 
-       if ($chado_table == $table) {
 
-         $where .= " AND T.$chado_column = :$field_name";
 
-         $args[":$field_name"] = $filters[$field_name];
 
-       }
 
-     }
 
-   }
 
-   // First get the count
 
-   $sql = "SELECT count(*) as num_records " . $from . $where;
 
-   $result = chado_query($sql, $args);
 
-   $count = $result->fetchField();
 
-   // calculate the interval for updates
 
-   $interval = intval($count / 50);
 
-   if ($interval < 1) {
 
-     $interval = 1;
 
-   }
 
-   // Perform the query.
 
-   $sql = $select . $from . $where;
 
-   $records = chado_query($sql, $args);
 
-   $transaction = db_transaction();
 
-   print "\nNOTE: publishing records is performed using a database transaction. \n" .
 
-       "If the load fails or is terminated prematurely then the entire set of \n" .
 
-       "is rolled back with no changes to the database\n\n";
 
-   $i = 0;
 
-   printf("%d of %d records. (%0.2f%%) Memory: %s bytes\r", $i, $count, 0, number_format(memory_get_usage()));
 
-   try {
 
-     while($record = $records->fetchObject()) {
 
-       // update the job status every interval
 
-       if ($i % $interval == 0) {
 
-         $complete = ($i / $count) * 33.33333333;
 
-         // Currently don't support setting job progress within a transaction.
 
-         // if ($report_progress) { $job->setProgress(intval($complete * 3)); }
 
-         printf("%d of %d records. (%0.2f%%) Memory: %s bytes\r", $i, $count, $complete * 3, number_format(memory_get_usage()));
 
-       }
 
-       // First save the tripal_entity record.
 
-       $record_id = $record->record_id;
 
-       $ec = entity_get_controller('TripalEntity');
 
-       $entity = $ec->create(array(
 
-         'bundle' => $bundle_name,
 
-         'term_id' => $bundle->term_id,
 
-         // Add in the Chado details for when the hook_entity_create()
 
-         // is called and our tripal_chado_entity_create() implementation
 
-         // can deal with it.
 
-         'chado_record' => chado_generate_var($table, array($pkey_field => $record_id)),
 
-         'chado_record_id' => $record_id,
 
-       ));
 
-       $entity = $entity->save();
 
-       if (!$entity) {
 
-         throw new Exception('Could not create entity.');
 
-       }
 
-       // Next save the chado entity record.
 
-       $entity_record = array(
 
-         'entity_id' => $entity->id,
 
-         'record_id' => $record_id,
 
-       );
 
-       // For the Tv2 to Tv3 migration we want to add the nid to the
 
-       // entity so we can associate the node with the entity.
 
-       if (property_exists($record, 'nid')) {
 
-         $entity_record['nid'] = $record->nid;
 
-       }
 
-       $result = db_insert($chado_entity_table)
 
-         ->fields($entity_record)
 
-         ->execute();
 
-       if(!$result){
 
-         throw new Exception('Could not create mapping of entity to Chado record.');
 
-       }
 
-       $i++;
 
-     }
 
-   }
 
-   catch (Exception $e) {
 
-     $transaction->rollback();
 
-     $error = $e->getMessage();
 
-     tripal_report_error('tripal_chado', TRIPAL_ERROR, "Could not publish record: @error", array('@error' => $error));
 
-     drupal_set_message('Failed publishing record. See recent logs for more details.', 'error');
 
-     return FALSE;
 
-   }
 
-   drupal_set_message("Succesfully published $i " . $bundle->label . " record(s).");
 
-   return TRUE;
 
- }
 
- /**
 
-  * Returns an array of tokens based on Tripal Entity Fields.
 
-  *
 
-  * @param $base_table
 
-  *    The name of a base table in Chado.
 
-  * @return
 
-  *    An array of tokens where the key is the machine_name of the token.
 
-  */
 
- function tripal_get_chado_tokens($base_table) {
 
-   $tokens = array();
 
-   $table_descrip = chado_get_schema($base_table);
 
-   foreach ($table_descrip['fields'] as $field_name => $field_details) {
 
-     $token = '[' . $base_table . '.' . $field_name . ']';
 
-     $location = implode(' > ',array($base_table, $field_name));
 
-     $tokens[$token] = array(
 
-       'name' => ucwords(str_replace('_',' ',$base_table)) . ': ' . ucwords(str_replace('_',' ',$field_name)),
 
-       'table' => $base_table,
 
-       'field' => $field_name,
 
-       'token' => $token,
 
-       'description' => array_key_exists('description', $field_details) ? $field_details['description'] : '',
 
-       'location' => $location
 
-     );
 
-     if (!array_key_exists('description', $field_details) or preg_match('/TODO/',$field_details['description'])) {
 
-       $tokens[$token]['description'] = 'The '.$field_name.' field of the '.$base_table.' table.';
 
-     }
 
-   }
 
-   // RECURSION:
 
-   // Follow the foreign key relationships recursively
 
-   if (array_key_exists('foreign keys', $table_descrip)) {
 
-     foreach ($table_descrip['foreign keys'] as $table => $details) {
 
-       foreach ($details['columns'] as $left_field => $right_field) {
 
-         $sub_token_prefix = $base_table . '.' . $left_field;
 
-         $sub_location_prefix = implode(' > ',array($base_table, $left_field));
 
-         $sub_tokens = tripal_get_chado_tokens($table);
 
-         if (is_array($sub_tokens)) {
 
-           $tokens = array_merge($tokens, $sub_tokens);
 
-         }
 
-       }
 
-     }
 
-   }
 
-   return $tokens;
 
- }
 
- /**
 
-  * Replace all Chado Tokens in a given string.
 
-  *
 
-  * NOTE: If there is no value for a token then the token is removed.
 
-  *
 
-  * @param string $string
 
-  *   The string containing tokens.
 
-  * @param $record
 
-  *   A Chado record as generated by chado_generate_var()
 
-  *
 
-  * @return
 
-  *   The string will all tokens replaced with values.
 
-  */
 
- function tripal_replace_chado_tokens($string, $record) {
 
-   // Get the list of tokens
 
-   $tokens = tripal_get_chado_tokens($record->tablename);
 
-   // Determine which tokens were used in the format string
 
-   if (preg_match_all('/\[[^]]+\]/', $string, $used_tokens)) {
 
-     // Get the value for each token used
 
-     foreach ($used_tokens[0] as $token) {
 
-       $token_info = $tokens[$token];
 
-       if (!empty($token_info)) {
 
-         $table = $token_info['table'];
 
-         $var = $record;
 
-         $value = '';
 
-         // Iterate through each portion of the location string. An example string
 
-         // might be:  stock > type_id > name.
 
-         $location = explode('>', $token_info['location']);
 
-         foreach ($location as $index) {
 
-           $index = trim($index);
 
-           // if $var is an object then it is the $node object or a table
 
-           // that has been expanded.
 
-           if (is_object($var)) {
 
-             // check to see if the index is a member of the object. If so,
 
-             // then reset the $var to this value.
 
-             if (property_exists($var, $index)) {
 
-               $value = $var->$index;
 
-             }
 
-           }
 
-           // if the $var is an array then there are multiple instances of the same
 
-           // table in a FK relationship (e.g. relationship tables)
 
-           elseif (is_array($var)) {
 
-             $value = $var[$index];
 
-           }
 
-           else {
 
-             tripal_report_error('tripal_chado', TRIPAL_WARNING,
 
-               'Tokens: Unable to determine the value of %token. Things went awry when trying ' .
 
-               'to access \'%index\' for the following: \'%var\'.',
 
-               array('%token' => $token, '%index' => $index, '%var' => print_r($var,TRUE))
 
-             );
 
-           }
 
-         }
 
-         $string = str_replace($token, $value, $string);
 
-       }
 
-     }
 
-   }
 
-   return $string;
 
- }
 
- /**
 
-  * Retrieve an entity_id for a chado record.
 
-  *
 
-  * @param string $chado_table
 
-  *   The chado_table where the record is stored.
 
-  * @param integer $record_id
 
-  *   The record_id which is the primary key of the chado table.
 
-  *
 
-  * @return
 
-  *   Return an integer representing the entity_id or NULL if not found. The
 
-  *   record is then accessible on the website through URL /bio_data/<entity_id>
 
-  */
 
- function tripal_get_chado_entity_id ($chado_table, $record_id) {
 
-   // To find the bundle_table, check if type_column is used for the chado table.
 
-   $type_column =
 
-     db_select('chado_bundle', 'CB')
 
-     ->fields('CB', array('type_column'))
 
-     ->condition('data_table', $chado_table)
 
-     ->execute()
 
-     ->fetchField();
 
-   // If there is a type_column, get bundle_id by specifying the data_table,
 
-   // type_column, and type_id.
 
-   $bundle_id = NULL;
 
-   if ($type_column) {
 
-     $schema = chado_get_schema($chado_table);
 
-     $pkey = is_array($schema['primary key']) ? $schema['primary key'][0] : $schema['primary key'];
 
-     $type_id = NULL;
 
-     if (key_exists($type_column, $schema['fields'])) {
 
-       $type_id =
 
-         db_select("chado.$chado_table", 'C')
 
-           ->fields('C', array($type_column))
 
-           ->condition($pkey, $record_id)
 
-           ->execute()
 
-           ->fetchField();
 
-     }
 
-     if ($type_id) {
 
-       $bundle_id =
 
-         db_select('chado_bundle', 'CB')
 
-           ->fields('CB', array('bundle_id'))
 
-           ->condition('data_table', $chado_table)
 
-           ->condition('type_column', $type_column)
 
-           ->condition('type_id', $type_id)
 
-           ->execute()
 
-           ->fetchField();
 
-     }
 
-   }
 
-   // If type_column is not used, get bundle_id by specifying the data_table.
 
-   else {
 
-     $bundle_id =
 
-       db_select('chado_bundle', 'CB')
 
-         ->fields('CB', array('bundle_id'))
 
-         ->condition('data_table', $chado_table)
 
-         ->execute()
 
-         ->fetchField();
 
-   }
 
-   // If bundle_id is found, find the bundle table name and return the entity_id.
 
-   $entity_id = NULL;
 
-   if ($bundle_id) {
 
-     $table_name =
 
-       db_select('tripal_bundle', 'TB')
 
-         ->fields('TB', array('name'))
 
-         ->condition('id', $bundle_id)
 
-         ->execute()
 
-         ->fetchField();
 
-     $entity_id =
 
-       db_select('chado_' . $table_name, 'CBD')
 
-         ->fields('CBD', array('entity_id'))
 
-         ->condition('record_id', $record_id)
 
-         ->execute()
 
-         ->fetchField();
 
-   }
 
-   return $entity_id;
 
- }
 
 
  |