tripal_chado.field_storage.inc 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624
  1. <?php
  /**
   * Implements hook_field_storage_info().
   *
   * Declares one storage backend, 'field_chado_storage', described as storing
   * fields in the local Chado database.
   *
   * @return
   *   An array of storage definitions keyed by storage type name.
   */
  function tripal_chado_field_storage_info() {
    // 'logo_url' is a Tripal extension, not a key Drupal itself understands.
    // It supplies a picture for the data store so it is easier to recognize on
    // the field_ui_field_overview_form. Ideally it is a relative path on the
    // local Drupal site.
    $logo_path = drupal_get_path('module', 'tripal') . '/theme/images/250px-ChadoLogo.png';

    $storage = array();
    $storage['field_chado_storage'] = array(
      'label' => t('Chado'),
      'description' => t('Stores fields in the local Chado database.'),
      'settings' => array(),
      'logo_url' => url($logo_path),
    );

    return $storage;
  }
  /**
   * Implements hook_field_storage_write().
   *
   * Writes the field values of an entity to Chado: first the record in the
   * entity's base table, then (on insert) the chado_entity mapping row, and
   * finally every record destined for a table other than the base table.
   *
   * @param $entity_type
   *   The type of entity being written.
   * @param $entity
   *   The entity. Its term_id, chado_table, chado_column, chado_record_id and
   *   id properties are read here.
   * @param $op
   *   FIELD_STORAGE_INSERT when a new entity is being stored; any other value
   *   is handled as an update.
   * @param $fields
   *   The fields to write, keyed by field ID.
   *
   * @throws Exception
   *   Propagated from tripal_chado_field_storage_write_table().
   */
  function tripal_chado_field_storage_write($entity_type, $entity, $op, $fields) {
    // Convert the Tripal term of this entity into the matching Chado cvterm.
    $term = entity_load('TripalTerm', array('id' => $entity->term_id));
    $term = reset($term);
    $dbxref = tripal_get_dbxref(array('accession' => $term->accession, 'db_id' => array('name' => $term->vocab->vocabulary)));
    $cvterm = tripal_get_cvterm(array('dbxref_id' => $dbxref->dbxref_id));

    // Get the base table, type field and record_id from the entity.
    $base_table = $entity->chado_table;
    $type_field = $entity->chado_column;
    $record_id = $entity->chado_record_id;
    $base_schema = chado_get_schema($base_table);
    $base_pkey = $base_schema['primary key'][0];

    // Convert the fields into a key/value list of tables and their values.
    $field_vals = tripal_chado_field_storage_write_merge_fields($fields, $entity_type, $entity);

    // The merged list only has an entry for the base table when at least one
    // field supplied a value for it.
    $has_base_values = isset($field_vals[$base_table]);
    $values = $has_base_values ? $field_vals[$base_table] : array();

    // If we have a record id then this is an update and we need to set the
    // primary key. If not, then this is an insert and we need to set the
    // type_id if the table supports it.
    if ($record_id) {
      $values[$base_pkey] = $record_id;
    }
    elseif ($type_field) {
      $values[$type_field] = $cvterm->cvterm_id;
    }

    if ($record_id and !$has_base_values) {
      // Nothing to change in the base table. Writing an array that holds only
      // the primary key would be treated as a delete request by
      // tripal_chado_field_storage_write_table(), so skip the write.
      $base_record_id = $record_id;
    }
    else {
      $base_record_id = tripal_chado_field_storage_write_table($base_table, $values);
    }

    // If this is an insert then add the chado_entity record so that the data
    // for the fields can be pulled from Chado when loaded the next time.
    if ($op == FIELD_STORAGE_INSERT) {
      $chado_entity = array(
        'entity_id' => $entity->id,
        'record_id' => $base_record_id,
        'data_table' => $base_table,
        'type_table' => $base_table,
        'field' => $type_field,
      );
      $success = drupal_write_record('chado_entity', $chado_entity);
      if (!$success) {
        drupal_set_message('Unable to insert new Chado entity.', 'error');
      }
    }

    // Now that the base table is handled, write the records of all other
    // tables. Each of those tables holds a list of records.
    foreach ($field_vals as $table_name => $details) {
      // Skip the base table as we've already dealt with it.
      if ($table_name == $base_table) {
        continue;
      }
      foreach ($details as $delta => $linked_values) {
        tripal_chado_field_storage_write_table($table_name, $linked_values);
      }
    }
  }
  /**
   * Writes (inserts/updates/deletes) values for a Chado table.
   *
   * The operation is chosen from the content of $values:
   * - every value empty: nothing is written;
   * - only the primary key has a value: the record is deleted;
   * - the primary key is missing or empty: the record is inserted, unless the
   *   duplicate check finds an existing record, whose ID is then returned;
   * - otherwise: the record identified by the primary key is updated.
   *
   * A value counts as empty when PHP evaluates it as FALSE, so 0 and '0' are
   * treated as empty as well.
   *
   * @param $table_name
   *   The name of the table on which the operation is performed.
   * @param $values
   *   An array of values keyed by column name, in the format used by
   *   chado_insert_record() and chado_update_record().
   *
   * @throws Exception
   *   When a delete or an insert fails, or when the duplicate check reports an
   *   existing record that cannot be retrieved with the submitted values.
   *
   * @return
   *   The primary key value of the inserted, matched or updated record, or an
   *   empty string when nothing was written or the record was deleted.
   */
  function tripal_chado_field_storage_write_table($table_name, $values) {
    $schema = chado_get_schema($table_name);
    $pkey = $schema['primary key'][0];

    // Count the columns that carry a value.
    $num_vals = 0;
    foreach ($values as $value) {
      if ($value) {
        $num_vals++;
      }
    }

    // Fields with a cardinality greater than 1 will often submit an empty
    // form. Such submissions have no values at all and are ignored.
    if ($num_vals == 0) {
      return '';
    }

    $has_pkey = (array_key_exists($pkey, $values) and $values[$pkey]);

    // If the primary key column has a value but all other values are empty
    // then this is a delete.
    if ($has_pkey and $num_vals == 1) {
      $delete_match = array($pkey => $values[$pkey]);
      if (!chado_delete_record($table_name, $delete_match)) {
        throw new Exception('Could not delete record from table: "' . $table_name . '".');
      }
      return '';
    }

    // If the primary key column does not have a value then this is an insert.
    if (!$has_pkey) {
      // Before inserting, make sure the record does not already exist.
      $options = array('is_duplicate' => TRUE);
      $is_duplicate = chado_select_record($table_name, array('*'), $values, $options);
      if ($is_duplicate) {
        $existing = chado_select_record($table_name, array('*'), $values);
        // The second lookup filters on every submitted value, so it can come
        // back empty even though the duplicate check was positive. Fail
        // explicitly instead of dereferencing a missing row.
        if (!$existing) {
          throw new Exception('Could not insert Chado record into table: "' . $table_name . '". The duplicate check matched an existing record that could not be retrieved with the submitted values.');
        }
        return $existing[0]->$pkey;
      }

      // Insert the values as a new record but drop the (empty) primary key so
      // that it gets assigned on insert.
      $new_vals = $values;
      unset($new_vals[$pkey]);
      $record = chado_insert_record($table_name, $new_vals);
      if ($record === FALSE) {
        throw new Exception('Could not insert Chado record into table: "' . $table_name . '".');
      }
      return $record[$pkey];
    }

    // If we've made it to this point then this is an update.
    // TODO: what if the unique constraint matches another record? That is
    // not being tested for here.
    $match = array($pkey => $values[$pkey]);
    if (!chado_update_record($table_name, $match, $values)) {
      drupal_set_message("Could not update Chado record in table: $table_name.", 'error');
    }
    return $values[$pkey];
  }
  /**
   * Implements hook_field_storage_load().
   *
   * Loads the Chado record behind each entity, stores it on the entity as
   * chado_record, and populates the entity's fields from it.
   *
   * @param $entity_type
   *   The type of the entities being loaded.
   * @param $entities
   *   The entities to populate, keyed by entity ID.
   * @param $age
   *   Not used by this implementation.
   * @param $fields
   *   The fields to load, keyed by field ID.
   * @param $options
   *   Not used by this implementation.
   */
  function tripal_chado_field_storage_load($entity_type, $entities, $age,
      $fields, $options) {

    // All values are stored under this language code.
    $langcode = 'und';

    foreach ($entities as $id => $entity) {
      // Find the base table and record ID, either on the entity itself or in
      // the chado_entity mapping table.
      if (property_exists($entity, 'chado_table')) {
        $base_table = $entity->chado_table;
        $record_id = $entity->chado_record_id;
      }
      else {
        $details = db_select('chado_entity', 'ce')
          ->fields('ce')
          ->condition('entity_id', $entity->id)
          ->execute()
          ->fetchObject();
        // TODO: what to do if record is missing! For now empty values are
        // used when no mapping row exists.
        $base_table = isset($details->data_table) ? $details->data_table : '';
        $record_id = isset($details->record_id) ? $details->record_id : '';
      }

      // Get the base record if one exists.
      $schema = chado_get_schema($base_table);
      $pkey_field = $schema['primary key'][0];
      $record = chado_generate_var($base_table, array($pkey_field => $record_id));
      $entity->chado_record = $record;

      foreach ($fields as $field_id => $ids) {
        // By the time this hook runs, the relevant field definitions have been
        // populated and cached in FieldInfo, so calling
        // field_info_field_by_id() on each field individually is more
        // efficient than loading all fields in memory upfront with
        // field_info_field_by_ids().
        $field = field_info_field_by_id($field_id);
        $field_name = $field['field_name'];
        $field_type = $field['type'];

        // Get the instance for this field.
        $instance = field_info_instance($entity_type, $field_name, $entity->bundle);

        // Skip fields without an instance and fields that don't map to a
        // Chado table (e.g. kvproperty_adder).
        if (!is_array($instance) or
            !array_key_exists('settings', $instance) or
            !array_key_exists('chado_table', $instance['settings'])) {
          continue;
        }

        // Get the Chado table and column for this field.
        $field_table = $instance['settings']['chado_table'];
        $field_column = $instance['settings']['chado_column'];
        $item_key = 'chado-' . $field_table . '__' . $field_column;

        // Set an empty value by default. It is replaced below, or by the
        // field class, when data is available.
        $entity->{$field_name}[$langcode][0]['value'] = '';

        // There are only two types of fields: 1) fields that represent a
        // single column of the base table, or 2) fields that represent a
        // linked record in a many-to-one relationship with the base table.
        if ($field_table == $base_table) {
          // Type 1: fields from base tables.
          if ($record and property_exists($record, $field_column)) {
            if (is_object($record->$field_column)) {
              // An object here is a FK to another table. Because $record is
              // built by chado_generate_var() we must go one level deeper to
              // get the key value. The 'value' item keeps its empty default.
              $entity->{$field_name}[$langcode][0][$item_key] = $record->$field_column->$field_column;
            }
            else {
              // For non FK fields the field value is the column value.
              $entity->{$field_name}[$langcode][0]['value'] = $record->$field_column;
              $entity->{$field_name}[$langcode][0][$item_key] = $record->$field_column;
            }
          }

          // Allow the field class to alter the value. It should do this if
          // the field has other form elements that need populating besides
          // the value set above.
          tripal_load_include_field_class($field_type);
          if (class_exists($field_type) and is_subclass_of($field_type, 'TripalField')) {
            $tfield = new $field_type($field, $instance);
            $tfield->load($entity, array('record' => $record));
          }
        }
        else {
          // Type 2: fields for linked records. These may have any number of
          // form elements that need populating, so loading is left entirely
          // to the field class.
          tripal_load_include_field_class($field_type);
          if (class_exists($field_type) && method_exists($field_type, 'load')) {
            $tfield = new $field_type($field, $instance);
            $tfield->load($entity, array('record' => $record));
          }
        }
      }
    }
  }
  /**
   * Merges the values of all fields into a single array keyed by table name.
   *
   * Item keys of the form 'chado-[table]__[column]' are mapped directly to
   * that table and column. When an item has no such key for the field's own
   * table and column, a scalar 'value' item is used instead.
   *
   * @param $fields
   *   The fields to merge, keyed by field ID.
   * @param $entity_type
   *   The type of $entity.
   * @param $entity
   *   The entity holding the field items.
   *
   * @return
   *   An array keyed by table name. The base table maps to one array of
   *   column => value pairs. Every other table maps to a list of such arrays,
   *   one per record.
   */
  function tripal_chado_field_storage_write_merge_fields($fields, $entity_type, $entity) {
    $all_fields = array();
    $base_fields = array();

    foreach ($fields as $field_id => $ids) {
      // Get the field name and information about it.
      $field = field_info_field_by_id($field_id);
      $field_name = $field['field_name'];

      // Some fields (e.g. chado_linker_cvterm_adder) don't add data to
      // Chado so they don't have a table, but they are still attached to the
      // entity. Just skip these.
      if (!array_key_exists('chado_table', $field['settings'])) {
        continue;
      }
      $chado_table = $field['settings']['chado_table'];
      $chado_column = $field['settings']['chado_column'];
      $base_table = $field['settings']['base_table'];

      // field_get_items() returns FALSE rather than an empty array when the
      // field has no items, so there is nothing to merge for this field.
      $items = field_get_items($entity_type, $entity, $field_name);
      if (!is_array($items)) {
        continue;
      }

      // Collects the records of this field for tables other than the base
      // table, keyed by table name and then by delta.
      $temp = array();
      foreach ($items as $delta => $item) {
        // Items indexed with "chado-" represent values that map directly to
        // Chado tables and columns.
        foreach ($item as $item_name => $value) {
          $matches = array();
          if (preg_match('/^chado-(.*?)__(.*?)$/', $item_name, $matches)) {
            $table_name = $matches[1];
            $column_name = $matches[2];
            // Values of the base table are added directly; there's no delta.
            if ($table_name == $base_table) {
              $base_fields[$table_name][$column_name] = $value;
            }
            else {
              $temp[$table_name][$delta][$column_name] = $value;
            }
          }
        }

        // If there is no value set for the field using the
        // chado-[table_name]__[field name] naming schema then check if a
        // 'value' item is present and if so use that for the column value.
        // NOTE(review): only $temp is consulted, so for a base-table field a
        // 'value' item always replaces a 'chado-' item -- confirm intended.
        $has_chado_item = (array_key_exists($chado_table, $temp) and
          array_key_exists($delta, $temp[$chado_table]) and
          array_key_exists($chado_column, $temp[$chado_table][$delta]));
        if (!$has_chado_item and
            array_key_exists('value', $item) and
            !is_array($item['value'])) {
          if ($base_table == $chado_table) {
            $base_fields[$chado_table][$chado_column] = $item['value'];
          }
          else {
            $temp[$chado_table][$delta][$chado_column] = $item['value'];
          }
        }
      }

      // Append the records of this field to the $all_fields array.
      foreach ($temp as $table_name => $details) {
        foreach ($details as $delta => $list) {
          $all_fields[$table_name][] = $list;
        }
      }
    }

    $all_fields = array_merge($base_fields, $all_fields);
    return $all_fields;
  }
  /**
   * Breaks a field item name into a nested array.
   *
   * The name is split on '--'. Each part before the last becomes a level of
   * nesting, and the innermost key is assigned $value. A name without '--'
   * yields array($item_name => $value).
   *
   * @param $item_name
   *   The item name, e.g. 'a--b--c'.
   * @param $value
   *   The value to place at the innermost level.
   *
   * @return
   *   The nested array, e.g. array('a' => array('b' => array('c' => $value))).
   */
  function tripal_chado_field_storage_expand_field($item_name, $value) {
    // Peel off one leading name part at a time, outermost first.
    $path = array();
    $remainder = $item_name;
    $parts = array();
    while (preg_match('/^(.*?)--(.*?)$/', $remainder, $parts)) {
      $path[] = $parts[1];
      $remainder = $parts[2];
    }
    $path[] = $remainder;

    // Wrap the value from the innermost key outwards.
    $nested = $value;
    foreach (array_reverse($path) as $key) {
      $nested = array($key => $nested);
    }
    return $nested;
  }
  /**
   * Implements hook_field_storage_query().
   *
   * Converts the field conditions of the query into chado_select_record()
   * filters, runs them per Chado table, and maps the matching record IDs to
   * entities through the chado_entity table.
   *
   * @param $query
   *   The query object. Its fieldConditions, order and entityConditions
   *   properties are read.
   *
   * @return
   *   An array with a single 'TripalEntity' key holding stub entities keyed
   *   by entity ID.
   */
  function tripal_chado_field_storage_query($query) {

    // The conditions are reorganized into a filters array, keyed by table and
    // column, for the chado_select_record() function.
    $filters = array();
    foreach ($query->fieldConditions as $index => $condition) {
      $field = $condition['field'];

      // Skip conditions that don't belong to this storage type.
      if ($field['storage']['type'] != 'field_chado_storage') {
        continue;
      }

      $column = $condition['column'];
      $value = $condition['value'];
      $settings = $field['settings'];
      $chado_table = $settings['chado_table'];
      $chado_column = $settings['chado_column'];

      // A column containing dots addresses a sub-field. The value is then
      // replaced by a nested filter built from the sub-field names.
      $subfields = explode('.', $column);
      if (count($subfields) > 1) {
        // Get the term for this field's column and replace the field_name
        // with the term. We need to do this for the recursive function to
        // work. We must lowercase the term and underscore it because that's
        // how we can support case-insensitivity and lack of spacing such as
        // for web services.
        $subfield1 = tripal_get_chado_semweb_term($chado_table, $chado_column, array('return_object' => TRUE));
        $subfields[0] = strtolower(preg_replace('/ /', '_', $subfield1->name));
        $value = tripal_chado_field_storage_recurse_subfilters($chado_table, $subfields, $value);
        $value = array_shift($value);
      }

      // Use the appropriate operator; a missing or empty one means equality.
      $operator = !empty($condition['operator']) ? $condition['operator'] : '=';
      switch ($operator) {
        case '=':
          $filters[$chado_table][$chado_column] = $value;
          break;

        case '>':
        case '>=':
        case '<':
        case '<=':
        case '<>':
          $filters[$chado_table][$chado_column] = array(
            'op' => $operator,
            'data' => $value,
          );
          break;

        case 'CONTAINS':
          $filters[$chado_table][$chado_column] = array(
            'op' => 'LIKE',
            'data' => '%' . $value . '%',
          );
          break;

        case 'NOT':
          $filters[$chado_table][$chado_column] = array(
            'op' => 'NOT LIKE',
            'data' => '%' . $value . '%',
          );
          break;

        case 'STARTS WITH':
          $filters[$chado_table][$chado_column] = array(
            'op' => 'LIKE',
            'data' => $value . '%',
          );
          break;

        case 'NOT STARTS':
          $filters[$chado_table][$chado_column] = array(
            'op' => 'NOT LIKE',
            'data' => $value . '%',
          );
          break;

        case 'ENDS WITH':
          $filters[$chado_table][$chado_column] = array(
            'op' => 'LIKE',
            'data' => '%' . $value,
          );
          break;

        case 'NOT ENDS':
          $filters[$chado_table][$chado_column] = array(
            'op' => 'NOT LIKE',
            'data' => '%' . $value,
          );
          break;

        default:
          // Unrecognized operation: no filter is added.
          break;
      }
    }

    // Now get the list for sorting.
    // TODO: the collected sort order is not applied to the results yet.
    $sorting = array();
    foreach ($query->order as $index => $sort) {
      $field = $sort['specifier']['field'];
      // Skip sorts that don't belong to this storage type.
      if ($field['storage']['type'] != 'field_chado_storage') {
        continue;
      }
      $settings = $field['settings'];
      $sorting[$settings['chado_table']][$settings['chado_column']] = $sort['direction'];
    }

    // Iterate through the filters and perform the query. The matches of all
    // tables are collected into one list.
    $entity_ids = array();
    foreach ($filters as $chado_table => $values) {
      // First get the matching record IDs from the Chado table.
      $schema = chado_get_schema($chado_table);
      $pkey = $schema['primary key'][0];
      $results = chado_select_record($chado_table, array($pkey), $values);
      // Nothing matched, or the select did not return a result set.
      if (!$results) {
        continue;
      }
      $record_ids = array();
      foreach ($results as $result) {
        $record_ids[] = $result->$pkey;
      }

      // Next look for matching IDs in the chado_entity table.
      // NOTE(review): records are matched on record_id only, not on the
      // table they belong to -- confirm this is intended.
      $select = db_select('chado_entity', 'CE');
      $select->join('tripal_entity', 'TE', 'TE.id = CE.entity_id');
      $select->fields('CE', array('entity_id'));
      $select->fields('TE', array('bundle'));
      $select->condition('CE.record_id', $record_ids);

      // If a bundle is specified then make sure we match on the bundle. An
      // entity condition is an array holding the value and its operator, so
      // only the value is used for matching; the operator is not applied.
      if (array_key_exists('bundle', $query->entityConditions)) {
        $bundle_condition = $query->entityConditions['bundle'];
        if (is_array($bundle_condition) and array_key_exists('value', $bundle_condition)) {
          $select->condition('TE.bundle', $bundle_condition['value']);
        }
        else {
          $select->condition('TE.bundle', $bundle_condition);
        }
      }

      $matches = $select->execute();
      while ($match = $matches->fetchObject()) {
        $entity_ids[] = array($match->entity_id, 0, $match->bundle);
      }
    }

    // Build the stub entities, keyed by entity ID.
    $result = array(
      'TripalEntity' => array(),
    );
    foreach ($entity_ids as $ids) {
      $result['TripalEntity'][$ids[0]] = entity_create_stub_entity('TripalEntity', $ids);
    }
    return $result;
  }
  /**
   * Builds a nested filter array from a list of sub-field names.
   *
   * The first sub-field is compared with the names of the cvterms mapped to
   * the columns of $chado_table in the chado_semweb table. Names are
   * lower-cased and spaces replaced by underscores before comparing. When
   * more sub-fields remain and the matched column is a foreign key, the
   * function recurses into the referenced table.
   *
   * @param $chado_table
   *   The Chado table whose columns are examined.
   * @param $subfields
   *   The remaining sub-field names, outermost first.
   * @param $value
   *   The value to place at the innermost level.
   *
   * @return
   *   An array with one element, keyed by the matched column name (an empty
   *   string when no column matched), holding either $value or the nested
   *   array built for the remaining sub-fields.
   */
  function tripal_chado_field_storage_recurse_subfilters($chado_table, $subfields, $value) {
    // Take the sub-field handled at this level off the front of the list.
    $current = array_shift($subfields);

    // Get the cvterms mapped to the columns of this table.
    $mapped = db_select('chado_semweb', 'CS')
      ->fields('CS', array('chado_column', 'cvterm_id'))
      ->condition('chado_table', $chado_table)
      ->execute();

    // Find the column whose term name equals the sub-field. All rows are
    // examined, so the last matching row determines the column.
    $matched_column = '';
    while ($row = $mapped->fetchObject()) {
      $term = tripal_get_cvterm(array('cvterm_id' => $row->cvterm_id));
      $normalized = strtolower(preg_replace('/ /', '_', $term->name));
      if ($current == $normalized) {
        $matched_column = $row->chado_column;
      }
    }

    // No sub-fields left: this is the innermost level.
    if (count($subfields) == 0) {
      return array($matched_column => $value);
    }

    // More sub-fields remain, so the column should be a foreign key. Find it
    // among the foreign keys of this table and recurse into its table.
    $table_schema = chado_get_schema($chado_table);
    foreach ($table_schema['foreign keys'] as $fk_table => $fk_info) {
      foreach (array_keys($fk_info['columns']) as $local_column) {
        if ($local_column == $matched_column) {
          $nested = tripal_chado_field_storage_recurse_subfilters($fk_table, $subfields, $value);
          return array($matched_column => $nested);
        }
      }
    }

    // The column is not a foreign key: use the value as is.
    return array($matched_column => $value);
  }