tripal_chado.field_storage.inc 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624
  1. <?php
  2. /**
  3. * Implements hook_field_storage_info().
  4. */
  5. function tripal_chado_field_storage_info() {
  6. return array(
  7. 'field_chado_storage' => array(
  8. 'label' => t('Chado'),
  9. 'description' => t('Stores fields in the local Chado database.'),
  10. 'settings' => array(),
  11. // The logo_url key is supported by Tripal. It's not a Drupal key. It's
  12. // used for adding a logo or picture for the data store to help make it
  13. // more easily recognized on the field_ui_field_overview_form. Ideally
  14. // the URL should point to a relative path on the local Drupal site.
  15. 'logo_url' => url(drupal_get_path('module', 'tripal') . '/theme/images/250px-ChadoLogo.png'),
  16. ),
  17. );
  18. }
  19. /**
  20. * Implements hook_field_storage_write().
  21. */
  22. function tripal_chado_field_storage_write($entity_type, $entity, $op, $fields) {
  23. // Get the bundle and the term for this entity.
  24. $bundle = tripal_load_bundle_entity(array('name' => $entity->bundle));
  25. $term = entity_load('TripalTerm', array('id' => $entity->term_id));
  26. $term = reset($term);
  27. // Convert the Tripal term entity into the appropriate record in Chado.
  28. $dbxref = tripal_get_dbxref(array('accession' => $term->accession, 'db_id' => array('name' => $term->vocab->vocabulary)));
  29. $cvterm = tripal_get_cvterm(array('dbxref_id' => $dbxref->dbxref_id));
  30. // Get the base table, type field and record_id from the entity.
  31. $base_table = $entity->chado_table;
  32. $type_field = $entity->chado_column;
  33. $record = $entity->chado_record;
  34. $record_id = $entity->chado_record_id;
  35. $base_schema = chado_get_schema($base_table);
  36. $base_pkey = $base_schema['primary key'][0];
  37. // Convert the fields into a key/value list of fields and their values.
  38. $field_vals = tripal_chado_field_storage_write_merge_fields($fields, $entity_type, $entity);
  39. // First, write the record for the base table. If we have a record id then
  40. // this is an update and we need to set the primary key. If not, then this
  41. // is an insert and we need to set the type_id if the table supports it.
  42. $values = $field_vals[$base_table];
  43. if ($record_id) {
  44. $values[$base_pkey] = $record_id;
  45. }
  46. elseif ($type_field) {
  47. $values[$type_field] = $cvterm->cvterm_id;
  48. }
  49. $base_record_id = tripal_chado_field_storage_write_table($base_table, $values);
  50. // If this is an insert then add the chado_entity record.
  51. if ($op == FIELD_STORAGE_INSERT) {
  52. // Add a record to the chado_entity table so that the data for the
  53. // fields can be pulled from Chado when loaded the next time.
  54. $record = array(
  55. 'entity_id' => $entity->id,
  56. 'record_id' => $base_record_id,
  57. 'data_table' => $base_table,
  58. );
  59. $success = drupal_write_record('chado_entity', $record);
  60. if (!$success) {
  61. drupal_set_message('Unable to insert new Chado entity.', 'error');
  62. }
  63. }
  64. // Now that we have handled the base table, we need to handle linking tables.
  65. foreach ($field_vals as $table_name => $details) {
  66. // Skip the base table as we've already dealt with it.
  67. if ($table_name == $base_table) {
  68. continue;
  69. }
  70. foreach ($details as $delta => $values) {
  71. $record_id = tripal_chado_field_storage_write_table($table_name, $values);
  72. }
  73. }
  74. }
  75. /**
  76. * Write (inserts/updates/deletes) values for a Chado table.
  77. *
  78. * The $values array is of the same format used by chado_insert_record() and
  79. * chado_update_record(). However, both of those methods will use any nested
  80. * arrays (i.e. representing foreign keys) to select an appropriate record ID
  81. * that can be substituted as the value. Here, the nested arrays are
  82. * either inserted or updated as well, but the choice is determined if the
  83. * primary key value is present. If present an update occurs, if not present
  84. * then an insert occurs.
  85. *
  86. * This function is recursive and nested arrays from the lowest point of the
  87. * "tree" are dealt with first.
  88. *
  89. * @param $table_name
  90. * The name of the table on which the insertion/update is performed.
  91. * @param $values
  92. * The values array for the insertion.
  93. *
  94. * @throws Exception
  95. *
  96. * @return
  97. * The unique record ID.
  98. */
  99. function tripal_chado_field_storage_write_table($table_name, $values) {
  100. $schema = chado_get_schema($table_name);
  101. $fkeys = $schema['foreign keys'];
  102. $pkey = $schema['primary key'][0];
  103. // Fields with a cardinality greater than 1 will often submit an
  104. // empty form. We want to remove these empty submissions. We can detect
  105. // them if all of the fields are empty.
  106. $num_empty = 0;
  107. foreach ($values as $column => $value) {
  108. if (!$value) {
  109. $num_empty++;
  110. }
  111. }
  112. if ($num_empty == count(array_keys($values))) {
  113. return '';
  114. }
  115. // If the primary key column has a value but all other values are empty then
  116. // this is a delete.
  117. if (array_key_exists($pkey, $values) and $values[$pkey]) {
  118. $num_vals = 0;
  119. foreach ($values as $value) {
  120. if ($value) {
  121. $num_vals++;
  122. }
  123. }
  124. if ($num_vals == 1) {
  125. $new_vals[$pkey] = $values[$pkey];
  126. if (!chado_delete_record($table_name, $new_vals)) {
  127. throw new Exception('Could not delete record from table: "' . $table_name . '".');
  128. }
  129. return '';
  130. }
  131. }
  132. // If the primary key column does not have a value then this is an insert.
  133. if (!array_key_exists($pkey, $values) or !$values[$pkey] or !isset($values[$pkey])) {
  134. // Before inserting, we want to make sure the record does not
  135. // already exist. Using the unique constraint check for a matching record.
  136. $options = array('is_duplicate' => TRUE);
  137. $is_duplicate = chado_select_record($table_name, array('*'), $values, $options);
  138. if($is_duplicate) {
  139. $record = chado_select_record($table_name, array('*'), $values);
  140. return $record[0]->$pkey;
  141. }
  142. // Insert the values array as a new record in the table but remove the
  143. // pkey as it should be set.
  144. $new_vals = $values;
  145. unset($new_vals[$pkey]);
  146. $record = chado_insert_record($table_name, $new_vals);
  147. if ($record === FALSE) {
  148. throw new Exception('Could not insert Chado record into table: "' . $table_name . '".');
  149. }
  150. return $record[$pkey];
  151. }
  152. // If we've made it to this point then this is an update.
  153. // TODO: what if the unique constraint matches another record? That is
  154. // not being tested for here.
  155. $match[$pkey] = $values[$pkey];
  156. if (!chado_update_record($table_name, $match, $values)) {
  157. drupal_set_message("Could not update Chado record in table: $table_name.", 'error');
  158. }
  159. return $values[$pkey];
  160. }
  161. /**
  162. * Implements hook_field_storage_load().
  163. *
  164. * Responsible for loading the fields from the Chado database and adding
  165. * their values to the entity.
  166. */
  167. function tripal_chado_field_storage_load($entity_type, $entities, $age,
  168. $fields, $options) {
  169. $load_current = $age == FIELD_LOAD_CURRENT;
  170. global $language;
  171. $langcode = $language->language;
  172. foreach ($entities as $id => $entity) {
  173. if (property_exists($entity, 'chado_table')) {
  174. // Get the base table and record id for the fields of this entity.
  175. $base_table = $entity->chado_table;
  176. $type_field = $entity->chado_column;
  177. $record_id = $entity->chado_record_id;
  178. }
  179. else {
  180. $bundle = tripal_load_bundle_entity(array('name' => $entity->bundle));
  181. $base_table = $bundle->data_table;
  182. $type_field = $bundle->type_column;
  183. // Get the base table and record id for the fields of this entity.
  184. $details = db_select('chado_entity', 'ce')
  185. ->fields('ce')
  186. ->condition('entity_id', $entity->id)
  187. ->execute()
  188. ->fetchObject();
  189. if (!$details) {
  190. // TODO: what to do if record is missing!
  191. }
  192. $record_id = isset($details->record_id) ? $details->record_id : '';
  193. }
  194. // Get this table's schema.
  195. $schema = chado_get_schema($base_table);
  196. $pkey_field = $schema['primary key'][0];
  197. // Get the base record if one exists
  198. $columns = array('*');
  199. $match = array($pkey_field => $record_id);
  200. $record = chado_generate_var($base_table, $match);
  201. $entity->chado_record = $record;
  202. // Iterate through the entity's fields so we can get the column names
  203. // that need to be selected from each of the tables represented.
  204. $tables = array();
  205. foreach ($fields as $field_id => $ids) {
  206. // By the time this hook runs, the relevant field definitions have been
  207. // populated and cached in FieldInfo, so calling field_info_field_by_id()
  208. // on each field individually is more efficient than loading all fields in
  209. // memory upfront with field_info_field_by_ids().
  210. $field = field_info_field_by_id($field_id);
  211. $field_name = $field['field_name'];
  212. $field_type = $field['type'];
  213. $field_module = $field['module'];
  214. // Get the instnace for this field
  215. $instance = field_info_instance($entity_type, $field_name, $entity->bundle);
  216. // Skip fields that don't map to a Chado table (e.g. kvproperty_adder).
  217. if (!array_key_exists('settings', $instance) or !array_key_exists('chado_table', $instance['settings'])) {
  218. continue;
  219. }
  220. // Get the Chado table and column for this field.
  221. $field_table = $instance['settings']['chado_table'];
  222. $field_column = $instance['settings']['chado_column'];
  223. // There are only two types of fields: 1) fields that represent a single
  224. // column of the base table, or 2) fields that represent a linked record
  225. // in a many-to-one relationship with the base table.
  226. // Type 1: fields from base tables.
  227. if ($field_table == $base_table) {
  228. // Set an empty value by default, and if there is a record, then update.
  229. $entity->{$field_name}['und'][0]['value'] = '';
  230. if ($record and property_exists($record, $field_column)) {
  231. // If the field column is an object then it's a FK to another table.
  232. // and because $record object is created by the chado_generate_var()
  233. // function we must go one more level deeper to get the value
  234. if (is_object($record->$field_column)) {
  235. $entity->{$field_name}['und'][0]['chado-' . $field_table . '__' . $field_column] = $record->$field_column->$field_column;
  236. }
  237. else {
  238. // For non FK fields we'll make the field value be the same
  239. // as the column value.
  240. $entity->{$field_name}['und'][0]['value'] = $record->$field_column;
  241. $entity->{$field_name}['und'][0]['chado-' . $field_table . '__' . $field_column] = $record->$field_column;
  242. }
  243. }
  244. // Allow the creating module to alter the value if desired. The
  245. // module should do this if the field has any other form elements
  246. // that need populationg besides the value which was set above.
  247. tripal_load_include_field_class($field_type);
  248. if (class_exists($field_type) and is_subclass_of($field_type, 'TripalField')) {
  249. $tfield = new $field_type($field, $instance);
  250. $tfield->load($entity, array('record' => $record));
  251. }
  252. }
  253. // Type 2: fields for linked records. These fields will have any number
  254. // of form elements that might need populating so we'll offload the
  255. // loading of these fields to the field itself.
  256. if ($field_table != $base_table) {
  257. // Set an empty value by default, and let the hook function update it.
  258. $entity->{$field_name}['und'][0]['value'] = '';
  259. tripal_load_include_field_class($field_type);
  260. if (class_exists($field_type) && method_exists($field_type, 'load')) {
  261. $tfield = new $field_type($field, $instance);
  262. $tfield->load($entity, array('record' => $record));
  263. }
  264. }
  265. } // end: foreach ($fields as $field_id => $ids) {
  266. } // end: foreach ($entities as $id => $entity) {
  267. }
  268. /**
  269. * Merges the values of all fields into a single array keyed by table name.
  270. */
  271. function tripal_chado_field_storage_write_merge_fields($fields, $entity_type, $entity) {
  272. $all_fields = array();
  273. $base_fields = array();
  274. // Iterate through all of the fields and organize them into a
  275. // new fields array keyed by the table name
  276. foreach ($fields as $field_id => $ids) {
  277. // Get the field name and information about it.
  278. $field = field_info_field_by_id($field_id);
  279. $field_name = $field['field_name'];
  280. // Some fields (e.g. chado_linker_cvterm_adder) don't add data to
  281. // Chado so they don't have a table, but they are still attached to the
  282. // entity. Just skip these.
  283. if (!array_key_exists('chado_table', $field['settings'])) {
  284. continue;
  285. }
  286. $chado_table = $field['settings']['chado_table'];
  287. $chado_column = $field['settings']['chado_column'];
  288. $base_table = $field['settings']['base_table'];
  289. // Iterate through the field's items. Fields with cardinality ($delta) > 1
  290. // are multi-valued.
  291. $items = field_get_items($entity_type, $entity, $field_name);
  292. $temp = array();
  293. foreach ($items as $delta => $item) {
  294. // A field may have multiple items. The field can use items
  295. // indexed with "chado-" to represent values that should map directly
  296. // to chado tables and fields.
  297. foreach ($item as $item_name => $value) {
  298. $matches = array();
  299. if (preg_match('/^chado-(.*?)__(.*?)$/', $item_name, $matches)) {
  300. $table_name = $matches[1];
  301. $column_name = $matches[2];
  302. // If this field belongs to the base table then we just add
  303. // those values in... there's no delta.
  304. if ($table_name == $base_table) {
  305. $base_fields[$table_name][$column_name] = $value;
  306. }
  307. else {
  308. $temp[$table_name][$delta][$column_name] = $value;
  309. }
  310. }
  311. }
  312. // If there is no value set for the field using the
  313. // chado-[table_name]__[field name] naming schema then check if a 'value'
  314. // item is present and if so use that for the table column value.
  315. if ((!array_key_exists($chado_table, $temp) or
  316. !array_key_exists($delta, $temp[$chado_table]) or
  317. !array_key_exists($chado_column, $temp[$chado_table][$delta])) and
  318. array_key_exists('value', $items[$delta]) and
  319. !is_array($items[$delta]['value'])) {
  320. // If this field belongs to the base table then we just add
  321. // those values in... there's no delta.
  322. if ($base_table == $chado_table) {
  323. $base_fields[$chado_table][$chado_column] = $item['value'];
  324. }
  325. else {
  326. $temp[$chado_table][$delta][$chado_column] = $item['value'];
  327. }
  328. }
  329. }
  330. // Now merge the records for this field with the $new_fields array
  331. foreach ($temp as $table_name => $details) {
  332. foreach ($details as $delta => $list) {
  333. $all_fields[$table_name][] = $list;
  334. }
  335. }
  336. }
  337. $all_fields = array_merge($base_fields, $all_fields);
  338. return $all_fields;
  339. }
  340. /**
  341. * Recurses through a field's items breaking it into a nested array.
  342. */
  343. function tripal_chado_field_storage_expand_field($item_name, $value) {
  344. $matches = array();
  345. if (preg_match('/^(.*?)--(.*?)$/', $item_name, $matches)) {
  346. $parent_item_name = $matches[1];
  347. $sub_item_name = $matches[2];
  348. $sub_item = tripal_chado_field_storage_expand_field($sub_item_name, $value);
  349. return array($parent_item_name => $sub_item);
  350. }
  351. else {
  352. return array($item_name => $value);
  353. }
  354. }
  355. /**
  356. * Implements hook_field_storage_query().
  357. */
  358. function tripal_chado_field_storage_query($query) {
  359. //print_r($query->fieldConditions);
  360. // The conditions and order bys are reorganized into a filters array for the
  361. // chado_select_record function()
  362. $filters = array();
  363. // Iterate through all the conditions and add to the filters array
  364. // a chado_select_record compatible set of filters.
  365. foreach ($query->fieldConditions as $index => $condition) {
  366. $field = $condition['field'];
  367. // Skip conditions that don't belong to this storage type.
  368. if ($field['storage']['type'] != 'field_chado_storage') {
  369. continue;
  370. }
  371. $column = $condition['column'];
  372. $value = $condition['value'];
  373. $field_type = $field['type'];
  374. $field_module = $field['module'];
  375. $settings = $field['settings'];
  376. $chado_table = $settings['chado_table'];
  377. $chado_column = $settings['chado_column'];
  378. // Set the value for this field search.
  379. $subfields = explode('.', $column);
  380. //print_r($subfields);
  381. if (count($subfields) > 1) {
  382. // Get the term for this field's column and replace the field_name with
  383. // the term. We need to do this for the recursive function to work.
  384. // We must lowercase the term and underscore it because that's how we
  385. // can support case-insensitivity and lack of spacing such as for
  386. // web services.
  387. $subfield1 = tripal_get_chado_semweb_term($chado_table, $chado_column, array('return_object' => TRUE));
  388. $subfields[0] = strtolower(preg_replace('/ /', '_', $subfield1->name));
  389. $value = tripal_chado_field_storage_recurse_subfilters($chado_table, $subfields, $value);
  390. $value = array_shift($value);
  391. }
  392. else {
  393. $value = $condition['value'];
  394. }
  395. // Use the appropriate operator.
  396. $operator = $condition['operator'] ? $condition['operator'] : '=';
  397. switch ($operator) {
  398. case '=':
  399. $filters[$chado_table][$chado_column] = $value;
  400. break;
  401. case '>':
  402. case '>=':
  403. case '<':
  404. case '<=':
  405. $filters[$chado_table][$chado_column] = array(
  406. 'op' => $operator,
  407. 'data' => $value,
  408. );
  409. break;
  410. case '<>':
  411. $filters[$chado_table][$chado_column] = array(
  412. 'op' => '<>',
  413. 'data' => $value,
  414. );
  415. break;
  416. case 'CONTAINS':
  417. $filters[$chado_table][$chado_column] = array(
  418. 'op' => 'LIKE',
  419. 'data' => '%' . $value . '%',
  420. );
  421. break;
  422. case 'NOT':
  423. $filters[$chado_table][$chado_column] = array(
  424. 'op' => 'NOT LIKE',
  425. 'data' => '%' . $value . '%',
  426. );
  427. break;
  428. case 'STARTS WITH':
  429. $filters[$chado_table][$chado_column] = array(
  430. 'op' => 'LIKE',
  431. 'data' => $value . '%',
  432. );
  433. break;
  434. case 'NOT STARTS':
  435. $filters[$chado_table][$chado_column] = array(
  436. 'op' => 'NOT LIKE',
  437. 'data' => $value . '%',
  438. );
  439. break;
  440. case 'ENDS WITH':
  441. $filters[$chado_table][$chado_column] = array(
  442. 'op' => 'LIKE',
  443. 'data' => '%' . $value,
  444. );
  445. break;
  446. case 'NOT ENDS':
  447. $filters[$chado_table][$chado_column] = array(
  448. 'op' => 'NOT LIKE',
  449. 'data' => '%' . $value,
  450. );
  451. break;
  452. default:
  453. // unrecognized operation.
  454. break;
  455. }
  456. }
  457. // Now get the list for sorting.
  458. foreach ($query->order as $index => $sort) {
  459. $field = $sort['specifier']['field'];
  460. // Skip sorts that don't belong to this storage type.
  461. if ($field['storage']['type'] != 'field_chado_storage') {
  462. continue;
  463. }
  464. $direction = $sort['direction'];
  465. $field_type = $field['type'];
  466. $field_module = $field['module'];
  467. $settings = $field['settings'];
  468. $chado_table = $settings['chado_table'];
  469. $chado_column = $settings['chado_column'];
  470. $sorting[$chado_table][$chado_column] = $direction;
  471. }
  472. // Iterate through the filters and perform the query
  473. $entity_ids = array();
  474. foreach ($filters as $chado_table => $values) {
  475. //print_r($chado_table);
  476. //print_r($values);
  477. // First get the matching record IDs from the Chado table.
  478. $schema = chado_get_schema($chado_table);
  479. $pkey = $schema['primary key'][0];
  480. $results = chado_select_record($chado_table, array($pkey), $values);
  481. $record_ids = array();
  482. foreach ($results as $result) {
  483. $record_ids[] = $result->$pkey;
  484. }
  485. // Next look for matching IDs in the chado_entity table.
  486. $filter_ids = array();
  487. if (count($record_ids) > 0) {
  488. $select = db_select('chado_entity', 'CE');
  489. $select->join('tripal_entity', 'TE', 'TE.id = CE.entity_id');
  490. $select->fields('CE', array('entity_id'));
  491. $select->fields('TE', array('bundle'));
  492. $select->condition('record_id', $record_ids);
  493. // If a bundle is specified then make sure we match on the bundle.
  494. if (array_key_exists('bundle', $query->entityConditions)) {
  495. $select->condition('bundle', $query->entityConditions['bundle']);
  496. }
  497. $results = $select->execute();
  498. while ($result = $results->fetchObject()) {
  499. $entity_ids[] = array($result->entity_id, 0, $result->bundle);
  500. }
  501. }
  502. }
  503. $result = array(
  504. 'TripalEntity' => array()
  505. );
  506. foreach ($entity_ids as $ids) {
  507. $result['TripalEntity'][$ids[0]] = entity_create_stub_entity('TripalEntity', $ids);
  508. }
  509. return $result;
  510. }
  511. /**
  512. *
  513. * @param $subfields
  514. * @param $value
  515. */
  516. function tripal_chado_field_storage_recurse_subfilters($chado_table, $subfields, $value) {
  517. $sub_value = array();
  518. // Get the subvalue for this iteration
  519. $subfield = array_shift($subfields);
  520. // Get the cvterms mapped to this table.
  521. $columns = db_select('chado_semweb', 'CS')
  522. ->fields('CS', array('chado_column', 'cvterm_id'))
  523. ->condition('chado_table', $chado_table)
  524. ->execute();
  525. // Iterate through the columns and find the one with cvterm that matches
  526. // the subfield name.
  527. $chado_column = '';
  528. while($column = $columns->fetchObject()) {
  529. $cvterm_id = $column->cvterm_id;
  530. $cvterm = tripal_get_cvterm(array('cvterm_id' => $cvterm_id));
  531. // Convert the term name to lower-case and replace spaces with underscores
  532. // so we can perform case insensitive comparisions and ingore spacing.
  533. $term_name = strtolower(preg_replace('/ /', '_', $cvterm->name));
  534. if ($subfield == $term_name) {
  535. $chado_column = $column->chado_column;
  536. }
  537. }
  538. // If we have more subfields then this should be a foreign key and we should
  539. // recurse.
  540. if (count($subfields) > 0) {
  541. // Get the foreign keys for this Chado table.
  542. $schema = chado_get_schema($chado_table);
  543. $fkeys = $schema['foreign keys'];
  544. // Iterate through the FKs to find the one that matches this Chado field.
  545. foreach ($fkeys as $fk_table => $details) {
  546. foreach ($details['columns'] as $lkey => $rkey) {
  547. if ($lkey == $chado_column) {
  548. $sub_value = tripal_chado_field_storage_recurse_subfilters($fk_table, $subfields, $value);
  549. return array($chado_column => $sub_value);
  550. }
  551. }
  552. }
  553. }
  554. return array($chado_column => $value);
  555. }