tripal_chado.field_storage.inc 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615
  1. <?php
  2. /**
  3. * Implements hook_field_storage_info().
  4. */
  5. function tripal_chado_field_storage_info() {
  6. return array(
  7. 'field_chado_storage' => array(
  8. 'label' => t('Chado'),
  9. 'description' => t('Stores fields in the local Chado database.'),
  10. 'settings' => array(),
  11. // The logo_url key is supported by Tripal. It's not a Drupal key. It's
  12. // used for adding a logo or picture for the data store to help make it
  13. // more easily recognized on the field_ui_field_overview_form. Ideally
  14. // the URL should point to a relative path on the local Drupal site.
  15. 'logo_url' => url(drupal_get_path('module', 'tripal') . '/theme/images/250px-ChadoLogo.png'),
  16. ),
  17. );
  18. }
  19. /**
  20. * Implements hook_field_storage_write().
  21. */
  22. function tripal_chado_field_storage_write($entity_type, $entity, $op, $fields) {
  23. // Get the bundle and the term for this entity.
  24. $bundle = tripal_load_bundle_entity(array('name' => $entity->bundle));
  25. $term = entity_load('TripalTerm', array('id' => $entity->term_id));
  26. $term = reset($term);
  27. // Convert the Tripal term entity into the appropriate record in Chado.
  28. $dbxref = tripal_get_dbxref(array('accession' => $term->accession, 'db_id' => array('name' => $term->vocab->vocabulary)));
  29. $cvterm = tripal_get_cvterm(array('dbxref_id' => $dbxref->dbxref_id));
  30. // Get the base table, type field and record_id from the entity.
  31. $base_table = $entity->chado_table;
  32. $type_field = $entity->chado_column;
  33. $record = $entity->chado_record;
  34. $record_id = $entity->chado_record_id;
  35. $base_schema = chado_get_schema($base_table);
  36. $base_pkey = $base_schema['primary key'][0];
  37. // Convert the fields into a key/value list of fields and their values.
  38. $field_vals = tripal_chado_field_storage_write_merge_fields($fields, $entity_type, $entity);
  39. // First, write the record for the base table. If we have a record id then
  40. // this is an upate and we need to set the primary key. If not, then this
  41. // is an insert and we need to set the type_id if the table supports it.
  42. $values = $field_vals[$base_table][0];
  43. if ($record_id) {
  44. $values[$base_pkey] = $record_id;
  45. }
  46. elseif ($type_field) {
  47. $values[$type_field] = $cvterm->cvterm_id;
  48. }
  49. $base_record_id = tripal_chado_field_storage_write_table($base_table, $values);
  50. // If this is an insert then add the chado_entity record.
  51. if ($op == FIELD_STORAGE_INSERT) {
  52. // Add a record to the chado_entity table so that the data for the
  53. // fields can be pulled from Chado when loaded the next time.
  54. $record = array(
  55. 'entity_id' => $entity->id,
  56. 'record_id' => $base_record_id,
  57. 'data_table' => $base_table,
  58. 'type_table' => $base_table,
  59. 'field' => $type_field,
  60. );
  61. $success = drupal_write_record('chado_entity', $record);
  62. if (!$success) {
  63. drupal_set_message('Unable to insert new Chado entity.', 'error');
  64. }
  65. }
  66. // Now that we have handled the base table, we need to handle linking tables.
  67. foreach ($field_vals as $table_name => $details) {
  68. // Skip the base table as we've already dealt with it.
  69. if ($table_name == $base_table) {
  70. continue;
  71. }
  72. foreach ($details as $delta => $values) {
  73. $record_id = tripal_chado_field_storage_write_table($table_name, $values);
  74. }
  75. }
  76. }
  77. /**
  78. * Write (inserts/updates) a nested array of values for a table.
  79. *
  80. * The $values array is of the same format used by chado_insert_record() and
  81. * chado_update_record(). However, both of those methods will use any nested
  82. * arrays (i.e. representing foreign keys) to select an appropriate record ID
  83. * that can be substituted as the value. Here, the nested arrays are
  84. * either inserted or updated as well, but the choice is determined if the
  85. * primary key value is present. If present an update occurs, if not present
  86. * then an insert occurs.
  87. *
  88. * This function is recursive and nested arrays from the lowest point of the
  89. * "tree" are dealt with first.
  90. *
  91. * @param $table_name
  92. * The name of the table on which the insertion/update is performed.
  93. * @param $values
  94. * The values array for the insertion.
  95. * @throws Exception
  96. * @return
  97. * The unique record ID.
  98. */
  99. function tripal_chado_field_storage_write_table($table_name, $values) {
  100. $schema = chado_get_schema($table_name);
  101. $fkeys = $schema['foreign keys'];
  102. $pkey = $schema['primary key'][0];
  103. // Before inserting or updating this table, recurse if there are any
  104. // nested FK array values.
  105. foreach ($values as $column => $value) {
  106. // If this value is an array then it must be a FK... let's recurse.
  107. if (is_array($value)) {
  108. // Find the name of the FK table for this column.
  109. $fktable_name = '';
  110. foreach ($fkeys as $fktable => $details) {
  111. foreach ($details['columns'] as $fkey_lcolumn => $fkey_rcolumn) {
  112. if ($fkey_lcolumn == $column) {
  113. $fktable_name = $fktable;
  114. }
  115. }
  116. }
  117. // Recurse on this recod.
  118. $record_id = tripal_chado_field_storage_write_table($fktable_name, $values[$column]);
  119. $values[$column] = $record_id;
  120. }
  121. }
  122. // Fields with a cardinality greater than 1 will often submit an
  123. // empty form. We want to remove these empty submissions. We can detect
  124. // them if all of the fields are empty.
  125. $num_empty = 0;
  126. foreach ($values as $column => $value) {
  127. if (!$value) {
  128. $num_empty++;
  129. }
  130. }
  131. if ($num_empty == count(array_keys($values))) {
  132. return '';
  133. }
  134. // If the primary key column has a value then this will be an udpate,
  135. // otherwise it's an insert.
  136. if (!array_key_exists($pkey, $values) or !$values[$pkey] or !isset($values[$pkey])) {
  137. // Before inserting, we want to make sure the record does not
  138. // already exist. Using the unique constraint check for a matching record.
  139. $options = array('is_duplicate' => TRUE);
  140. $is_duplicate = chado_select_record($table_name, array('*'), $values, $options);
  141. if($is_duplicate) {
  142. $record = chado_select_record($table_name, array('*'), $values);
  143. return $record[0]->$pkey;
  144. }
  145. // Insert the values array as a new record in the table but remove the
  146. // pkey as it should be set.
  147. $new_vals = $values;
  148. unset($new_vals[$pkey]);
  149. $record = chado_insert_record($table_name, $new_vals);
  150. if ($record === FALSE) {
  151. throw new Exception('Could not insert Chado record into table: "' . $table_name . '".');
  152. }
  153. return $record[$pkey];
  154. }
  155. // We have an incoming record_id so this is an update.
  156. else {
  157. // TODO: what if the unique constraint matches another record? That is
  158. // not being tested for here.
  159. $match[$pkey] = $values[$pkey];
  160. if (!chado_update_record($table_name, $match, $values)) {
  161. drupal_set_message("Could not update Chado record in table: $table_name.", 'error');
  162. }
  163. return $values[$pkey];
  164. }
  165. }
  166. /**
  167. * Implements hook_field_storage_load().
  168. *
  169. * Responsible for loading the fields from the Chado database and adding
  170. * their values to the entity.
  171. */
  172. function tripal_chado_field_storage_load($entity_type, $entities, $age,
  173. $fields, $options) {
  174. $load_current = $age == FIELD_LOAD_CURRENT;
  175. global $language;
  176. $langcode = $language->language;
  177. foreach ($entities as $id => $entity) {
  178. if (property_exists($entity, 'chado_table')) {
  179. // Get the base table and record id for the fields of this entity.
  180. $base_table = $entity->chado_table;
  181. $type_field = $entity->chado_column;
  182. $record_id = $entity->chado_record_id;
  183. }
  184. else {
  185. // Get the base table and record id for the fields of this entity.
  186. $details = db_select('chado_entity', 'ce')
  187. ->fields('ce')
  188. ->condition('entity_id', $entity->id)
  189. ->execute()
  190. ->fetchObject();
  191. if (!$details) {
  192. // TODO: what to do if record is missing!
  193. }
  194. // Get some values needed for loading the values from Chado.
  195. $base_table = isset($details->data_table) ? $details->data_table : '';
  196. $type_field = isset($details->field) ? $details->field : '';
  197. $record_id = isset($details->record_id) ? $details->record_id : '';
  198. }
  199. // Get this table's schema.
  200. $schema = chado_get_schema($base_table);
  201. $pkey_field = $schema['primary key'][0];
  202. // Get the base record if one exists
  203. $columns = array('*');
  204. $match = array($pkey_field => $record_id);
  205. $record = chado_generate_var($base_table, $match);
  206. $entity->chado_record = $record;
  207. // For now, expand all 'text' fields.
  208. // TODO: we want to be a bit smarter and allow the user to configure this
  209. // for now we'll expand.
  210. if (isset($schema['fields'])) {
  211. foreach ($schema['fields'] as $field_name => $details) {
  212. if ($schema['fields'][$field_name]['type'] == 'text') {
  213. $record = chado_expand_var($record, 'field', $base_table . '.' . $field_name);
  214. }
  215. }
  216. }
  217. // Iterate through the entity's fields so we can get the column names
  218. // that need to be selected from each of the tables represented.
  219. $tables = array();
  220. foreach ($fields as $field_id => $ids) {
  221. // By the time this hook runs, the relevant field definitions have been
  222. // populated and cached in FieldInfo, so calling field_info_field_by_id()
  223. // on each field individually is more efficient than loading all fields in
  224. // memory upfront with field_info_field_by_ids().
  225. $field = field_info_field_by_id($field_id);
  226. $field_name = $field['field_name'];
  227. $field_type = $field['type'];
  228. $field_module = $field['module'];
  229. // Skip fields that don't map to a Chado table (e.g. kvproperty_adder).
  230. if (!array_key_exists('settings', $field) or !array_key_exists('chado_table', $field['settings'])) {
  231. continue;
  232. }
  233. // Get the Chado table and column for this field.
  234. $field_table = $field['settings']['chado_table'];
  235. $field_column = $field['settings']['chado_column'];
  236. // There are only two types of fields: 1) fields that represent a single
  237. // column of the base table, or 2) fields that represent a linked record
  238. // in a many-to-one relationship with the base table.
  239. // Type 1: fields from base tables.
  240. if ($field_table == $base_table) {
  241. // Set an empty value by default, and if there is a record, then update.
  242. $entity->{$field_name}['und'][0]['value'] = '';
  243. if ($record and property_exists($record, $field_column)) {
  244. // If the field column is an object then it's a FK to another table.
  245. // and because $record object is created by the chado_generate_var()
  246. // function we must go one more level deeper to get the value
  247. if (is_object($record->$field_column)) {
  248. $entity->{$field_name}['und'][0]['chado' . $field_table . '__' . $field_column] = $record->$field_column->$field_column;
  249. }
  250. else {
  251. // For non FK fields we'll make the field value be the same
  252. // as the column value.
  253. $entity->{$field_name}['und'][0]['value'] = $record->$field_column;
  254. $entity->{$field_name}['und'][0]['chado' . $field_table . '__' . $field_column] = $record->$field_column;
  255. }
  256. }
  257. // Allow the creating module to alter the value if desired. The
  258. // module should do this if the field has any other form elements
  259. // that need populationg besides the value which was set above.
  260. tripal_load_include_field_type($field_type);
  261. if (preg_match('/^chado/', $field_type) and class_exists($field_type)) {
  262. $tfield = new $field_type($field);
  263. $tfield->load($entity, array('record' => $record));
  264. }
  265. }
  266. // Type 2: fields for linked records. These fields will have any number
  267. // of form elements that might need populating so we'll offload the
  268. // loading of these fields to the field itself.
  269. if ($field_table != $base_table) {
  270. // Set an empty value by default, and let the hook function update it.
  271. $entity->{$field_name}['und'][0]['value'] = '';
  272. tripal_load_include_field_type($field_type);
  273. if (class_exists($field_type) && method_exists($field_type, 'load')) {
  274. $tfield = new $field_type($field);
  275. $tfield->load($entity, array('record' => $record));
  276. }
  277. }
  278. } // end: foreach ($fields as $field_id => $ids) {
  279. } // end: foreach ($entities as $id => $entity) {
  280. }
  281. /**
  282. * Merges the values of all fields into a single array keyed by table name.
  283. */
  284. function tripal_chado_field_storage_write_merge_fields($fields, $entity_type, $entity) {
  285. $new_fields = array();
  286. // Iterate through all of the fields and organize them into a
  287. // new fields array keyed by the table name
  288. foreach ($fields as $field_id => $ids) {
  289. // Get the field name and information about it.
  290. $field = field_info_field_by_id($field_id);
  291. $field_name = $field['field_name'];
  292. // Some fields (e.g. chado_linker_cvterm_adder) don't add data to
  293. // Chado so they don't have a table, but they are still attached to the
  294. // entity. Just skip these.
  295. if (!array_key_exists('chado_table', $field['settings'])) {
  296. continue;
  297. }
  298. $chado_table = $field['settings']['chado_table'];
  299. $chado_column = $field['settings']['chado_column'];
  300. // Iterate through the field's items. Fields with cardinality ($delta) > 1
  301. // are multi-valued.
  302. $items = field_get_items($entity_type, $entity, $field_name);
  303. foreach ($items as $delta => $item) {
  304. // A field may have multiple items. The field can use items
  305. // indexed with "chado-" to represent values that should map directly
  306. // to chado tables and fields.
  307. foreach ($item as $item_name => $value) {
  308. $matches = array();
  309. if (preg_match('/^chado-(.*?)__(.*?)$/', $item_name, $matches)) {
  310. $table_name = $matches[1];
  311. $column_name = $matches[2];
  312. // If not seen this table and column then just add it. If we've
  313. // already seen it then it means it's a FK field and we've already
  314. // added subfields so do nothing.
  315. if (!array_key_exists($table_name, $new_fields) or
  316. !array_key_exists($delta, $new_fields[$table_name]) or
  317. !array_key_exists($column_name, $new_fields[$table_name][$delta])) {
  318. $new_fields[$table_name][$delta][$column_name] = $value;
  319. }
  320. }
  321. }
  322. // If there is no value set for the field using the
  323. // chado-[table_name]__[field name] naming schema then check if a 'value' item
  324. // is present and if so use that.
  325. if ((!array_key_exists($chado_table, $new_fields) or
  326. !array_key_exists($delta, $new_fields[$chado_table]) or
  327. !array_key_exists($chado_column, $new_fields[$chado_table][$delta])) and
  328. array_key_exists('value', $items[$delta]) and
  329. !is_array($items[$delta]['value'])) {
  330. $new_fields[$chado_table][$delta][$chado_column] = $items[$delta]['value'];
  331. }
  332. }
  333. }
  334. return $new_fields;
  335. }
  336. /**
  337. * Recurses through a field's items breaking it into a nested array.
  338. */
  339. function tripal_chado_field_storage_expand_field($item_name, $value) {
  340. $matches = array();
  341. if (preg_match('/^(.*?)--(.*?)$/', $item_name, $matches)) {
  342. $parent_item_name = $matches[1];
  343. $sub_item_name = $matches[2];
  344. $sub_item = tripal_chado_field_storage_expand_field($sub_item_name, $value);
  345. return array($parent_item_name => $sub_item);
  346. }
  347. else {
  348. return array($item_name => $value);
  349. }
  350. }
  351. /**
  352. * Implements hook_field_storage_query().
  353. */
  354. function tripal_chado_field_storage_query($query) {
  355. //print_r($query->fieldConditions);
  356. // The conditions and order bys are reorganized into a filters array for the
  357. // chado_select_record function()
  358. $filters = array();
  359. // Iterate through all the conditions and add to the filters array
  360. // a chado_select_record compatible set of filters.
  361. foreach ($query->fieldConditions as $index => $condition) {
  362. $field = $condition['field'];
  363. // Skip conditions that don't belong to this storage type.
  364. if ($field['storage']['type'] != 'field_chado_storage') {
  365. continue;
  366. }
  367. $column = $condition['column'];
  368. $value = $condition['value'];
  369. $field_type = $field['type'];
  370. $field_module = $field['module'];
  371. $settings = $field['settings'];
  372. $chado_table = $settings['chado_table'];
  373. $chado_column = $settings['chado_column'];
  374. // Set the value for this field search.
  375. $subfields = explode('.', $column);
  376. //print_r($subfields);
  377. if (count($subfields) > 1) {
  378. // Get the term for this field's column and replace the field_name with
  379. // the term. We need to do this for the recursive function to work.
  380. // We must lowercase the term and underscore it because that's how we
  381. // can support case-insensitivity and lack of spacing such as for
  382. // web services.
  383. $subfield1 = tripal_get_chado_semweb_term($chado_table, $chado_column, array('return_object' => TRUE));
  384. $subfields[0] = strtolower(preg_replace('/ /', '_', $subfield1->name));
  385. $value = tripal_chado_field_storage_recurse_subfilters($chado_table, $subfields, $value);
  386. $value = array_shift($value);
  387. }
  388. else {
  389. $value = $condition['value'];
  390. }
  391. // Use the appropriate operator.
  392. $operator = $condition['operator'] ? $condition['operator'] : '=';
  393. switch ($operator) {
  394. case '=':
  395. $filters[$chado_table][$chado_column] = $value;
  396. break;
  397. case '>':
  398. case '>=':
  399. case '<':
  400. case '<=':
  401. $filters[$chado_table][$chado_column] = array(
  402. 'op' => $operator,
  403. 'data' => $value,
  404. );
  405. break;
  406. case '<>':
  407. $filters[$chado_table][$chado_column] = array(
  408. 'op' => '<>',
  409. 'data' => $value,
  410. );
  411. break;
  412. case 'CONTAINS':
  413. $filters[$chado_table][$chado_column] = array(
  414. 'op' => 'LIKE',
  415. 'data' => '%' . $value . '%',
  416. );
  417. break;
  418. case 'NOT':
  419. $filters[$chado_table][$chado_column] = array(
  420. 'op' => 'NOT LIKE',
  421. 'data' => '%' . $value . '%',
  422. );
  423. break;
  424. case 'STARTS WITH':
  425. $filters[$chado_table][$chado_column] = array(
  426. 'op' => 'LIKE',
  427. 'data' => $value . '%',
  428. );
  429. break;
  430. case 'NOT STARTS':
  431. $filters[$chado_table][$chado_column] = array(
  432. 'op' => 'NOT LIKE',
  433. 'data' => $value . '%',
  434. );
  435. break;
  436. case 'ENDS WITH':
  437. $filters[$chado_table][$chado_column] = array(
  438. 'op' => 'LIKE',
  439. 'data' => '%' . $value,
  440. );
  441. break;
  442. case 'NOT ENDS':
  443. $filters[$chado_table][$chado_column] = array(
  444. 'op' => 'NOT LIKE',
  445. 'data' => '%' . $value,
  446. );
  447. break;
  448. default:
  449. // unrecognized operation.
  450. break;
  451. }
  452. }
  453. // Now get the list for sorting.
  454. foreach ($query->order as $index => $sort) {
  455. $field = $sort['specifier']['field'];
  456. // Skip sorts that don't belong to this storage type.
  457. if ($field['storage']['type'] != 'field_chado_storage') {
  458. continue;
  459. }
  460. $direction = $sort['direction'];
  461. $field_type = $field['type'];
  462. $field_module = $field['module'];
  463. $settings = $field['settings'];
  464. $chado_table = $settings['chado_table'];
  465. $chado_column = $settings['chado_column'];
  466. $sorting[$chado_table][$chado_column] = $direction;
  467. }
  468. // Iterate through the filters and perform the query
  469. $entity_ids = array();
  470. foreach ($filters as $chado_table => $values) {
  471. //print_r($chado_table);
  472. //print_r($values);
  473. // First get the matching record IDs from the Chado table.
  474. $schema = chado_get_schema($chado_table);
  475. $pkey = $schema['primary key'][0];
  476. $results = chado_select_record($chado_table, array($pkey), $values);
  477. $record_ids = array();
  478. foreach ($results as $result) {
  479. $record_ids[] = $result->$pkey;
  480. }
  481. // Next look for matching IDs in the chado_entity table.
  482. $filter_ids = array();
  483. if (count($record_ids) > 0) {
  484. $select = db_select('chado_entity', 'CE');
  485. $select->join('tripal_entity', 'TE', 'TE.id = CE.entity_id');
  486. $select->fields('CE', array('entity_id'));
  487. $select->fields('TE', array('bundle'));
  488. $select->condition('record_id', $record_ids);
  489. // If a bundle is specified then make sure we match on the bundle.
  490. if (array_key_exists('bundle', $query->entityConditions)) {
  491. $select->condition('bundle', $query->entityConditions['bundle']);
  492. }
  493. $results = $select->execute();
  494. while ($result = $results->fetchObject()) {
  495. $entity_ids[] = array($result->entity_id, 0, $result->bundle);
  496. }
  497. }
  498. }
  499. $result = array(
  500. 'TripalEntity' => array()
  501. );
  502. foreach ($entity_ids as $ids) {
  503. $result['TripalEntity'][$ids[0]] = entity_create_stub_entity('TripalEntity', $ids);
  504. }
  505. return $result;
  506. }
  507. /**
  508. *
  509. * @param $subfields
  510. * @param $value
  511. */
  512. function tripal_chado_field_storage_recurse_subfilters($chado_table, $subfields, $value) {
  513. $sub_value = array();
  514. // Get the subvalue for this iteration
  515. $subfield = array_shift($subfields);
  516. // Get the cvterms mapped to this table.
  517. $columns = db_select('chado_semweb', 'CS')
  518. ->fields('CS', array('chado_column', 'cvterm_id'))
  519. ->condition('chado_table', $chado_table)
  520. ->execute();
  521. // Iterate through the columns and find the one with cvterm that matches
  522. // the subfield name.
  523. $chado_column = '';
  524. while($column = $columns->fetchObject()) {
  525. $cvterm_id = $column->cvterm_id;
  526. $cvterm = tripal_get_cvterm(array('cvterm_id' => $cvterm_id));
  527. // Convert the term name to lower-case and replace spaces with underscores
  528. // so we can perform case insensitive comparisions and ingore spacing.
  529. $term_name = strtolower(preg_replace('/ /', '_', $cvterm->name));
  530. if ($subfield == $term_name) {
  531. $chado_column = $column->chado_column;
  532. }
  533. }
  534. // If we have more subfields then this should be a foreign key and we should
  535. // recurse.
  536. if (count($subfields) > 0) {
  537. // Get the foreign keys for this Chado table.
  538. $schema = chado_get_schema($chado_table);
  539. $fkeys = $schema['foreign keys'];
  540. // Iterate through the FKs to find the one that matches this Chado field.
  541. foreach ($fkeys as $fk_table => $details) {
  542. foreach ($details['columns'] as $lkey => $rkey) {
  543. if ($lkey == $chado_column) {
  544. $sub_value = tripal_chado_field_storage_recurse_subfilters($fk_table, $subfields, $value);
  545. return array($chado_column => $sub_value);
  546. }
  547. }
  548. }
  549. }
  550. return array($chado_column => $value);
  551. }