tripal_chado.cv.api.inc 54 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668
  1. <?php
  2. /**
  3. * @file
  4. * This module provides a set of functions to simplify working with
  5. * controlled vocabularies.
  6. */
// NOTE(review): this bare expression statement neither declares nor
// initialises anything. tripal_update_cvtermpath_loop() accesses the variable
// through `global $loop_data`, where it reads as empty until that function
// assigns it.
$loop_data;
/**
 * @defgroup tripal_chado_api Controlled Vocabulary API
 * @ingroup tripal_api
 * This module provides a set of functions to simplify working with
 * controlled vocabularies. Most of the API functions deal with retrieving
 * terms or their parent vocabularies.
 *
 * However, the API also supports the generation of trees for browsing a
 * vocabulary, as well as the generation of pie graphs for displaying
 * hierarchical counts of terms. Version 0.3b of Tripal provides a feature
 * browser and a feature summary chart that use the API functions provided
 * here, but in general charts and trees can be created for any controlled
 * vocabulary.
 */
  23. /**
  24. * Retrieves a chado controlled vocabulary variable
  25. *
  26. * @param $identifier
  27. * An array with the key stating what the identifier is. Supported keys (only on of the
  28. * following unique keys is required):
  29. * - cv_id: the chado cv.cv_id primary key
  30. * - name: the chado cv.name field (assume unique)
  31. * @param $options
  32. * An array of options. Supported keys include:
  33. * - Any keys supported by chado_generate_var(). See that function definition for
  34. * additional details.
  35. *
  36. * NOTE: the $identifier parameter can really be any array similar to $values passed into
  37. * chado_select_record(). It should fully specify the cv record to be returned.
  38. *
  39. * @return
  40. * If unique values were passed in as an identifier then an object describing the cv
  41. * will be returned (will be a chado variable from chado_generate_var()). Otherwise,
  42. * FALSE will be returned.
  43. *
  44. * @ingroup tripal_chado_api
  45. */
  46. function tripal_get_cv($identifiers, $options = array()) {
  47. // Set Defaults
  48. if (!isset($options['include_fk'])) {
  49. // Tells chado_generate_var not to follow any foreign keys
  50. $options['include_fk'] = array();
  51. }
  52. // Error Checking of parameters
  53. if (!is_array($identifiers)) {
  54. tripal_report_error(
  55. 'tripal_chado_api',
  56. TRIPAL_ERROR,
  57. "tripal_get_cv: The identifier passed in is expected to be an array with the key
  58. matching a column name in the cv table (ie: cv_id or name). You passed in %identifier.",
  59. array(
  60. '%identifier'=> print_r($identifiers, TRUE)
  61. )
  62. );
  63. }
  64. elseif (empty($identifiers)) {
  65. tripal_report_error(
  66. 'tripal_chado_api',
  67. TRIPAL_ERROR,
  68. "tripal_get_cv: You did not pass in anything to identify the cv you want. The identifier
  69. is expected to be an array with the key matching a column name in the cv table
  70. (ie: cv_id or name). You passed in %identifier.",
  71. array(
  72. '%identifier'=> print_r($identifiers, TRUE)
  73. )
  74. );
  75. }
  76. // Try to get the cv
  77. $cv = chado_generate_var(
  78. 'cv',
  79. $identifiers,
  80. $options
  81. );
  82. // Ensure the cv is singular. If it's an array then it is not singular
  83. if (is_array($cv)) {
  84. tripal_report_error(
  85. 'tripal_chado_api',
  86. TRIPAL_ERROR,
  87. "tripal_get_cv: The identifiers you passed in were not unique. You passed in %identifier.",
  88. array(
  89. '%identifier'=> print_r($identifiers, TRUE)
  90. )
  91. );
  92. }
  93. // Report an error if $cv is FALSE since then chado_generate_var has failed
  94. elseif ($cv === FALSE) {
  95. tripal_report_error(
  96. 'tripal_chado_api',
  97. TRIPAL_ERROR,
  98. "tripal_get_cv: chado_generate_var() failed to return a cv based on the identifiers
  99. you passed in. You should check that your identifiers are correct, as well as, look
  100. for a chado_generate_var error for additional clues. You passed in %identifier.",
  101. array(
  102. '%identifier'=> print_r($identifiers, TRUE)
  103. )
  104. );
  105. }
  106. // Else, as far we know, everything is fine so give them their cv :)
  107. else {
  108. return $cv;
  109. }
  110. }
  111. /**
  112. * Create an options array to be used in a form element which provides a
  113. * list of all chado cvs
  114. *
  115. * @return
  116. * An array(cv_id => name) for each cv in the chado cv table
  117. *
  118. * @ingroup tripal_chado_api
  119. */
  120. function tripal_get_cv_select_options() {
  121. $results = chado_select_record('cv', array('cv_id', 'name'), array(), array('order_by' => array('name' => 'ASC')));
  122. $options = array();
  123. $options[] = 'Select a Vocabulary';
  124. foreach ($results as $r) {
  125. $options[$r->cv_id] = $r->name;
  126. }
  127. return $options;
  128. }
  129. /**
  130. * Retrieves a chado controlled vocabulary term variable
  131. *
  132. * @param $identifier
  133. * An array apropriate for use with the chado_generate_var for uniquely
  134. * identifying a cvterm record. Alternativley, there are also some specially
  135. * handled keys. They are:
  136. * - id: an ID for the term of the for [dbname]:[accession], where [dbname]
  137. * is the short name of the vocabulary and accession is the unique ID.
  138. * - cv_id: an integer indicating the cv_id or an array with 'name' => the
  139. * name of the cv.
  140. * - synonym: an array with 'name' => the name of the synonym of the cvterm
  141. * you want returned; 'cv_id' => the cv_id of the synonym; 'cv_name' =>
  142. * the name of the cv of the synonym
  143. * - property: An array/object describing the property to select records
  144. * for. It should at least have either a type_name (if unique across cvs)
  145. * or type_id. Other supported keys include: cv_id/cv_name (of the type),
  146. * value and rank
  147. * @param $options
  148. * An array of options. Supported keys include:
  149. * - Any keys supported by chado_generate_var(). See that function
  150. * definition for additional details.
  151. *
  152. * NOTE: the $identifier parameter can really be any array similar to $values
  153. * passed into chado_select_record(). It should fully specify the cvterm
  154. * record to be returned.
  155. *
  156. * @return
  157. * If unique values were passed in as an identifier then an object describing
  158. * the cvterm will be returned (will be a chado variable from
  159. * chado_generate_var()). Otherwise, FALSE will be returned.
  160. *
  161. * @ingroup tripal_cv_api
  162. */
  163. function tripal_get_cvterm($identifiers, $options = array()) {
  164. // Set Defaults
  165. if (!isset($options['include_fk'])) {
  166. // Tells chado_generate_var to only get the cv
  167. $options['include_fk'] = array('cv_id' => TRUE);
  168. }
  169. // Error Checking of parameters
  170. if (!is_array($identifiers)) {
  171. tripal_report_error('tripal_cv_api', TRIPAL_ERROR,
  172. "tripal_get_cvterm: The identifier passed in is expected to be an array with the key
  173. matching a column name in the cvterm table (ie: cvterm_id or name). You passed in %identifier.",
  174. array('%identifier'=> print_r($identifiers, TRUE))
  175. );
  176. }
  177. elseif (empty($identifiers)) {
  178. tripal_report_error('tripal_cv_api', TRIPAL_ERROR,
  179. "tripal_get_cvterm: You did not pass in anything to identify the cvterm you want. The identifier
  180. is expected to be an array with the key matching a column name in the cvterm table
  181. (ie: cvterm_id or name). You passed in %identifier.",
  182. array('%identifier'=> print_r($identifiers, TRUE))
  183. );
  184. }
  185. // If synonym was passed in, then process this first before calling chado_generate_var()
  186. if (isset($identifiers['synonym'])) {
  187. $synonym = $identifiers['synonym']['name'];
  188. $values = array('synonym' => $synonym);
  189. if (isset($identifiers['synonym']['cv_id'])) {
  190. $values['cvterm_id'] = array('cv_id' => $identifiers['synonym']['cv_id']);
  191. }
  192. if (isset($identifiers['synonym']['cv_name'])) {
  193. $values['cvterm_id'] = array('cv_id' => array('name' => $identifiers['synonym']['cv_name']));
  194. }
  195. $options = array(
  196. 'case_insensitive_columns' => array('name')
  197. );
  198. $result = chado_select_record('cvtermsynonym', array('cvterm_id'), $values, $options);
  199. // if the synonym doens't exist or more than one record is returned then return false
  200. if (count($result) == 0) {
  201. return FALSE;
  202. }
  203. if (count($result) > 1) {
  204. return FALSE;
  205. }
  206. $identifiers = array('cvterm_id' => $result[0]->cvterm_id);
  207. }
  208. // If one of the identifiers is property then use chado_get_record_with_property()
  209. if (isset($identifiers['property'])) {
  210. $property = $identifiers['property'];
  211. unset($identifiers['property']);
  212. $cvterm = chado_get_record_with_property(
  213. array('table' => 'cvterm', 'base_records' => $identifiers),
  214. array('type_name' => $property),
  215. $options
  216. );
  217. }
  218. if (isset($identifiers['id'])) {
  219. list($db_name, $accession) = preg_split('/:/', $identifiers['id']);
  220. $cvterm = chado_generate_var('cvterm',array(
  221. 'dbxref_id' => array(
  222. 'db_id' => array(
  223. 'name' => $db_name,
  224. ),
  225. 'accession' => $accession,
  226. )
  227. ));
  228. }
  229. // Else we have a simple case and we can just use chado_generate_var to get the cvterm
  230. else {
  231. // Try to get the cvterm
  232. $cvterm = chado_generate_var('cvterm', $identifiers, $options);
  233. }
  234. // Ensure the cvterm is singular. If it's an array then it is not singular
  235. if (is_array($cvterm)) {
  236. tripal_report_error(
  237. 'tripal_cv_api',
  238. TRIPAL_ERROR,
  239. "tripal_get_cvterm: The identifiers you passed in were not unique. You passed in %identifier.",
  240. array(
  241. '%identifier'=> print_r($identifiers, TRUE)
  242. )
  243. );
  244. }
  245. // Report an error if $cvterm is FALSE since then chado_generate_var has failed
  246. elseif ($cvterm === FALSE) {
  247. tripal_report_error(
  248. 'tripal_cv_api',
  249. TRIPAL_ERROR,
  250. "tripal_get_cvterm: chado_generate_var() failed to return a cvterm based on the identifiers
  251. you passed in. You should check that your identifiers are correct, as well as, look
  252. for a chado_generate_var error for additional clues. You passed in %identifier.",
  253. array(
  254. '%identifier'=> print_r($identifiers, TRUE)
  255. )
  256. );
  257. }
  258. // Else, as far we know, everything is fine so give them their cvterm :)
  259. else {
  260. return $cvterm;
  261. }
  262. }
  263. /**
  264. * Create an options array to be used in a form element
  265. * which provides a list of all chado cvterms
  266. *
  267. * @param $cv_id
  268. * The chado cv_id; only cvterms with the supplied cv_id will be returned
  269. * @param $rel_type
  270. * Set to TRUE if the terms returned should only be relationship types in
  271. * the vocabulary. This is useful for creating drop-downs of terms
  272. * used for relationship linker tables.
  273. *
  274. * @return
  275. * An associative array with the cvterm_id's as keys. The first
  276. * element in the array has a key of '0' and a value of 'Select a Type'
  277. *
  278. * @ingroup tripal_chado_api
  279. */
  280. function tripal_get_cvterm_select_options($cv_id, $rel_type = FALSE) {
  281. $columns = array('cvterm_id', 'name');
  282. $values = array('cv_id' => $cv_id);
  283. if ($rel_type) {
  284. $values['is_relationshiptype'] = 1;
  285. }
  286. $s_options = array('order_by' => array('name' => 'ASC'));
  287. $cvterms = chado_select_record('cvterm', $columns, $values, $s_options);
  288. $options = array();
  289. $options[0] = 'Select a Type';
  290. foreach ($cvterms as $cvterm) {
  291. $options[$cvterm->cvterm_id] = $cvterm->name;
  292. }
  293. return $options;
  294. }
  295. /**
  296. * Updates the cvtermpath table of Chado for the specified CV.
  297. *
  298. * @param $cv_id
  299. * The chado cv_id;
  300. * @param $job_id
  301. * This function is intended to be used with the Tripal Jobs API.
  302. * When this function is called as a job the $job_id is automatically
  303. * passed to this function.
  304. * @return
  305. * TRUE on success FALSE on failure
  306. *
  307. * @ingroup tripal_chado_api
  308. */
  309. function tripal_update_cvtermpath($cv_id, $job_id = NULL) {
  310. // TODO: need better error checking in this function
  311. // first get the controlled vocabulary name:
  312. $sql = "SELECT * FROM {cv} WHERE cv_id = :cv_id";
  313. $cv = chado_query($sql, array(':cv_id' => $cv_id))->fetchObject();
  314. print "\nUpdating cvtermpath for $cv->name...\n";
  315. // We need to set the chado schema as active because some of the
  316. // functions call other functions which would not be in scope.
  317. $previous = chado_set_active('chado');
  318. try {
  319. $sql = "SELECT * FROM fill_cvtermpath(:name)";
  320. db_query($sql, array(':name' => $cv->name));
  321. chado_set_active($previous);
  322. }
  323. catch (Exception $e) {
  324. chado_set_active($previous);
  325. $error = $e->getMessage();
  326. tripal_report_error('tripal_chado', TRIPAL_ERROR, "Could not fill cvtermpath table: @error", array('@error' => $error));
  327. return FALSE;
  328. }
  329. return TRUE;
  330. }
  331. /**
  332. * Duplicate of fill_cvtermpath() stored procedure in Chado.
  333. *
  334. * Identifies all of the root terms of the controlled vocabulary. These
  335. * root terms are then processed by calling the
  336. * tripal_update_cvtermpath_root_loop() function on each one.
  337. *
  338. * @param $cvid
  339. * The controlled vocabulary ID from the cv table of Chado (i.e. cv.cv_id).
  340. * @param $job_id
  341. */
  342. function tripal_update_cvtermpath_bak($cv_id, $job_id = NULL){
  343. // TODO: there's a function to determine the current Chado instance.
  344. // we should use that.
  345. $prev_db = chado_set_active('chado');
  346. try {
  347. $result = db_query('
  348. SELECT DISTINCT t.*
  349. FROM cvterm t
  350. LEFT JOIN cvterm_relationship r ON (t.cvterm_id = r.subject_id)
  351. INNER JOIN cvterm_relationship r2 ON (t.cvterm_id = r2.object_id)
  352. WHERE t.cv_id = :cvid AND r.subject_id is null',
  353. array(':cvid' => $cv_id)
  354. );
  355. // Iterate through each root level term.
  356. $record = $result->fetchAll();
  357. foreach ($record as $item){
  358. tripal_update_cvtermpath_root_loop($item->cvterm_id, $item->cv_id);
  359. }
  360. }
  361. catch (Exception $e) {
  362. // If there's an exception we have to set the database back. So, do that
  363. // and then rethrow the error.
  364. chado_set_active($prev_db);
  365. throw $e;
  366. }
  367. chado_set_active($prev_db);
  368. }
  369. /**
  370. * Duplicate of _fill_cvtermpath4root() stored procedure in Chado.
  371. *
  372. * This function process a "branch" of the ontology. Initially, the
  373. * "root" starts at the top of the tree. But, as the cvtermpath is populated
  374. * the "root" becomes terms deeper in the tree.
  375. *
  376. * @param $rootid
  377. * The term ID from the cvterm table of Chado (i.e. cvterm.cvterm_id).
  378. * @param $cvid
  379. * The controlled vocabulary ID from the cv table of Chado (i.e. cv.cv_id).
  380. */
  381. function tripal_update_cvtermpath_root_loop($rootid, $cvid){
  382. // Get's the cvterm record for this "root".
  383. chado_set_active('chado');
  384. $ttype = db_select('cvterm', 'cv')
  385. ->fields('cv', array('cvterm_id'));
  386. $db_or = db_or();
  387. $db_or->condition('cv.name', "isa", '=');
  388. $db_or->condition('cv.name', "is_a", '=');
  389. $ttype->condition($db_or);
  390. $result = $ttype->execute()->fetchObject();
  391. // Descends through the branch starting at this "root" term.
  392. tripal_update_cvtermpath_loop($rootid, $rootid, $cvid, $result->cvterm_id, 0, 0, array());
  393. // Get's the children terms of this "root" term and then recursively calls
  394. // this function making each child root.
  395. $cterm = db_query(
  396. 'SELECT *
  397. FROM cvterm_relationship
  398. WHERE object_id = :rootid
  399. ',
  400. array(':rootid' => $rootid)
  401. );
  402. while($cterm_result = $cterm->fetchAssoc()) {
  403. tripal_update_cvtermpath_root_loop($cterm_result['subject_id'], $cvid);
  404. }
  405. }
  406. /**
  407. *
  408. * @param $origin
  409. * The root terms cvterm_id.
  410. * @param $child_id
  411. * The cvterm_id of the current child term. The child term is a descendent
  412. * of the origin.
  413. * @param $cv_id
  414. * The controlled vocabulary ID from the cv table of Chado (i.e. cv.cv_id).
  415. * @param $type_id
  416. * The relationship type between the origin term and the child.
  417. * @param $depth
  418. * The depth of the recursion.
  419. * @param $increment_of_depth.
  420. * An integer ??
  421. * @param $tree_path.
  422. * The array of every term between the current child and the origin. Each
  423. * element in the array is an associative array with the keys:
  424. * -build_id: an string identifier for the child that combines the origin,
  425. * child cvterm_id,cv_id, and the type_id.
  426. * -depth: the depth that a child was inserted into the cvtermpath table.
  427. * @return multitype:
  428. */
  429. function tripal_update_cvtermpath_loop($origin, $child_id, $cv_id, $type_id, $depth,
  430. $increment_of_depth, $tree_path){
  431. // An array of
  432. global $loop_data;
  433. // Check to see if a row with these values already exists.
  434. chado_set_active('chado');
  435. $count = db_query(
  436. 'SELECT *
  437. FROM cvtermpath
  438. WHERE cv_id = :cvid
  439. AND object_id = :origin
  440. AND subject_id = :child_id
  441. AND pathdistance = :depth
  442. ',
  443. array(':cvid' => $cv_id, ':origin' => $origin, ':child_id' => $child_id, ':depth' => $depth)
  444. );
  445. $count_total = $count->rowCount();
  446. // If we've already seen this term then just return, we don't want
  447. // to insert it again.
  448. if ($count_total > 0) {
  449. return $loop_data;
  450. }
  451. // Build the ID.
  452. $child_id = $origin . '|' . $child_id . '|' . $cv_id . '|' . $type_id;
  453. // Now check if the most recent entry already exists in the array.
  454. if ($increment_of_depth != 0 && empty($loop_data)) {
  455. // Search the $tree_path for the new $child_id in the build_id column.
  456. foreach ($tree_path as $parent) {
  457. // If this child is the same as a parent term that has already been
  458. // processed then we have a potential loop.
  459. if ($parent['build_id'] == $child_id) {
  460. // The loop checker function below.
  461. $result_of_loop_checker = tripal_update_cvtermpath_loop_checker($origin,
  462. $child_id, $cv_id, $type_id, $depth, $increment_of_depth, 0,
  463. $parent, array(), $depth);
  464. if (!empty($result_of_loop_checker)) {
  465. $loop_data = $result_of_loop_checker;
  466. //Find the depth of the loop start by finding it in the array_of_children
  467. foreach($tree_path as $children => $child){
  468. if($child['build_id'] == $loop_data['build_id']){
  469. $loop_location = $child['depth'];
  470. }
  471. }
  472. $array_loop_data = (array)$loop_data;
  473. $array_loop_data['depth'] = $loop_location;
  474. $loop_data = $array_loop_data;
  475. break;
  476. }
  477. }
  478. if (!empty($loop_data)) {
  479. return $loop_data;
  480. }
  481. }
  482. }
  483. // We have not detected a loop, so it's safe to insert the term.
  484. $query = db_insert('cvtermpath')
  485. ->fields([
  486. 'object_id' => $origin,
  487. 'subject_id' => $child_id,
  488. 'cv_id' => $cv_id,
  489. 'type_id' => $type_id,
  490. 'pathdistance' => $depth,
  491. ]);
  492. $rows = $query->execute();
  493. // Then add that new entry to the $tree_path.
  494. $tree_path[$increment_of_depth] = [
  495. 'build_id' => $child_id,
  496. 'depth' => $depth
  497. ];
  498. // Get all of the relationships of this child term, and recursively
  499. // call the tripal_update_cvtermpath_loop() function to continue
  500. // descending down the tree.
  501. $query = db_select('cvterm_relationship', 'cvtr')
  502. ->fields('cvtr')
  503. ->condition('cvtr.object_id', $child_id, '=')
  504. ->execute();
  505. $cterm_relationships = $query->fetchAll();
  506. foreach ($cterm_relationships as $item) {
  507. if (!empty($loop_data)) {
  508. if ($loop_data['depth'] < $depth) {
  509. break;
  510. }
  511. elseif ($loop_data['depth'] > $depth) {
  512. $loop_data = NULL;
  513. break;
  514. }
  515. }
  516. else {
  517. $increment_of_depth++;
  518. tripal_update_cvtermpath_loop($origin, $item->subject_id, $cv_id,
  519. $item->type_id, $depth + 1, $increment_of_depth, $tree_path);
  520. }
  521. }
  522. }
  523. /**
  524. * @param $origin
  525. * @param $child_id
  526. * @param $cv_id
  527. * @param $type_id
  528. * @param $depth
  529. * @param $increment_of_depth
  530. * @param $distance_between_parent_child
  531. * @param $possible_start_of_loop
  532. * @param $array_of_possible_loop
  533. * @param $depth_at_start_of_loop
  534. *
  535. * @return bool
  536. */
  537. function tripal_update_cvtermpath_loop_checker($origin, $child_id, $cv_id, $type_id,
  538. $depth, $increment_of_depth, $distance_between_parent_child, $possible_start_of_loop,
  539. $array_of_possible_loop, $depth_at_start_of_loop){
  540. // Find the child terms of the current term via the relationship taboe.
  541. chado_set_active('chado');
  542. $query = db_select('cvterm_relationship', 'cvtr')
  543. ->fields('cvtr')
  544. ->condition('cvtr.object_id', $child_id, '=')
  545. ->execute();
  546. $cterm_relationships = $query->fetchAll();
  547. // Iterate through the child terms via the relationships.
  548. foreach ($cterm_relationships as $item){
  549. // Search the $tree_path for the new $child_id in the build_id column.
  550. foreach ($array_of_possible_loop as $parent) {
  551. if ($parent['build_id'] === $possible_start_of_loop['build_id']) {
  552. // If the search returns something check for a possible loop.
  553. if (!empty($parent)) {
  554. $result = tripal_update_cvtermpath_loop_checker_traverse($origin, $child_id,
  555. $cv_id, $type_id, $depth, $increment_of_depth, $possible_start_of_loop,
  556. $array_of_possible_loop, array(), 0);
  557. if(!empty($result)){
  558. break 2;
  559. }
  560. }
  561. }
  562. }
  563. $increment_of_depth++;
  564. $distance_between_parent_child++;
  565. $child_id = $origin . '|' . $item->subject_id . '|' . $cv_id . '|' . $item->type_id;
  566. $array_of_possible_loop[$distance_between_parent_child] = ['build_id' => $child_id];
  567. $result = tripal_update_cvtermpath_loop_checker($origin, $item->subject_id, $cv_id, $item->type_id, $depth + 1, $increment_of_depth, $distance_between_parent_child, $possible_start_of_loop, $array_of_possible_loop, $depth_at_start_of_loop);
  568. if($result !== FALSE){
  569. return $result;
  570. }
  571. }
  572. if (!empty($result)) {
  573. return $result;
  574. }
  575. else {
  576. return FALSE;
  577. }
  578. }
  579. function tripal_update_cvtermpath_loop_checker_traverse($origin, $child_id, $cv_id,
  580. $type_id, $depth, $increment_of_depth, $possible_start_of_loop, $array_of_possible_loop,
  581. $traverse_of_loop, $increment) {
  582. //watchdog('debug', '<pre>$increment: '. print_r($increment, TRUE) .'</pre>');
  583. /*if ($increment > 10) {
  584. die();
  585. }*/
  586. chado_set_active('chado');
  587. $query = db_select('cvterm_relationship', 'cvtr')
  588. ->fields('cvtr')
  589. ->condition('cvtr.object_id', $child_id, '=')
  590. ->execute();
  591. $cterm = $query->fetchAll();
  592. foreach ($cterm as $item) {
  593. if ($array_of_possible_loop === $traverse_of_loop) {
  594. watchdog('debug', 'LOOP');
  595. //Report the loop.
  596. $loop_found = end($array_of_possible_loop);
  597. break;
  598. }
  599. elseif ($array_of_possible_loop != $traverse_of_loop) {
  600. $increment_of_depth++;
  601. $increment++;
  602. $child_id = $origin . '|' . $item->subject_id . '|' . $cv_id . '|' . $item->type_id;
  603. $traverse_of_loop[$increment] = ['build_id' => $child_id];
  604. $result = tripal_update_cvtermpath_loop_checker_traverse($origin,
  605. $item->subject_id, $cv_id, $item->type_id, $depth + 1,
  606. $increment_of_depth, $possible_start_of_loop, $array_of_possible_loop,
  607. $traverse_of_loop, $increment);
  608. if ($result !== FALSE) {
  609. return $result;
  610. }
  611. }
  612. }
  613. if ($loop_found) {
  614. return $loop_found;
  615. }
  616. else {
  617. return FALSE;
  618. }
  619. }
  620. /*
  621. *
  622. * @param $origin
  623. * @param $subject_id
  624. * @param $cv_idxkcd
  625. * @param $type_id
  626. * @param $depth
  627. * @return multitype:
  628. function tripal_update_cvtermpath_loop($origin, $child_id, $cv_id, $type_id, $depth){
  629. // Variables and arrays needed for loop checking.
  630. $tree_path;
  631. $array_of_possible_loop;
  632. $possible_start_of_loop;
  633. $distance_between_parent_child;
  634. $increment_of_depth;
  635. chado_set_active('chado');
  636. $count = db_query(
  637. 'SELECT *
  638. FROM cvtermpath
  639. WHERE cv_id = :cvid
  640. AND object_id = :origin
  641. AND subject_id = :child_id
  642. AND pathdistance = :depth
  643. ',
  644. array(':cvid' => $cv_id, ':origin' => $origin, ':child_id' => $child_id, ':depth' => $depth)
  645. );
  646. $count_total = $count->rowCount();
  647. //Loop check
  648. chado_set_active('chado');
  649. $loop = db_query(
  650. 'SELECT *
  651. FROM cvtermpath
  652. WHERE cv_id = :cvid
  653. AND object_id = :origin
  654. AND subject_id = :child_id
  655. AND type_id = :type_id
  656. ',
  657. array(':cvid' => $cv_id, ':origin' => $origin, ':child_id' => $child_id, ':type_id' => $type_id,)
  658. );
  659. $loop_check = $loop->rowCount();
  660. //watchdog('debug', '<pre>tripal_ds_preprocess_TripalEntity $rows ' . print_r($rows, TRUE) . '</pre>');
  661. /*if(!empty($rows)){
  662. foreach($rows as $row){
  663. tripal_update_cvtermpath_loop_check($origin, $child_id, $cv_id, $type_id, $depth, $row->cvtermpath_id, 0);
  664. }
  665. }
  666. else {*/
  667. //If no loop proceed.
  668. /*try{
  669. if($count_total == 0) {
  670. chado_set_active('chado');
  671. $query = db_insert('cvtermpath')
  672. ->fields(array(
  673. 'object_id' => $origin,
  674. 'subject_id' => $child_id,
  675. 'cv_id' => $cv_id,
  676. 'type_id' => $type_id,
  677. 'pathdistance' => $depth,
  678. ));
  679. $rows = $query->execute();
  680. }
  681. if ($loop_check == 0) {
  682. chado_set_active('chado');
  683. $query = db_select('cvterm_relationship', 'cvtr')
  684. ->fields('cvtr')
  685. ->condition('cvtr.object_id', $child_id, '=')
  686. ->execute();
  687. $cterm = $query->fetchAll();
  688. foreach ($cterm as $item) {
  689. //watchdog('debug', '<pre>tripal_ds_preprocess_TripalEntity $item ' . print_r($item, TRUE) . '</pre>');
  690. tripal_update_cvtermpath_loop($origin, $item->subject_id, $cv_id, $item->type_id, $depth + 1);
  691. };
  692. //}
  693. }
  694. }
  695. catch(Exception $e){
  696. watchdog_exception('tripal_ds', $e);
  697. return FALSE;
  698. }
  699. return 1;
  700. }
  701. */
  702. /**
  703. *
  704. * @param $origin
  705. * @param $subject_id
  706. * @param $cv_id
  707. * @param $type_id
  708. * @param $depth
  709. * @return multitype:
  710. function tripal_update_cvtermpath_loop_check($origin, $child_id, $cv_id, $type_id, $depth, $cvtermpath_id, $loop_count, $loop_check, $object_id){
  711. //Store the
  712. //Check if the passed parameters match any of the items in the loop_check array.
  713. if(!empty($loop_check)){
  714. foreach($loop_check as $item){
  715. if ($item['type_id'] = $type_id){
  716. if($item['subject_id'] = $child_id){
  717. if($item['object_id'] = $object_id){
  718. //Loop found, roll back all rows until $cvtermpath_id-1 (last correct entry)
  719. // and step into the next loop
  720. }
  721. }
  722. }
  723. }
  724. }
  725. $loop_count + 1;
  726. chado_set_active('chado');
  727. $count = db_query(
  728. 'SELECT *
  729. FROM cvtermpath
  730. WHERE cv_id = :cvid AND object_id = :origin
  731. AND subject_id = :child_id
  732. AND pathdistance = :depth
  733. ',
  734. array(':cvid' => $cv_id, ':origin' => $origin, ':child_id' => $child_id, ':depth' => $depth)
  735. );
  736. $count_total = $count->rowCount();
  737. if ($count_total == 0) {
  738. chado_set_active('chado');
  739. $query = db_insert('cvtermpath')
  740. ->fields(array(
  741. 'object_id' => $origin,
  742. 'subject_id' => $child_id,
  743. 'cv_id' => $cv_id,
  744. 'type_id' => $type_id,
  745. 'pathdistance' => $depth,
  746. ));
  747. $rows = $query->execute();
  748. $cterm = array();
  749. $query = db_select('cvterm_relationship', 'cvtr')
  750. ->fields('cvtr')
  751. ->condition('cvtr.object_id', $child_id, '=' )
  752. ->execute();
  753. $cterm = $query->fetchAll();
  754. foreach ($cterm as $item) {
  755. $loop_check[$loop_count]= $item;
  756. tripal_update_cvtermpath_loop_check($origin, $item->subject_id, $cv_id, $item->type_id, $depth + 1, $loop_count, $loop_check, $item->object_id);
  757. };
  758. }
  759. return 1;
  760. }
  761. */
  /**
   * Adds a controlled vocabulary to the CV table of Chado.
   *
   * If no vocabulary with the given name exists a new record is inserted,
   * otherwise the existing record is updated with the supplied definition.
   *
   * @param $name
   *   The name of the controlled vocabulary. These are typically all lower case
   *   with no special characters other than an underscore (for spaces).
   * @param $definition
   *   A description or definition of the vocabulary.
   *
   * @return
   *   An object populated with fields from the cv record, or FALSE if the
   *   record could not be inserted, updated or read back.
   *
   * @ingroup tripal_chado_api
   */
  function tripal_insert_cv($name, $definition) {
    // Insert/update values.
    $ins_values = array(
      'name' => $name,
      'definition' => $definition,
    );
    // Vocabularies are matched on their name only.
    $sel_values = array('name' => $name);

    // See if the CV already exists in the database.
    $results = chado_select_record('cv', array('*'), $sel_values);

    // Only an empty array means "not there yet". The is_array() test keeps
    // count() away from a non-array result (presumably FALSE when the select
    // fails -- verify against chado_select_record()); such a result falls
    // through to the update branch.
    if (is_array($results) && count($results) == 0) {
      $success = chado_insert_record('cv', $ins_values);
      if (!$success) {
        tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to create the CV record", NULL);
        return FALSE;
      }
    }
    // If it already exists then do an update.
    else {
      $success = chado_update_record('cv', $sel_values, $ins_values);
      if (!$success) {
        tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to update the CV record", NULL);
        return FALSE;
      }
    }

    // Read the record back so the caller receives the stored values.
    $results = chado_select_record('cv', array('*'), $sel_values);
    if (empty($results)) {
      tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to retrieve the CV record", NULL);
      return FALSE;
    }

    // Return the cv object.
    return $results[0];
  }
  /**
   * Adds a controlled vocabulary term to Chado.
   *
   * This function will add a cvterm record (and a dbxref record if appropriate
   * values are provided). If the parent vocabulary does not exist then
   * that also is added to the cv table. If the cvterm is a relationship term
   * then the 'is_relationship' value should be set. All
   * terms must also have a corresponding database. This is specified in the
   * term's ID just before the colon (e.g. GO:003824). If the database does not
   * exist in the DB table then it will be added automatically. The accession
   * (the value just after the colon in the term's ID) will be added to the
   * dbxref table. If the CVterm already exists and $update is set (default)
   * then the cvterm is updated. If the CVTerm already exists and $update is
   * not set, then no changes are made and the CVTerm object is returned.
   *
   * @param $term
   *   An associative array with the following keys:
   *   - id: the term accession. Must be of the form <DB>:<ACCESSION>, where
   *     <DB> is the name of the database to which the cvterm belongs and the
   *     <ACCESSION> is the term's accession number in the database.
   *   - name: the name of the term. Usually meant to be human-readable. When
   *     missing, the id is used as the name.
   *   - is_obsolete: is present and set to 1 (or the string 'true') if the
   *     term is defunct.
   *   - definition: the definition of the term.
   *   - cv_name: The CV name to which the term belongs. Defaults to 'local'.
   *   - namespace: Deprecated alias of cv_name. As implemented, when this key
   *     is present its value takes precedence over cv_name.
   *   - is_relationship: If this term is a relationship term then this value
   *     should be 1.
   *   - db_name: In some cases the database name will not be part of the
   *     $term['id'] and it needs to be explicitly set. Use this argument
   *     only if the database name cannot be specified in the term ID
   *     (e.g. <DB>:<ACCESSION>). Defaults to 'local'.
   * @param $options
   *   An associative array with the following keys:
   *   - update_existing: By default this is TRUE. If the term exists it is
   *     automatically updated.
   *   - force_db_change: Sometimes a term may need to switch from one
   *     database to another. Set this variable to TRUE to force the change
   *     to occur. As implemented, the change is only refused when this key
   *     is present and is not TRUE.
   *
   * @return
   *   A cvterm object on success. On failure 0 or FALSE is returned after the
   *   problem has been reported with tripal_report_error().
   *
   * @ingroup tripal_chado_api
   */
  function tripal_insert_cvterm($term, $options = array()) {
    // Get the term properties.
    $id = (isset($term['id'])) ? $term['id'] : '';
    $accession = '';

    // The dbxref of a term that already exists. It stays NULL until one of the
    // lookups below finds it, so later code can tell "unknown" from "known".
    $dbxref = NULL;

    // Set Defaults.
    $cvname = isset($term['cv_name']) ? $term['cv_name'] : 'local';
    // Namespace is deprecated but must be supported for backwards
    // compatibility.
    if (array_key_exists('namespace', $term)) {
      $cvname = $term['namespace'];
    }
    $is_relationship = isset($term['is_relationship']) ? $term['is_relationship'] : 0;
    $dbname = isset($term['db_name']) ? $term['db_name'] : 'local';
    $update = isset($options['update_existing']) ? $options['update_existing'] : 1;
    $name = array_key_exists('name', $term) ? $term['name'] : $id;

    // Strip the double quotes that wrap a quoted definition.
    $definition = '';
    if (array_key_exists('definition', $term)) {
      $definition = preg_replace('/^\"(.*)\"/', '\1', $term['definition']);
    }

    // The string 'true' is accepted as a synonym for 1.
    $is_obsolete = 0;
    if (array_key_exists('is_obsolete', $term)) {
      $is_obsolete = $term['is_obsolete'];
      if (strcmp($is_obsolete, 'true') == 0) {
        $is_obsolete = 1;
      }
    }

    if (!$name and !$id) {
      tripal_report_error('tripal_chado', TRIPAL_WARNING, "Cannot find cvterm without 'id' or 'name'", NULL);
      return 0;
    }
    if (!$id) {
      $id = $name;
    }

    // Get the accession and the database from the cvterm id. Without a colon
    // the whole id is the accession; with one, the part before the first colon
    // names the database and replaces any 'db_name' value.
    if ($dbname) {
      $accession = $id;
    }
    if (preg_match('/^.+?:.*$/', $id)) {
      $accession = preg_replace('/^.+?:(.*)$/', '\1', $id);
      $dbname = preg_replace('/^(.+?):.*$/', '\1', $id);
    }

    // Check that we have a database name, give a different message if it's a
    // relationship.
    if ($is_relationship and !$dbname) {
      tripal_report_error('tripal_chado', TRIPAL_WARNING,
        "A database name is not provided for this relationship term: $id", NULL);
      return 0;
    }
    if (!$is_relationship and !$dbname) {
      tripal_report_error('tripal_chado', TRIPAL_WARNING,
        "A database identifier is missing from the term: $id", NULL);
      return 0;
    }

    // Make sure the CV name exists.
    $cv = tripal_get_cv(array('name' => $cvname));
    if (!$cv) {
      $cv = tripal_insert_cv($cvname, '');
    }
    if (!$cv) {
      tripal_report_error('tripal_chado', TRIPAL_WARNING,
        "Cannot find namespace '$cvname' when adding/updating $id", NULL);
      return 0;
    }

    // This SQL statement will be used a lot to find a cvterm so just set it
    // here for easy reference below. Because CV terms can change their names
    // but accessions don't change, the following SQL finds cvterms based on
    // their accession rather than the name.
    $cvtermsql = "
      SELECT CVT.name, CVT.cvterm_id, CV.cv_id, CV.name as cvname,
        DB.name as dbname, DB.db_id, DBX.accession
      FROM {cvterm} CVT
        INNER JOIN {dbxref} DBX on CVT.dbxref_id = DBX.dbxref_id
        INNER JOIN {db} DB on DBX.db_id = DB.db_id
        INNER JOIN {cv} CV on CV.cv_id = CVT.cv_id
      WHERE DBX.accession = :accession and DB.name = :name
    ";

    // Add the database. The function will just return the DB object if the
    // database already exists.
    $db = tripal_get_db(array('name' => $dbname));
    if (!$db) {
      $db = tripal_insert_db(array('name' => $dbname));
    }
    if (!$db) {
      tripal_report_error('tripal_chado', TRIPAL_WARNING, "Cannot find database '$dbname' in Chado.", NULL);
      return 0;
    }

    // The cvterm table has two unique dependencies. We need to check both.
    // First check the (name, cv_id, is_obsolete) constraint.
    $values = array(
      'name' => $name,
      'is_obsolete' => $is_obsolete,
      'cv_id' => array(
        'name' => $cvname,
      ),
    );
    $result = chado_select_record('cvterm', array('*'), $values);
    if (is_array($result) && count($result) == 1) {
      $cvterm = $result[0];

      // Get the dbxref record.
      $values = array('dbxref_id' => $cvterm->dbxref_id);
      $result = chado_select_record('dbxref', array('*'), $values);
      $dbxref = !empty($result) ? $result[0] : NULL;
      if (!$dbxref) {
        tripal_report_error('tripal_cv', TRIPAL_ERROR,
          'Unable to access the dbxref record for the :term cvterm. Term Record: !record',
          array(':term' => $name, '!record' => print_r($cvterm, TRUE))
        );
        return FALSE;
      }

      // Get the db.
      $values = array('db_id' => $dbxref->db_id);
      $result = chado_select_record('db', array('*'), $values);
      $db_check = $result[0];

      // If the database from the existing record doesn't match the one that
      // has been provided then we have a problem. The term already exists
      // but we don't want to just switch the term, the callee must force it.
      if ($db_check->name != $db->name) {
        // NOTE(review): the change is refused only when 'force_db_change' is
        // present and not TRUE; when the key is absent the change proceeds.
        // Confirm that this is the intended default.
        if (array_key_exists('force_db_change', $options) and
            $options['force_db_change'] != TRUE) {
          tripal_report_error('tripal_cv', TRIPAL_ERROR,
            'The term already exists, but associated with a different database record: \'!db\'. It cannot be added: !record',
            array(':term' => $name, '!db' => $db_check->name, '!record' => print_r($cvterm, TRUE))
          );
          return FALSE;
        }

        // Look to see if the correct dbxref record already exists for this
        // database.
        $values = array(
          'db_id' => $db->db_id,
          'accession' => $accession,
        );
        $result = chado_select_record('dbxref', array('*'), $values);

        // If we already have a good dbxref then we want to update our cvterm
        // to use this dbxref.
        if (!empty($result)) {
          $dbxref = $result[0];
          $match = array('cvterm_id' => $cvterm->cvterm_id);
          $values = array('dbxref_id' => $dbxref->dbxref_id);
          $success = chado_update_record('cvterm', $match, $values);
          if (!$success) {
            tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to correct the dbxref id for the cvterm " .
              "'$name' (id: $accession), for database $dbname", NULL);
            return 0;
          }
        }
        // If we don't have the dbxref then we want to delete our cvterm and let
        // the code below recreate it with the correct info.
        else {
          $match = array('cvterm_id' => $cvterm->cvterm_id);
          chado_delete_record('cvterm', $match);
        }
      }

      // Check that the accession matches. Sometimes an OBO can define a term
      // multiple times but with different accessions. If this is the case we
      // can't do an insert or it will violate the constraint in the cvterm table.
      // So we'll need to add the record to the cvterm_dbxref table instead.
      if ($dbxref->accession != $accession) {
        // Get/add the dbxref for this term.
        $dbxref_new = tripal_insert_dbxref(array(
          'db_id' => $db->db_id,
          'accession' => $accession
        ));
        if (!$dbxref_new) {
          tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to find or insert the dbxref record for cvterm, " .
            "$name (id: $accession), for database $dbname", NULL);
          return 0;
        }

        // Check to see if the cvterm_dbxref record already exists.
        $values = array(
          'cvterm_id' => $cvterm->cvterm_id,
          'dbxref_id' => $dbxref_new->dbxref_id,
          'is_for_definition' => 1,
        );
        $result = chado_select_record('cvterm_dbxref', array('*'), $values);

        // If the cvterm_dbxref record does not exist then add it.
        if (is_array($result) && count($result) == 0) {
          // Kept in its own variable so the caller's $options stay intact.
          $insert_options = array(
            'return_record' => FALSE,
          );
          $success = chado_insert_record('cvterm_dbxref', $values, $insert_options);
          if (!$success) {
            tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to find or insert the cvterm_dbxref record for a " .
              "duplicated cvterm: $name (id: $accession), for database $dbname", NULL);
            return 0;
          }
        }

        // Get the original cvterm with the same name and return that.
        $result = chado_query($cvtermsql, array(':accession' => $dbxref->accession, ':name' => $dbname));
        $cvterm = $result->fetchObject();
        return $cvterm;
      }

      // Continue on, we've fixed the record if the db_id did not match.
      // We can now perform an update if we need to.
    }

    // Get the CVterm record.
    $result = chado_query($cvtermsql, array(':accession' => $accession, ':name' => $dbname));
    $cvterm = $result->fetchObject();
    if (!$cvterm) {
      // Check to see if the dbxref exists, if not, add it.
      $dbxref = tripal_insert_dbxref(array(
        'db_id' => $db->db_id,
        'accession' => $accession
      ));
      if (!$dbxref) {
        tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to find or insert the dbxref record for cvterm, " .
          "$name (id: $accession), for database $dbname", NULL);
        return 0;
      }

      // Check to see if the dbxref already has an entry in the cvterm table.
      $values = array('dbxref_id' => $dbxref->dbxref_id);
      $check = chado_select_record('cvterm', array('cvterm_id'), $values);
      if (is_array($check) && count($check) == 0) {
        // Now add the cvterm.
        $ins_values = array(
          'cv_id' => $cv->cv_id,
          'name' => $name,
          'definition' => $definition,
          'dbxref_id' => $dbxref->dbxref_id,
          'is_obsolete' => $is_obsolete,
          'is_relationshiptype' => $is_relationship,
        );
        $success = chado_insert_record('cvterm', $ins_values);
        if (!$success) {
          if (!$is_relationship) {
            tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to insert the term: $name ($dbname)", NULL);
            return 0;
          }
          else {
            tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to insert the relationship term: $name (cv: " . $cvname . " db: $dbname)", NULL);
            return 0;
          }
        }
      }
      // This dbxref already exists in the cvterm table.
      else {
        tripal_report_error('tripal_chado', TRIPAL_WARNING, "The dbxref already exists for another cvterm record: $name (cv: " . $cvname . " db: $dbname)", NULL);
        return 0;
      }
      $result = chado_query($cvtermsql, array(':accession' => $accession, ':name' => $dbname));
      $cvterm = $result->fetchObject();
    }
    // Update the cvterm.
    elseif ($update) {
      // First, basic update of the term.
      $match = array('cvterm_id' => $cvterm->cvterm_id);
      $upd_values = array(
        'name' => $name,
        'definition' => $definition,
        'is_obsolete' => $is_obsolete,
        'is_relationshiptype' => $is_relationship,
      );
      $success = chado_update_record('cvterm', $match, $upd_values);
      if (!$success) {
        tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to update the term: $name", NULL);
        return 0;
      }

      // Second, check that the dbxref has not changed and if it has then update it.
      $checksql = "
        SELECT cvterm_id
        FROM {cvterm} CVT
          INNER JOIN {dbxref} DBX on CVT.dbxref_id = DBX.dbxref_id
          INNER JOIN {db} DB on DBX.db_id = DB.db_id
          INNER JOIN {cv} CV on CV.cv_id = CVT.cv_id
        WHERE DBX.accession = :accession and DB.name = :dbname and CVT.name = :term and CV.name = :cvname
      ";
      // When the term was found through its accession only, no dbxref has been
      // loaded yet. There is then nothing to compare against, so the check
      // counts as failed and the dbxref is looked up (or created) below.
      $check = FALSE;
      if ($dbxref) {
        $check = chado_query($checksql, array(':accession' => $dbxref->accession, ':dbname' => $dbname, ':term' => $name, ':cvname' => $cvname))->fetchObject();
      }
      if (!$check) {
        // Check to see if the dbxref exists, if not, add it.
        $dbxref = tripal_insert_dbxref(array(
          'db_id' => $db->db_id,
          'accession' => $accession
        ));
        if (!$dbxref) {
          tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to find or insert the dbxref record for cvterm, " .
            "$name (id: $accession), for database $dbname", NULL);
          return 0;
        }
        $match = array('cvterm_id' => $cvterm->cvterm_id);
        $upd_values = array(
          'dbxref_id' => $dbxref->dbxref_id,
        );
        $success = chado_update_record('cvterm', $match, $upd_values);
        if (!$success) {
          // $db is a record object and cannot be interpolated into a string,
          // so the database is reported by its name.
          tripal_report_error('tripal_chado', TRIPAL_WARNING, "Failed to update the term $name with new accession $dbname:$accession", NULL);
          return 0;
        }
      }

      // Finally grab the updated details.
      $result = chado_query($cvtermsql, array(':accession' => $dbxref->accession, ':name' => $dbname));
      $cvterm = $result->fetchObject();
    }
    else {
      // Do nothing, we have the cvterm but we don't want to update.
    }

    // Return the cvterm.
    return $cvterm;
  }
  /**
   * TODO: deprecate this function
   *
   * This function allows other modules to programmatically
   * submit an ontology for loading into Chado.
   *
   * This function will add a job to the Jobs subsystem for parsing the ontology.
   * You can either pass a known OBO ID to the function or the URL
   * or full path to the ontology file. If a URL or file name is
   * passed then the 'name' key must also be provided.
   *
   * @param $obo
   *   An associative array with the following keys:
   *   - obo_id: If the ontology is already loaded into the Tripal tables then
   *     use this key to specify the unique ID for the ontology that will be
   *     loaded. When set, the remaining keys are ignored.
   *   - name: If the OBO has not been added before then use this key
   *     to specify the human readable name of the ontology.
   *   - url: If the OBO to be loaded is located on a remote server then
   *     use this key to provide the URL.
   *   - file: If the OBO is housed on the local file system of the server then
   *     use this key to specify the full path. Only used when no url is given.
   *
   * @return
   *   Returns the value of tripal_add_job() for the submitted job, or FALSE if
   *   no job was added (no usable key was supplied, or the obo_id is unknown).
   *
   * @ingroup tripal_chado_api
   */
  function tripal_submit_obo_job($obo) {
    global $user;

    // Set Defaults
    $obo['obo_id'] = (isset($obo['obo_id'])) ? $obo['obo_id'] : NULL;
    $obo['name'] = (isset($obo['name'])) ? $obo['name'] : NULL;
    $obo['url'] = (isset($obo['url'])) ? $obo['url'] : NULL;
    $obo['file'] = (isset($obo['file'])) ? $obo['file'] : NULL;

    // The loader file is handed to the job so it can be included at run time.
    $includes = array(
      module_load_include('inc', 'tripal_chado', 'includes/loaders/tripal_chado.obo_loader'),
    );

    // A registered OBO is loaded by its ID.
    if ($obo['obo_id']) {
      $sql = "SELECT * FROM {tripal_cv_obo} WHERE obo_id = :obo_id";
      $result = db_query($sql, array(':obo_id' => $obo['obo_id']))->fetchObject();

      // Without a matching record there is nothing to load; do not queue a
      // job that would run with empty arguments.
      if (!$result) {
        tripal_report_error('tripal_chado', TRIPAL_WARNING,
          "Cannot submit the OBO loading job. No OBO exists with the ID: %obo_id",
          array('%obo_id' => $obo['obo_id']));
        return FALSE;
      }

      $args = array($result->obo_id);
      return tripal_add_job("Load OBO " . $result->name, 'tripal_chado',
        "tripal_chado_load_obo_v1_2_id", $args, $user->uid, 10, $includes);
    }

    // Otherwise a URL is preferred over a local file.
    if ($obo['url']) {
      $args = array($obo['name'], $obo['url']);
      return tripal_add_job("Load OBO " . $obo['name'], 'tripal_chado',
        "tripal_chado_load_obo_v1_2_url", $args, $user->uid, 10, $includes);
    }
    if ($obo['file']) {
      $args = array($obo['name'], $obo['file']);
      return tripal_add_job("Load OBO " . $obo['name'], 'tripal_chado',
        "tripal_chado_load_obo_v1_2_file", $args, $user->uid, 10, $includes);
    }

    return FALSE;
  }
  /**
   * Registers an OBO in the tripal_cv_obo table of the Drupal database.
   *
   * When a record with the same name is already present only its path is
   * refreshed; otherwise a new record is created.
   *
   * @param $name
   *   The human readable name of this ontology
   * @param $path
   *   The file path or URL of the ontology
   *
   * @return
   *   Returns the ontology ID
   *
   * @ingroup tripal_chado_api
   */
  function tripal_insert_obo($name, $path) {
    // Look for a record that already carries this name.
    $existing_id = db_select('tripal_cv_obo', 'tco')
      ->fields('tco', array('obo_id'))
      ->condition('name', $name)
      ->execute()
      ->fetchField();

    // Unknown name: create the record and hand back what the insert returns.
    if (!$existing_id) {
      return db_insert('tripal_cv_obo')
        ->fields(array(
          'name' => $name,
          'path' => $path,
        ))
        ->execute();
    }

    // Known name: point the existing record at the new location.
    db_update('tripal_cv_obo')
      ->fields(array(
        'path' => $path,
      ))
      ->condition('name', $name)
      ->execute();

    return $existing_id;
  }
  /**
   * Looks up a single record of the tripal_cv_obo table.
   *
   * @param $values
   *   An associative array with the following allowed keys: obo_id, name.
   *   Every key that is present narrows the search; other keys are ignored.
   *
   * @return
   *   The result of fetchObject() on the executed query, i.e. the first
   *   matching OBO record.
   */
  function tripal_get_obo($values) {
    $select = db_select('tripal_cv_obo', 'tco')
      ->fields('tco');

    // Apply one condition per supported key, in a fixed order.
    foreach (array('name', 'obo_id') as $key) {
      if (array_key_exists($key, $values)) {
        $select->condition('tco.' . $key, $values[$key]);
      }
    }

    return $select->execute()->fetchObject();
  }
  /**
   * This function is intended to be used in autocomplete forms
   * for searching for CV terms that begin with the provided string.
   *
   * Both term names and term synonyms are searched, case-insensitively, and
   * at most 25 matches are returned.
   *
   * @param $cv_id
   *   The CV ID in which to search for the term. When empty, the terms of all
   *   vocabularies are searched.
   * @param $string
   *   The string to search for. It is matched literally: LIKE wildcards typed
   *   by the user are escaped.
   *
   * @return
   *   Nothing is returned. A JSON object of the matching names (keyed by
   *   name) is sent with drupal_json_output().
   *
   * @ingroup tripal_chado_api
   */
  function tripal_autocomplete_cvterm($cv_id, $string = '') {
    // Escape '%', '_' and '\' so that the typed text can only act as a prefix.
    $args = array(':name' => db_like($string) . '%');

    if ($cv_id) {
      $sql = "
        SELECT CVT.cvterm_id, CVT.name
        FROM {cvterm} CVT
        WHERE CVT.cv_id = :cv_id and lower(CVT.name) like lower(:name)
        UNION
        SELECT CVT2.cvterm_id, CVTS.synonym as name
        FROM {cvterm} CVT2
          INNER JOIN {cvtermsynonym} CVTS ON CVTS.cvterm_id = CVT2.cvterm_id
        WHERE CVT2.cv_id = :cv_id and lower(CVTS.synonym) like lower(:name)
        ORDER by name
        LIMIT 25 OFFSET 0
      ";
      $args[':cv_id'] = $cv_id;
    }
    // If a CV wasn't provided then search all of them. The query also selects
    // the cv name, although only the term name ends up in the output.
    else {
      $sql = "
        SELECT CVT.cvterm_id, CVT.name, CV.name as cvname, CVT.cv_id
        FROM {cvterm} CVT
          INNER JOIN {cv} CV on CVT.cv_id = CV.cv_id
        WHERE lower(CVT.name) like lower(:name)
        UNION
        SELECT CVT2.cvterm_id, CVTS.synonym as name, CV2.name as cvname, CVT2.cv_id
        FROM {cvterm} CVT2
          INNER JOIN {cv} CV2 on CVT2.cv_id = CV2.cv_id
          INNER JOIN {cvtermsynonym} CVTS ON CVTS.cvterm_id = CVT2.cvterm_id
        WHERE lower(CVTS.synonym) like lower(:name)
        ORDER by name
        LIMIT 25 OFFSET 0
      ";
    }

    // Keying by name collapses a term and a synonym that share the same text.
    $items = array();
    $results = chado_query($sql, $args);
    foreach ($results as $term) {
      $items[$term->name] = $term->name;
    }

    drupal_json_output($items);
  }
  /**
   * Add a record to a cvterm linking table (ie: feature_cvterm)
   *
   * @param $basetable
   *   The base table to which the cvterm should be linked/associated. Thus to
   *   associate a cvterm to a feature the basetable=feature and cvterm_id is
   *   added to the feature_cvterm table.
   * @param $record_id
   *   The primary key of the basetable to associate the cvterm with. This
   *   should be an integer.
   * @param $cvterm
   *   An associative array describing the cvterm. Valid keys include:
   *   - cvterm_id: the primary key of the cvterm. When set, no lookup is done.
   *   - name: the name for the cvterm,
   *   - cv_name: the name of the cv the cvterm belongs to.
   *   - cv_id: the primary key of the cv the cvterm belongs to. Takes
   *     precedence over cv_name when both are given.
   * @param $options
   *   An associative array of options. Valid keys include:
   *   - insert_cvterm: Insert the cvterm if it doesn't already exist. FALSE is
   *     the default.
   *
   * @return
   *   The record of the linking table that associates the cvterm with the
   *   base record, or FALSE on failure.
   *
   * @ingroup tripal_chado_api
   */
  function tripal_associate_cvterm($basetable, $record_id, $cvterm, $options = array()) {
    $linking_table = $basetable . '_cvterm';
    $foreignkey_name = $basetable . '_id';

    // Default Values
    $options['insert_cvterm'] = (isset($options['insert_cvterm'])) ? $options['insert_cvterm'] : FALSE;

    // If the cvterm_id is not set then find the cvterm record using the name
    // and cv_id.
    if (!isset($cvterm['cvterm_id'])) {
      // Without a name there is nothing to look up or to insert.
      if (!isset($cvterm['name'])) {
        tripal_report_error('tripal_chado_api', TRIPAL_WARNING,
          "tripal_associate_cvterm: The cvterm needs to have either the cvterm_id or the name
          supplied. You supplied the cvterm values: %cvterm.",
          array('%cvterm' => print_r($cvterm, TRUE))
        );
        return FALSE;
      }

      $values = array(
        'name' => $cvterm['name'],
      );
      if (isset($cvterm['cv_id'])) {
        $values['cv_id'] = $cvterm['cv_id'];
      }
      elseif (isset($cvterm['cv_name'])) {
        $values['cv_id'] = array(
          'name' => $cvterm['cv_name']
        );
      }
      else {
        tripal_report_error('tripal_chado_api', TRIPAL_WARNING,
          "tripal_associate_cvterm: The cvterm needs to have either the cv_name or cv_id
          supplied. You were trying to associate a cvterm with the %base %record_id
          and supplied the cvterm values: %cvterm.",
          array('%base' => $basetable, '%record_id' => $record_id, '%cvterm' => print_r($cvterm,TRUE))
        );
        return FALSE;
      }

      // Get the cvterm. If it doesn't exist then add it if the option
      // 'insert_cvterm' is set.
      $select = chado_select_record('cvterm', array('*'), $values);
      if ($select) {
        $cvterm['cvterm_id'] = $select[0]->cvterm_id;
      }
      elseif ($options['insert_cvterm']) {
        // tripal_insert_cvterm() identifies the vocabulary by name, so work
        // out the name of the vocabulary that was used for the lookup above.
        // Passing the lookup values directly would drop the term into the
        // default 'local' vocabulary.
        $cv_name = NULL;
        if (isset($cvterm['cv_id'])) {
          if (is_array($cvterm['cv_id'])) {
            $cv_name = isset($cvterm['cv_id']['name']) ? $cvterm['cv_id']['name'] : NULL;
          }
          else {
            $cv = tripal_get_cv(array('cv_id' => $cvterm['cv_id']));
            $cv_name = $cv ? $cv->name : NULL;
          }
        }
        else {
          $cv_name = $cvterm['cv_name'];
        }

        // Insert the cvterm.
        $insert = NULL;
        if ($cv_name !== NULL) {
          $insert = tripal_insert_cvterm(array(
            'name' => $cvterm['name'],
            'cv_name' => $cv_name,
          ));
        }
        if (isset($insert->cvterm_id)) {
          $cvterm['cvterm_id'] = $insert->cvterm_id;
        }
        else {
          tripal_report_error('tripal_chado_api', TRIPAL_WARNING,
            "tripal_associate_cvterm: Unable to insert the cvterm using the cvterm values: %cvterm.",
            array('%cvterm' => print_r($cvterm,TRUE))
          );
          return FALSE;
        }
      }
      else {
        tripal_report_error('tripal_api', TRIPAL_WARNING,
          "tripal_associate_cvterm: The cvterm doesn't already exist. You supplied the cvterm values: %cvterm.",
          array('%cvterm' => print_r($cvterm,TRUE))
        );
        return FALSE;
      }
    }

    // Now add the link between the record & cvterm.
    if ($cvterm['cvterm_id'] > 0) {
      $values = array(
        'cvterm_id' => $cvterm['cvterm_id'],
        $foreignkey_name => $record_id,
        // NOTE(review): presumably 1 is the ID of a placeholder publication;
        // verify against the pub table.
        'pub_id' => 1,
      );

      // Check if the cvterm is already associated. If so, don't re-add it.
      $result = chado_select_record($linking_table, array('*'), $values);
      if (!$result) {
        $success = chado_insert_record($linking_table, $values);
        if (!$success) {
          // The name is optional when a cvterm_id was supplied.
          $term_label = isset($cvterm['name']) ? $cvterm['name'] : $cvterm['cvterm_id'];
          tripal_report_error('tripal_api', TRIPAL_WARNING,
            "Failed to insert the %base record %term",
            array('%base' => $linking_table, '%term' => $term_label)
          );
          return FALSE;
        }
        $result = chado_select_record($linking_table, array('*'), $values);
      }

      if (isset($result[0])) {
        return $result[0];
      }
      else {
        return FALSE;
      }
    }

    return FALSE;
  }
  /**
   * This function sets the default vocabulary for a given table and field.
   *
   * Any default previously stored for the table/field pair is removed before
   * the new one is written.
   *
   * @param $table
   *   The name of the table that contains a field with a foreign key
   *   relationship to the cvterm table
   * @param $field
   *   The table field name that has the foreign key relationship to the
   *   cvterm table for which the default vocabulary will be set
   * @param $cv_name
   *   The name of the vocabulary. Only used for the lookup when $cv_id is not
   *   provided.
   * @param $cv_id
   *   (Optional) The ID of the vocabulary. When provided the vocabulary is
   *   looked up by this ID instead of by name.
   *
   * @return
   *   TRUE if set, FALSE if an error occurred
   */
  function tripal_set_default_cv($table, $field, $cv_name, $cv_id = FALSE) {
    // Get the CV object, preferring the ID over the name.
    if ($cv_id) {
      $cv = tripal_get_cv(array('cv_id' => $cv_id));
    }
    else {
      $cv = tripal_get_cv(array('name' => $cv_name));
    }

    if (!$cv) {
      tripal_report_error('tripal_chado', TRIPAL_WARNING,
        "Cannot set default vocabulary for %table.%field. The vocabulary name, '%cvname', doesn't exist.",
        array('%table' => $table, '%field' => $field, '%cvname' => $cv_name));
      return FALSE;
    }

    // First delete any entries for this table and field.
    db_delete('tripal_cv_defaults')
      ->condition('table_name', $table)
      ->condition('field_name', $field)
      ->execute();

    // Now add the default value.
    $cv_default_id = db_insert('tripal_cv_defaults')
      ->fields(array(
        'table_name' => $table,
        'field_name' => $field,
        'cv_id' => $cv->cv_id,
      ))
      ->execute();
    if (!$cv_default_id) {
      tripal_report_error('tripal_chado', TRIPAL_WARNING,
        "Cannot set default vocabulary for %table.%field. Check the error logs.",
        array('%table' => $table, '%field' => $field));
      return FALSE;
    }

    // Report success explicitly, as the documented contract requires.
    return TRUE;
  }