12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682 |
- <?php
- class OBOImporter extends TripalImporter {
- // --------------------------------------------------------------------------
- // EDITABLE STATIC CONSTANTS
- //
- // The following constants SHOULD be set for each descendent class. They are
- // used by the static functions to provide information to Drupal about
- // the field and it's default widget and formatter.
- // --------------------------------------------------------------------------
- /**
- * The name of this loader. This name will be presented to the site
- * user.
- */
- public static $name = 'OBO Vocabulary Loader';
- /**
- * The machine name for this loader. This name will be used to construct
- * the URL for the loader.
- */
- public static $machine_name = 'chado_obo_loader';
- /**
- * A brief description for this loader. This description will be
- * presented to the site user.
- */
- public static $description = 'Import vocabularies and terms in OBO format.';
- /**
- * An array containing the extensions of allowed file types.
- */
- public static $file_types = array('obo');
- /**
- * Provides information to the user about the file upload. Typically this
- * may include a description of the file types allowed.
- */
- public static $upload_description = 'Please provide the details for importing a new OBO file. The file must have a .obo extension.';
- /**
- * The title that should appear above the upload button.
- */
- public static $upload_title = 'New OBO File';
- /**
- * If the loader should require an analysis record. To maintain provenance
- * we should always indiate where the data we are uploading comes from.
- * The method that Tripal attempts to use for this by associating upload files
- * with an analysis record. The analysis record provides the details for
- * how the file was created or obtained. Set this to FALSE if the loader
- * should not require an analysis when loading. if $use_analysis is set to
- * true then the form values will have an 'analysis_id' key in the $form_state
- * array on submitted forms.
- */
- public static $use_analysis = FALSE;
- /**
- * If the $use_analysis value is set above then this value indicates if the
- * analysis should be required.
- */
- public static $require_analysis = TRUE;
- /**
- * Text that should appear on the button at the bottom of the importer
- * form.
- */
- public static $button_text = 'Import OBO File';
- /**
- * Indicates the methods that the file uploader will support.
- */
- public static $methods = array(
- // Allow the user to upload a file to the server.
- 'file_upload' => FALSE,
- // Allow the user to provide the path on the Tripal server for the file.
- 'file_local' => FALSE,
- // Allow the user to provide a remote URL for the file.
- 'file_remote' => FALSE,
- );
- /**
- * Be default, all loaders are automaticlly added to the Admin >
- * Tripal > Data Laders menu. However, if this loader should be
- * made available via a different menu path, then set it here. If the
- * value is empty then the path will be the default.
- */
- public static $menu_path = 'admin/tripal/loaders/chado_vocabs/obo_loader';
- public static $file_required = FALSE;
- /**
- * Keep track of vocabularies that have been added.
- *
- * @var array
- */
- private $newcvs = array();
- /**
- * @see TripalImporter::form()
- */
- public function form($form, &$form_state) {
- // get a list of db from chado for user to choose
- $sql = "SELECT * FROM {tripal_cv_obo} ORDER BY name";
- $results = db_query($sql);
- $obos = array();
- $obos[] = 'Select a Vocabulary';
- foreach ($results as $obo) {
- $obos[$obo->obo_id] = $obo->name;
- }
- $obo_id = '';
- if (array_key_exists('values', $form_state)) {
- $obo_id = array_key_exists('obo_id', $form_state['values']) ? $form_state['values']['obo_id'] : '';
- }
- $form['instructions']['info'] = array(
- '#type' => 'item',
- '#markup' => t('This page allows you to load vocabularies and ontologies
- that are in OBO format. Once loaded, the terms from these
- vocabularies can be used to create content.
- You may use the form below to either reload a vocabulary that is already
- loaded (as when new updates to that vocabulary are available) or load a new
- vocabulary.'),
- );
- $form['obo_existing'] = array(
- '#type' => 'fieldset',
- '#title' => t('Use a Saved Ontology OBO Reference'),
- '#prefix' => '<span id="obo-existing-fieldset">',
- '#suffix' => '</span>'
- );
- $form['obo_existing']['existing_instructions']= array(
- '#type' => 'item',
- '#markup' => t('The vocabularies listed in the select box below have bene pre-populated
- upon installation of Tripal or have been previously loaded. Select one to edit
- its settings or submit for loading. You may reload any vocabulary that has
- already been loaded to retrieve any new updates.'),
- );
- $form['obo_existing']['obo_id'] = array(
- '#title' => t('Ontology OBO File Reference'),
- '#type' => 'select',
- '#options' => $obos,
- '#ajax' => array(
- 'callback' => 'tripal_cv_obo_form_ajax_callback',
- 'wrapper' => 'obo-existing-fieldset',
- ),
- '#description' => t('Select a vocabulary to import.')
- );
- // If the user has selected an OBO ID then get the form elements for
- // updating.
- if ($obo_id) {
- $uobo_name = '';
- $uobo_url = '';
- $uobo_file = '';
- $vocab = db_select('tripal_cv_obo', 't')
- ->fields('t', array('name', 'path'))
- ->condition('obo_id', $obo_id)
- ->execute()
- ->fetchObject();
- $uobo_name = $vocab->name;
- if (preg_match('/^http/', $vocab->path)) {
- $uobo_url = $vocab->path;
- }
- else {
- $uobo_file = trim($vocab->path);
- $matches = array();
- if (preg_match('/\{(.*?)\}/', $uobo_file, $matches)) {
- $modpath = drupal_get_path('module', $matches[1]);
- $uobo_file = preg_replace('/\{.*?\}/', $modpath, $uobo_file);
- }
- }
- // We don't want the previous value to remain. We want the new default to
- // show up, so remove the input values
- unset($form_state['input']['uobo_name']);
- unset($form_state['input']['uobo_url']);
- unset($form_state['input']['uobo_file']);
- $form['obo_existing']['uobo_name']= array(
- '#type' => 'textfield',
- '#title' => t('Vocabulary Name'),
- '#description' => t('Please provide a name for this vocabulary. After upload, this name will appear in the drop down
- list above for use again later.'),
- '#default_value' => $uobo_name,
- );
- $form['obo_existing']['uobo_url']= array(
- '#type' => 'textfield',
- '#title' => t('Remote URL'),
- '#description' => t('Please enter a URL for the online OBO file. The file will be downloaded and parsed.
- (e.g. http://www.obofoundry.org/ro/ro.obo)'),
- '#default_value' => $uobo_url,
- );
- $form['obo_existing']['uobo_file']= array(
- '#type' => 'textfield',
- '#title' => t('Local File'),
- '#description' => t('Please enter the file system path for an OBO
- definition file. If entering a path relative to
- the Drupal installation you may use a relative path that excludes the
- Drupal installation directory (e.g. sites/default/files/xyz.obo). Note
- that Drupal relative paths have no preceeding slash.
- Otherwise, please provide the full path on the filesystem. The path
- must be accessible to the web server on which this Drupal instance is running.'),
- '#default_value' => $uobo_file,
- );
- $form['obo_existing']['update_obo_details'] = array(
- '#type' => 'submit',
- '#value' => 'Update Ontology Details',
- '#name' => 'update_obo_details'
- );
- }
- $form['obo_new'] = array(
- '#type' => 'fieldset',
- '#title' => t('Add a New Ontology OBO Reference'),
- '#collapsible' => TRUE,
- '#collapsed' => TRUE,
- );
- $form['obo_new']['path_instructions']= array(
- '#value' => t('Provide the name and path for the OBO file. If the vocabulary OBO file
- is stored local to the server provide a file name. If the vocabulry is stored remotely,
- provide a URL. Only provide a URL or a local file, not both.'),
- );
- $form['obo_new']['obo_name']= array(
- '#type' => 'textfield',
- '#title' => t('New Vocabulary Name'),
- '#description' => t('Please provide a name for this vocabulary. After upload, this name will appear in the drop down
- list above for use again later. Additionally, if a default namespace is not provided in the OBO
- header this name will be used as the default_namespace.'),
- );
- $form['obo_new']['obo_url']= array(
- '#type' => 'textfield',
- '#title' => t('Remote URL'),
- '#description' => t('Please enter a URL for the online OBO file. The file will be downloaded and parsed.
- (e.g. http://www.obofoundry.org/ro/ro.obo)'),
- );
- $form['obo_new']['obo_file']= array(
- '#type' => 'textfield',
- '#title' => t('Local File'),
- '#description' => t('Please enter the file system path for an OBO
- definition file. If entering a path relative to
- the Drupal installation you may use a relative path that excludes the
- Drupal installation directory (e.g. sites/default/files/xyz.obo). Note
- that Drupal relative paths have no preceeding slash.
- Otherwise, please provide the full path on the filesystem. The path
- must be accessible to the web server on which this Drupal instance is running.'),
- );
- return $form;
- }
- /**
- * @see TripalImporter::formSubmit()
- */
- public function formSubmit($form, &$form_state) {
- $obo_id = $form_state['values']['obo_id'];
- $obo_name = trim($form_state['values']['obo_name']);
- $obo_url = trim($form_state['values']['obo_url']);
- $obo_file = trim($form_state['values']['obo_file']);
- $uobo_name = array_key_exists('uobo_name', $form_state['values']) ? trim($form_state['values']['uobo_name']) : '';
- $uobo_url = array_key_exists('uobo_url', $form_state['values']) ? trim($form_state['values']['uobo_url']) : '';
- $uobo_file = array_key_exists('uobo_file', $form_state['values']) ? trim($form_state['values']['uobo_file']) : '';
- // If the user requested to alter the details then do that.
- if ($form_state['clicked_button']['#name'] == 'update_obo_details') {
- $form_state['rebuild'] = TRUE;
- $success = db_update('tripal_cv_obo')
- ->fields(array(
- 'name' => $uobo_name,
- 'path' => $uobo_url ? $uobo_url : $uobo_file,
- ))
- ->condition('obo_id', $obo_id)
- ->execute();
- if ($success) {
- drupal_set_message(t("The vocabulary !vocab has been updated.", array('!vocab' => $uobo_name)));
- }
- else {
- drupal_set_message(t("The vocabulary !vocab could not be updated.", array('!vocab' => $uobo_name)), 'error');
- }
- }
- elseif (!empty($obo_name)) {
- $obo_id = db_insert('tripal_cv_obo')
- ->fields(array(
- 'name' => $obo_name,
- 'path' => $obo_url ? $obo_url : $obo_file,
- ))
- ->execute();
- // Add the obo_id to the form_state vaules.
- $form_state['values']['obo_id'] = $obo_id;
- if ($obo_id) {
- drupal_set_message(t("The vocabulary !vocab has been added.", array('!vocab' => $obo_name)));
- }
- else {
- $form_state['rebuild'] = TRUE;
- drupal_set_message(t("The vocabulary !vocab could not be added.", array('!vocab' => $obo_name)), 'error');
- }
- }
- }
- /**
- * @see TripalImporter::formValidate()
- */
- public function formValidate($form, &$form_state) {
- $obo_id = $form_state['values']['obo_id'];
- $obo_name = trim($form_state['values']['obo_name']);
- $obo_url = trim($form_state['values']['obo_url']);
- $obo_file = trim($form_state['values']['obo_file']);
- $uobo_name = array_key_exists('uobo_name', $form_state['values']) ? trim($form_state['values']['uobo_name']) : '';
- $uobo_url = array_key_exists('uobo_url', $form_state['values']) ? trim($form_state['values']['uobo_url']) : '';
- $uobo_file = array_key_exists('uobo_file', $form_state['values']) ? trim($form_state['values']['uobo_file']) : '';
- // Make sure if the name is changed it doesn't conflict with another OBO.
- if ($form_state['clicked_button']['#name'] == 'update_obo_details' or
- $form_state['clicked_button']['#name'] == 'update_load_obo') {
- // Get the current record
- $vocab = db_select('tripal_cv_obo', 't')
- ->fields('t', array('obo_id', 'name', 'path'))
- ->condition('name', $uobo_name)
- ->execute()
- ->fetchObject();
- if ($vocab and $vocab->obo_id != $obo_id) {
- form_set_error('uobo_name', 'The vocabulary name must be different from existing vocabularies');
- }
- // Make sure the file exists. First check if it is a relative path
- $dfile = $_SERVER['DOCUMENT_ROOT'] . base_path() . $uobo_file;
- if (!file_exists($dfile)) {
- if (!file_exists($uobo_file)) {
- form_set_error('uobo_file', 'The specified path does not exist or cannot be read.');
- }
- }
- if (!$uobo_url and !$uobo_file) {
- form_set_error('uobo_url', 'Please provide a URL or a path for the vocabulary.');
- }
- if ($uobo_url and $uobo_file) {
- form_set_error('uobo_url', 'Please provide only a URL or a path for the vocabulary, but not both.');
- }
- }
- if ($form_state['clicked_button']['#name'] == 'add_new_obo') {
- // Get the current record
- $vocab = db_select('tripal_cv_obo', 't')
- ->fields('t', array('obo_id', 'name', 'path'))
- ->condition('name', $obo_name)
- ->execute()
- ->fetchObject();
- if ($vocab) {
- form_set_error('obo_name', 'The vocabulary name must be different from existing vocabularies');
- }
- // Make sure the file exists. First check if it is a relative path
- $dfile = $_SERVER['DOCUMENT_ROOT'] . base_path() . $obo_file;
- if (!file_exists($dfile)) {
- if (!file_exists($obo_file)) {
- form_set_error('obo_file', 'The specified path does not exist or cannot be read.');
- }
- }
- if (!$obo_url and !$obo_file) {
- form_set_error('obo_url', 'Please provide a URL or a path for the vocabulary.');
- }
- if ($obo_url and $obo_file) {
- form_set_error('obo_url', 'Please provide only a URL or a path for the vocabulary, but not both.');
- }
- }
- }
- /**
- * @see TripalImporter::run()
- *
- * @param $details
- * The following arguments are supported:
- * - obo_id: (required) The ID of the ontology to be imported.
- */
- public function run() {
- $arguments = $this->arguments['run_args'];
- $obo_id = $arguments['obo_id'];
- // Make sure the $obo_id is valid
- $obo = db_select('tripal_cv_obo', 'tco')
- ->fields('tco')
- ->condition('obo_id', $obo_id)
- ->execute()
- ->fetchObject();
- if (!$obo) {
- throw new Exception("Invalid OBO ID provided: '$obo_id'.");
- }
- $this->loadOBO_v1_2_id($obo);
- }
- /**
- * @see TripalImporter::postRun()
- *
- */
- public function postRun() {
- // Update the cv_root_mview materiailzed view.
- $this->logMessage("Updating the cv_root_mview materialized view...");
- $mview_id = tripal_get_mview_id('cv_root_mview');
- tripal_populate_mview($mview_id);
- $this->logMessage("Updating the db2cv_mview materialized view...");
- $mview_id = tripal_get_mview_id('db2cv_mview');
- tripal_populate_mview($mview_id);
- // Upate the cvtermpath table for each newly added CV.
- $this->logMessage("Updating cvtermpath table. This may take a while...");
- foreach ($this->newcvs as $namespace => $cvid) {
- $this->logMessage("- Loading paths for @vocab", array('@vocab' => $namespace));
- tripal_update_cvtermpath($cvid);
- }
- }
- /**
- * A wrapper function for importing the user specified OBO file into Chado by
- * specifying the obo_id of the OBO. It requires that the file be in OBO v1.2
- * compatible format. This function is typically executed via the Tripal jobs
- * management after a user submits a job via the Load Onotloies form.
- *
- * @param $obo_id
- * An obo_id from the tripal_cv_obo file that specifies which OBO file to import
- * @ingroup tripal_obo_loader
- */
- private function loadOBO_v1_2_id($obo) {
- // Convert the module name to the real path if present
- if (preg_match("/\{(.*?)\}/", $obo->path, $matches)) {
- $module = $matches[1];
- $path = drupal_realpath(drupal_get_path('module', $module));
- $obo->path = preg_replace("/\{.*?\}/", $path, $obo->path);
- }
- // if the reference is for a remote URL then run the URL processing function
- if (preg_match("/^https:\/\//", $obo->path) or
- preg_match("/^http:\/\//", $obo->path) or
- preg_match("/^ftp:\/\//", $obo->path)) {
- $this->loadOBO_v1_2_url($obo->name, $obo->path, 0);
- }
- // if the reference is for a local file then run the file processing function
- else {
- // check to see if the file is located local to Drupal
- $dfile = $_SERVER['DOCUMENT_ROOT'] . base_path() . $obo->path;
- if (file_exists($dfile)) {
- $this->loadOBO_v1_2_file($obo->name, $dfile, 0);
- }
- // if not local to Drupal, the file must be someplace else, just use
- // the full path provided
- else {
- if (file_exists($obo->path)) {
- $this->loadOBO_v1_2_file($obo->name, $obo->path, 0);
- }
- else {
- print "ERROR: could not find OBO file: '$obo->path'\n";
- }
- }
- }
- }
- /**
- * A wrapper function for importing the user specified OBO file into Chado by
- * specifying the filename and path of the OBO. It requires that the file be in OBO v1.2
- * compatible format. This function is typically executed via the Tripal jobs
- * management after a user submits a job via the Load Onotloies form.
- *
- * @param $obo_name
- * The name of the OBO (typially the ontology or controlled vocabulary name)
- * @param $file
- * The path on the file system where the ontology can be found
- * @param $is_new
- * Set to TRUE if this is a new ontology that does not yet exist in the
- * tripal_cv_obo table. If TRUE the OBO will be added to the table.
- *
- * @ingroup tripal_obo_loader
- */
- private function loadOBO_v1_2_file($obo_name, $file, $is_new = TRUE) {
- if ($is_new) {
- tripal_insert_obo($obo_name, $file);
- }
- $success = $this->loadOBO_v1_2($file, $obo_name);
- }
- /**
- * A wrapper function for importing the user specified OBO file into Chado by
- * specifying the remote URL of the OBO. It requires that the file be in OBO v1.2
- * compatible format. This function is typically executed via the Tripal jobs
- * management after a user submits a job via the Load Onotloies form.
- *
- * @param $obo_name
- * The name of the OBO (typially the ontology or controlled vocabulary name)
- * @param $url
- * The remote URL of the OBO file.
- * @param $is_new
- * Set to TRUE if this is a new ontology that does not yet exist in the
- * tripal_cv_obo table. If TRUE the OBO will be added to the table.
- *
- * @ingroup tripal_obo_loader
- */
- private function loadOBO_v1_2_url($obo_name, $url, $is_new = TRUE) {
- // first download the OBO
- $temp = tempnam(sys_get_temp_dir(), 'obo_');
- print "Downloading URL $url, saving to $temp\n";
- $url_fh = fopen($url, "r");
- $obo_fh = fopen($temp, "w");
- if (!$url_fh) {
- throw new Exception("Unable to download the remote OBO file at $url. Could a firewall be blocking outgoing connections? " .
- " if you are unable to download the file you may manually downlod the OBO file and use the web interface to " .
- " specify the location of the file on your server.");
- }
- while (!feof($url_fh)) {
- fwrite($obo_fh, fread($url_fh, 255), 255);
- }
- fclose($url_fh);
- fclose($obo_fh);
- if ($is_new) {
- tripal_insert_obo($obo_name, $url);
- }
- // second, parse the OBO
- $this->loadOBO_v1_2($temp, $obo_name);
- // now remove the temp file
- unlink($temp);
- }
- /**
- * Imports a given OBO file into Chado. This function is usually called by
- * one of three wrapper functions: loadOBO_v1_2_id,
- * loadOBO_v1_2_file or tirpal_cv_load_obo_v1_2_url. But, it can
- * be called directly if the full path to an OBO file is available on the
- * file system.
- *
- * @param $flie
- * The full path to the OBO file on the file system
- *
- * @ingroup tripal_obo_loader
- */
- private function loadOBO_v1_2($file, $obo_name) {
- $header = array();
- $ret = array();
- // Empty the temp table.
- $sql = "DELETE FROM {tripal_obo_temp}";
- chado_query($sql);
- $this->logMessage("Step 1: Preloading File $file...");
- // parse the obo file
- $default_db = $this->parse($file, $header);
- // Add the CV for this ontology to the database. The v1.2 definition
- // specifies a 'default-namespace' to be used if a 'namespace' is not
- // present for each stanza. Some ontologies have adopted the v1.4 method
- // in their v1.2 files and not including it.
- if (array_key_exists('default-namespace', $header)) {
- $defaultcv = tripal_insert_cv($header['default-namespace'][0], '');
- if (!$defaultcv) {
- throw new Exception('Cannot add namespace ' . $header['default-namespace'][0]);
- }
- $this->newcvs[$header['default-namespace'][0]] = $defaultcv->cv_id;
- }
- // If the 'default-namespace' is missing.
- else {
- // Grab the first term accession from the file and get the short name for the cv
- $fh = fopen($file, 'r');
- while ($line = fgets($fh)) {
- // Grab the first item's id info to break apart.
- if (preg_match('/^\s*\[/', $line)) {
- $stanza = TRUE;
- continue;
- }
- if ($stanza === TRUE && (substr($line, 0, 3) === "id:")) {
- $parts = explode(':', $line);
- $short_name = strtolower($parts[1]);
- $short_name = preg_replace('/\s+/', '', $short_name);
- break;
- }
- }
- fclose($fh);
- // Check if the EBI ontology search has this ontology:
- try {
- $results = $this->oboEbiLookup($short_name, 'ontology');
- if (array_key_exists('default-namespace', $results['config']['annotations'])) {
- $results = $results['config']['annotations']['default-namespace'];
- if (is_array($results)) {
- $results = $results[0];
- }
- }
- elseif (array_key_exists('namespace', $results['config'])) {
- $results = $results['config']['namespace'];
- }
- else {
- $results = $short_name;
- }
- $defaultcv = tripal_insert_cv(strtoupper($results), '');
- $this->newcvs[$defaultcv->name] = $defaultcv->cv_id;
- }
- catch (Exception $e) {
- watchdog_exception('OBOImporter no such accession found in EBI Ontology Search', $e);
- }
-
- if (empty($defaultcv)) {
- throw new Exception("Could not find a namespace for this OBO file: $file");
- }
- $this->logMessage("This OBO is missing the 'default-namespace' header. It " .
- "is not possible to determine which vocabulary terms without a 'namespace' key " .
- "should go. Instead, those terms will be placed in the '!vocab' vocabulary.",
- array('!vocab' => $defaultcv->name), TRIPAL_WARNING);
- }
- // Add any typedefs to the vocabulary first.
- $this->logMessage("Step 2: Loading type defs...");
- $this->loadTypeDefs($defaultcv, $default_db);
- // Next add terms to the vocabulary.
- $this->logMessage("Step 3: Loading terms...");
- if (!$this->processTerms($defaultcv, $default_db)) {
- throw new Exception('Cannot add terms from this ontology');
- }
- }
- /**
- * OBO files are divided into a typedefs terms section and vocabulary terms section.
- * This function loads the typedef terms from the OBO.
- *
- * @param $defaultcv
- * A database object containing a record from the cv table for the
- * default controlled vocabulary
- * @param $default_db
- * The name of the default database.
- *
- * @ingroup tripal_obo_loader
- */
- private function loadTypeDefs($defaultcv, $default_db) {
- $sql = "SELECT * FROM {tripal_obo_temp} WHERE type = 'Typedef' ";
- $typedefs = chado_query($sql);
- $sql = "
- SELECT count(*) as num_terms
- FROM {tripal_obo_temp}
- WHERE type = 'Typedef'
- ";
- $result = chado_query($sql)->fetchObject();
- $count = $result->num_terms;
- $this->setTotalItems($count);
- $this->setItemsHandled(0);
- $i = 0;
- foreach ($typedefs as $typedef) {
- $this->setItemsHandled($i);
- $term = unserialize(base64_decode($typedef->stanza));
- $this->processTerm($term, $defaultcv->name, 1, $default_db);
- $i++;
- }
- $this->setItemsHandled($i);
- return 1;
- }
- /**
- * OBO files are divided into a typedefs section and a terms section.
- *
- * This function loads the typedef terms from the OBO.
- *
- * @param $defaultcv
- * A database object containing a record from the cv table for the
- * default controlled vocabulary
- * @param $default_db
- * The name of the default database.
- */
- private function processTerms($defaultcv, $default_db) {
- $i = 0;
- $external = FALSE;
- // Iterate through each term from the OBO file and add it.
- $sql = "
- SELECT * FROM {tripal_obo_temp}
- WHERE type = 'Term'
- ORDER BY id
- ";
- $terms = chado_query($sql);
- $sql = "
- SELECT count(*) as num_terms
- FROM {tripal_obo_temp}
- WHERE type = 'Term'
- ";
- $result = chado_query($sql)->fetchObject();
- $count = $result->num_terms;
- $this->setTotalItems($count);
- $this->setItemsHandled(0);
- // Iterate through the terms.
- foreach ($terms as $t) {
- $term = unserialize(base64_decode($t->stanza));
- $this->setItemsHandled($i);
- // Add/update this term.
- $status = $this->processTerm($term, $defaultcv->name, 0, $default_db);
- if (!$status) {
- throw new Exception("Failed to process terms from the ontology");
- }
- else if ($status === 2 && $external == FALSE) {
- $this->logMessage(
- "A term that belongs to another ontology is used within this " .
- "vocabulary. Therefore a lookup was performed with the EBI Ontology " .
- "Lookup Service to retrieve the information for this term. " .
- "Please note, that vocabularies with many non-local terms " .
- "require remote lookups and these lookups can dramatically " .
- "decrease loading time. " ,
- array('!vocab' => $defaultcv->name),
- TRIPAL_WARNING
- );
- $external = TRUE;
- }
- $i++;
- }
- $this->setItemsHandled($i);
- return 1;
- }
- /**
- * Uses the provided term array to add/update information to Chado about the
- * term including the term, dbxref, synonyms, properties, and relationships.
- *
- * @param $term
- * An array representing the cvterm.
- * @param $defaultcv
- * The name of the default controlled vocabulary
- * @is_relationship
- * Set to 1 if this term is a relationship term
- * @default_db
- * The name of the default database.
- *
- * @ingroup tripal_obo_loader
- */
- private function processTerm($term, $defaultcv, $is_relationship = 0, $default_db) {
- // make sure we have a namespace for this term
- if (!array_key_exists('namespace', $term) and !($defaultcv or $defaultcv == '')) {
- throw new Exception("Cannot add the term: no namespace defined. " . $term['id'][0]);
- }
- // construct the term array for sending to the tripal_chado_add_cvterm function
- // for adding a new cvterm
- $t = array();
- $t['id'] = $term['id'][0];
- $t['name'] = $term['name'][0];
- if (array_key_exists('def', $term)) {
- $t['definition'] = $term['def'][0];
- }
- if (array_key_exists('subset', $term)) {
- $t['subset'] = $term['subset'][0];
- }
- if (array_key_exists('namespace', $term)) {
- $t['namespace'] = $term['namespace'][0];
- }
- if (array_key_exists('is_obsolete', $term)) {
- $t['is_obsolete'] = $term['is_obsolete'][0];
- }
- // Check the id isn't a reference to another term.
- //TODO: Check chado for the accession, so we can avoid lookups where possible.
- if (strpos($t['id'], ':')) {
- $pair = explode(":", $t['id']);
- $ontology_id = $pair[0];
- $accession_num = $pair[1];
- if (is_numeric($accession_num) && ($ontology_id != $default_db)) {
- // Check that the term isn't already in Chado.
- $results = $this->oboEbiLookup($t['id'], 'term');
- if (isset($results['label'])) {
- $t['name'] = $results['label'];
- $defaultcv = $results['ontology_name'];
- $default_db = $results['ontology_prefix'];
- $external = TRUE;
- }
- if (!isset($results['label'])) {
- $results = $this->oboEbiLookup($t['id'], 'query');
- if (array_key_exists('docs', $results)) {
- if (!empty($results['response']['docs'])) {
- if (count($results['response']['docs']) > 1) {
- foreach ($results['response']['docs'] as $doc) {
- if ($doc['obo_id'] == $t['id']) {
- $t['name'] = $doc['label'];
- $defaultcv = $doc['ontology_name'];
- $default_db = $doc['ontology_prefix'];
- $external = true;
- }
- }
- } else {
- $t['name'] = $results['response']['docs'][0]['label'];
- $defaultcv = $results['response']['docs'][0]['ontology_name'];
- $default_db = $results['response']['docs'][0]['ontology_prefix'];
- $external = true;
- }
- }
- }
- }
- if ($results['response']['numFound'] == 0 && !isset($results['label'])) {
- // The first search doesn't work, so let's try a broader one.
- $results = $this->oboEbiLookup($t['id'], 'query-non-local');
- if (!empty($results)) {
- if (array_key_exists('docs', $results)) {
- if (!empty($results['docs'])) {
- $accession = $t['id'];
- $accession_underscore = str_replace(":", "_", $accession);
- foreach ($results['response']['docs'] as $item) {
- if ($item['label'] != $accession && $item['label'] != $accession_underscore) {
- //Found the first place a label is other than the accession is used, so take
- // that info and then end the loop.
- $t['name'] = $item['label'];
- $defaultcv = $item['ontology_name'];
- $default_db = $item['ontology_prefix'];
- $external = true;
- break;
- }
- }
- }
- }
- }
- }
- }
- }
- // Check that the default_cv is in the cv table.
- $sql = "
- SELECT CV.name
- FROM {cv} CV
- WHERE CV.name = '$defaultcv'
- ";
- $results = chado_query($sql)->fetchObject();
- if (!$results){
- //The controlled vocabulary is not in the cv term table and needs to be added.
- $ontology_info = $this->oboEbiLookup($defaultcv, 'ontology');
- if (!empty($ontology_info['config'])){
- // CV Name.
- if (array_key_exists('namespace', $ontology_info['config'])) {
- $cv_info = $ontology_info['config']['namespace'];
- }
- elseif (array_key_exists('default-namespace', $ontology_info['config']['annotations'])) {
- $cv_info = $ontology_info['config']['annotations']['default-namespace'];
- }
- //CV Description.
- if (array_key_exists('description', $ontology_info['config'])) {
- $description = $ontology_info['config']['description'];
- }
- else {
- $description = '';
- }
- $cv_returned = chado_insert_cv($cv_info, $description);
- if($cv_returned) {
- $defaultcv = $cv_returned->name;
- // Now add the db entry.
- $values = array(
- 'name' => $ontology_info['config']['preferredPrefix'],
- 'description' => $ontology_info['config']['description'],
- 'url' => $ontology_info['config']['versionIri'],
- );
-
- $db_returned = chado_insert_db($values);
- if ($db_returned) {
- $default_db = $db_returned->name;
- }
- }
- }
- }
- $t['cv_name'] = $defaultcv;
- $t['is_relationship'] = $is_relationship;
- $t['db_name'] = $default_db;
- // The name being empty regularly causes problems, so let's check it's there.
- if (empty($t['name'])){
- $results = $this->oboEbiLookup($t['id'], 'term');
- if (isset($results['label'])) {
- $t['name'] = $results['label'];
- }
- }
- $cvterm = tripal_insert_cvterm($t, array('update_existing' => TRUE));
- if (!$cvterm) {
- throw new Exception("Cannot add the term " . $term['id'][0]);
- }
- // Remove any relationships that this term already has (in case it was
- // updated) and we'll re-add them.
- $sql = "
- DELETE FROM {cvterm_relationship} CVTR
- WHERE CVTR.subject_id = :cvterm_id
- ";
- chado_query($sql, array(':cvterm_id' => $cvterm->cvterm_id));
- if (array_key_exists('namespace', $term)) {
- $this->newcvs[$term['namespace'][0]] = $cvterm->cv_id;
- }
- // now handle other properites
- if (array_key_exists('is_anonymous', $term)) {
- //print "WARNING: unhandled tag: is_anonymous\n";
- }
- if (array_key_exists('alt_id', $term)) {
- foreach ($term['alt_id'] as $alt_id) {
- if (!$this->addCvtermDbxref($cvterm, $alt_id)) {
- throw new Exception("Cannot add alternate id $alt_id");
- }
- }
- }
- if (array_key_exists('subset', $term)) {
- //print "WARNING: unhandled tag: subset\n";
- }
- // add synonyms for this cvterm
- if (array_key_exists('synonym', $term)) {
- if (!$this->addSynonym($term, $cvterm)) {
- throw new Exception("Cannot add synonyms");
- }
- }
- // reformat the deprecated 'exact_synonym, narrow_synonym, and broad_synonym'
- // types to be of the v1.2 standard
- if (array_key_exists('exact_synonym', $term) or array_key_exists('narrow_synonym', $term) or array_key_exists('broad_synonym', $term)) {
- if (array_key_exists('exact_synonym', $term)) {
- foreach ($term['exact_synonym'] as $synonym) {
- $new = preg_replace('/^\s*(\".+?\")(.*?)$/', '$1 EXACT $2', $synonym);
- $term['synonym'][] = $new;
- }
- }
- if (array_key_exists('narrow_synonym', $term)) {
- foreach ($term['narrow_synonym'] as $synonym) {
- $new = preg_replace('/^\s*(\".+?\")(.*?)$/', '$1 NARROW $2', $synonym);
- $term['synonym'][] = $new;
- }
- }
- if (array_key_exists('broad_synonym', $term)) {
- foreach ($term['broad_synonym'] as $synonym) {
- $new = preg_replace('/^\s*(\".+?\")(.*?)$/', '$1 BROAD $2', $synonym);
- $term['synonym'][] = $new;
- }
- }
- if (!$this->addSynonym($term, $cvterm)) {
- throw new Exception("Cannot add/update synonyms");
- }
- }
- // add the comment to the cvtermprop table
- if (array_key_exists('comment', $term)) {
- $comments = $term['comment'];
- $j = 0;
- foreach ($comments as $comment) {
- if (!$this->addCvtermProp($cvterm, 'comment', $comment, $j)) {
- throw new Exception("Cannot add/update cvterm property");
- }
- $j++;
- }
- }
- // add any other external dbxrefs
- if (array_key_exists('xref', $term)) {
- foreach ($term['xref'] as $xref) {
- if (!$this->addCvtermDbxref($cvterm, $xref)) {
- throw new Exception("Cannot add/update cvterm database reference (dbxref).");
- }
- }
- }
- if (array_key_exists('xref_analog', $term)) {
- foreach ($term['xref_analog'] as $xref) {
- if (!$this->addCvtermDbxref($cvterm, $xref)) {
- throw new Exception("Cannot add/update cvterm database reference (dbxref).");
- }
- }
- }
- if (array_key_exists('xref_unk', $term)) {
- foreach ($term['xref_unk'] as $xref) {
- if (!$this->addCvtermDbxref($cvterm, $xref)) {
- throw new Exception("Cannot add/update cvterm database reference (dbxref).");
- }
- }
- }
- // add is_a relationships for this cvterm
- if (array_key_exists('is_a', $term)) {
- foreach ($term['is_a'] as $is_a) {
- if (!$this->addRelationship($cvterm, $defaultcv, 'is_a', $is_a, $is_relationship, $default_db)) {
- throw new Exception("Cannot add relationship is_a: $is_a");
- }
- }
- }
- if (array_key_exists('intersection_of', $term)) {
- //print "WARNING: unhandled tag: intersection_of\n";
- }
- if (array_key_exists('union_of', $term)) {
- //print "WARNING: unhandled tag: union_on\n";
- }
- if (array_key_exists('disjoint_from', $term)) {
- //print "WARNING: unhandled tag: disjoint_from\n";
- }
- if (array_key_exists('relationship', $term)) {
- foreach ($term['relationship'] as $value) {
- $rel = preg_replace('/^(.+?)\s.+?$/', '\1', $value);
- $object = preg_replace('/^.+?\s(.+?)$/', '\1', $value);
- if (!$this->addRelationship($cvterm, $defaultcv, $rel, $object, $is_relationship, $default_db)) {
- throw new Exception("Cannot add relationship $rel: $object");
- }
- }
- }
- if (array_key_exists('replaced_by', $term)) {
- //print "WARNING: unhandled tag: replaced_by\n";
- }
- if (array_key_exists('consider', $term)) {
- //print "WARNING: unhandled tag: consider\n";
- }
- if (array_key_exists('use_term', $term)) {
- //print "WARNING: unhandled tag: user_term\n";
- }
- if (array_key_exists('builtin', $term)) {
- //print "WARNING: unhandled tag: builtin\n";
- }
- if ($external ) {
- return 2;
- }
- return 1;
- }
- /**
- * Adds a cvterm relationship
- *
- * @param $cvterm
- * A database object for the cvterm
- * @param $rel
- * The relationship name
- * @param $objname
- * The relationship term name
- * @param $defaultcv
- * A database object containing a record from the cv table for the
- * default controlled vocabulary
- * @object_is_relationship
- * Set to 1 if this term is a relationship term
- * @default_db
- * The name of the default database.
- *
- * @ingroup tripal_obo_loader
- */
- private function addRelationship($cvterm, $defaultcv, $rel,
- $objname, $object_is_relationship = 0, $default_db = 'OBO_REL') {
- $reference_term = FALSE;
- $in_obo = $this->getTerm($objname);
- // If an accession was passed we need to see if we can find the actual label.
- if (strpos($rel, ':') || strpos($objname, ':') && empty($in_obo['name'])) {
- if (strpos($rel, ':')) {
- $term_id = $rel;
- }
- elseif (strpos($objname, ':')) {
- $term_id = $objname;
- }
- $reference_term = TRUE;
- $pair = explode(":", $term_id);
- $ontology_id = $pair[0];
- $accession_num = $pair[1];
- $rel_name = '';
- if (is_numeric($accession_num)) {
- $results = $this->oboEbiLookup($term_id, 'term');
- if (isset($results['label'])) {
- $rel_name = $results['label'];
- $oterm = $results;
- }
- if (empty($rel_name)) {
- $results = $this->oboEbiLookup($term_id, 'query');
- if (array_key_exists('docs', $results['response'])){
- if(!empty($results['response']['docs'])) {
- if (count($results['response']['docs']) > 1) {
- foreach ($results['response']['docs'] as $doc) {
- if ($doc['obo_id'] == $term_id) {
- $rel_name = $doc['label'];
- $oterm = $doc;
- }
- }
- }
- else {
- $rel_name = $results['response']['docs'][0]['label'];
- $oterm = $results['response']['docs'][0];
- }
- }
- }
- }
- if (empty($rel_name)) {
- // The first search doesn't work, so let's try a broader one.
- $results = $this->oboEbiLookup($term_id, 'query-non-local');
- if (!empty($results)) {
- if (array_key_exists('docs', $results['response'])) {
- if (!empty($results['response']['docs'])) {
- foreach ($results['response']['docs'] as $item) {
- if ($item['obo_id'] == $term_id) {
- //Found the first place a label is other than the accession is used, so take
- // that info and then end the loop.
- $rel_name = $item['label'];
- $oterm = $item;
- break;
- }
- }
- }
- }
- }
- }
- }
- }
- // Make sure the relationship cvterm exists.
- $term = array(
- 'name' => $rel,
- 'id' => "$default_db:$rel",
- 'definition' => '',
- 'is_obsolete' => 0,
- 'cv_name' => $defaultcv,
- 'is_relationship' => TRUE,
- 'db_name' => $default_db
- );
- $relcvterm = tripal_insert_cvterm($term, array('update_existing' => FALSE));
- if (!$relcvterm) {
- // If the relationship term couldn't be found in the default_db provided
- // then do on more check to find it in the relationship ontology
- $term = array(
- 'name' => $rel,
- 'id' => "OBO_REL:$rel",
- 'definition' => '',
- 'is_obsolete' => 0,
- 'cv_name' => $defaultcv,
- 'is_relationship' => TRUE,
- 'db_name' => 'OBO_REL'
- );
- $relcvterm = tripal_insert_cvterm($term, array('update_existing' => FALSE));
- if (!$relcvterm) {
- throw new Exception("Cannot find the relationship term in the current ontology or in the relationship ontology: $rel\n");
- }
- }
- // Get the object term.
- if ($reference_term === TRUE && !empty($oterm)) {
- $objterm = array();
- $objterm['id'] = $oterm['label'];
- $objterm['name'] = $oterm['obo_id'];
- if (array_key_exists('def', $oterm)) {
- $objterm['definition'] = $oterm['def'];
- }
- if (array_key_exists('subset', $oterm)) {
- $objterm['subset'] = $oterm['subset'];
- }
- if (array_key_exists('namespace', $oterm)) {
- $objterm['namespace'] = $oterm['ontology_name'];
- }
- if (array_key_exists('is_obsolete', $oterm)) {
- $objterm['is_obsolete'] = $oterm['is_obsolete'];
- }
- }
- else {
- $oterm = $this->getTerm($objname);
- if (!$oterm) {
- throw new Exception("Could not find object term $objname\n");
- }
- $objterm = array();
- $objterm['id'] = $oterm['id'][0];
- $objterm['name'] = $oterm['name'][0];
- if (array_key_exists('def', $oterm)) {
- $objterm['definition'] = $oterm['def'][0];
- }
- if (array_key_exists('subset', $oterm)) {
- $objterm['subset'] = $oterm['subset'][0];
- }
- if (array_key_exists('namespace', $oterm)) {
- $objterm['namespace'] = $oterm['namespace'][0];
- }
- if (array_key_exists('is_obsolete', $oterm)) {
- $objterm['is_obsolete'] = $oterm['is_obsolete'][0];
- }
- }
- $objterm['cv_name' ] = $defaultcv;
- $objterm['is_relationship'] = $object_is_relationship;
- $objterm['db_name'] = $default_db;
- $objcvterm = tripal_insert_cvterm($objterm, array('update_existing' => TRUE));
- if (!$objcvterm) {
- throw new Exception("Cannot add cvterm " . $objterm['name']);
- }
- // check to see if the cvterm_relationship already exists, if not add it
- $values = array(
- 'type_id' => $relcvterm->cvterm_id,
- 'subject_id' => $cvterm->cvterm_id,
- 'object_id' => $objcvterm->cvterm_id
- );
- $result = chado_select_record('cvterm_relationship', array('*'), $values);
- if (count($result) == 0) {
- $options = array('return_record' => FALSE);
- $success = chado_insert_record('cvterm_relationship', $values, $options);
- if (!$success) {
- throw new Exception("Cannot add term relationship: '$cvterm->name' $rel '$objcvterm->name'");
- }
- }
- return TRUE;
- }
- /**
- * Retrieves the term array from the temp loading table for a given term id.
- *
- * @param id
- * The id of the term to retrieve
- *
- * @ingroup tripal_obo_loader
- */
- private function getTerm($id) {
- $values = array('id' => $id);
- $result = chado_select_record('tripal_obo_temp', array('stanza'), $values);
- if (count($result) == 0) {
- return FALSE;
- }
- return unserialize(base64_decode($result[0]->stanza));
- }
- /**
- * Adds the synonyms to a term
- *
- * @param term
- * An array representing the cvterm. It must have a 'synonym' key/value pair.
- * @param cvterm
- * The database object of the cvterm to which the synonym will be added.
- *
- * @ingroup tripal_obo_loader
- */
- private function addSynonym($term, $cvterm) {
- // make sure we have a 'synonym_type' vocabulary
- $syncv = tripal_insert_cv(
- 'synonym_type',
- 'A local vocabulary added for synonym types.'
- );
- // now add the synonyms
- if (array_key_exists('synonym', $term)) {
- foreach ($term['synonym'] as $synonym) {
- // separate out the synonym definition and the synonym type
- $def = preg_replace('/^\s*"(.*)"\s*.*$/', '\1', $synonym);
- // the scope will be 'EXACT', etc...
- $scope = drupal_strtolower(preg_replace('/^.*"\s+(.*?)\s+.*$/', '\1', $synonym));
- if (!$scope) { // if no scope then default to 'exact'
- $scope = 'exact';
- }
- // make sure the synonym type exists in the 'synonym_type' vocabulary
- $values = array(
- 'name' => $scope,
- 'cv_id' => array(
- 'name' => 'synonym_type',
- ),
- );
- $syntype = tripal_get_cvterm($values);
- // if it doesn't exist then add it
- if (!$syntype) {
- // build a 'term' object so we can add the missing term
- $term = array(
- 'name' => $scope,
- 'id' => "synonym_type:$scope",
- 'definition' => '',
- 'is_obsolete' => 0,
- 'cv_name' => $syncv->name,
- 'is_relationship' => FALSE
- );
- $syntype = tripal_insert_cvterm($term, array('update_existing' => TRUE));
- if (!$syntype) {
- throw new Exception("Cannot add synonym type: internal:$scope");
- }
- }
- // make sure the synonym doesn't already exists
- $values = array(
- 'cvterm_id' => $cvterm->cvterm_id,
- 'synonym' => $def
- );
- $results = chado_select_record('cvtermsynonym', array('*'), $values);
- if (count($results) == 0) {
- $values = array(
- 'cvterm_id' => $cvterm->cvterm_id,
- 'synonym' => $def,
- 'type_id' => $syntype->cvterm_id
- );
- $options = array('return_record' => FALSE);
- $success = chado_insert_record('cvtermsynonym', $values, $options);
- if (!$success) {
- throw new Exception("Failed to insert the synonym for term: $cvterm->name ($def)");
- }
- }
- // now add the dbxrefs for the synonym if we have a comma in the middle
- // of a description then this will cause problems when splitting os lets
- // just change it so it won't mess up our splitting and then set it back
- // later.
- /**
- $synonym = preg_replace('/(".*?),\s(.*?")/','$1,_$2',$synonym);
- $dbxrefs = preg_split("/, /",preg_replace('/^.*\[(.*?)\]$/','\1',$synonym));
- foreach ($dbxrefs as $dbxref) {
- $dbxref = preg_replace('/,_/',", ",$dbxref);
- if ($dbxref) {
- $this->addCvtermDbxref($syn,$dbxref);
- }
- }
- */
- }
- }
- return TRUE;
- }
- /**
- * Parse the OBO file and populate the templ loading table
- *
- * @param $file
- * The path on the file system where the ontology can be found
- * @param $header
- * An array passed by reference that will be populated with the header
- * information from the OBO file
- *
- * @ingroup tripal_obo_loader
- */
- private function parse($obo_file, &$header) {
- $in_header = 1;
- $stanza = array();
- $default_db = '';
- $line_num = 0;
- $num_read = 0;
- $type = '';
- $filesize = filesize($obo_file);
- $this->setTotalItems($filesize);
- $this->setItemsHandled(0);
- // iterate through the lines in the OBO file and parse the stanzas
- $fh = fopen($obo_file, 'r');
- while ($line = fgets($fh)) {
- $line_num++;
- $size = drupal_strlen($line);
- $num_read += $size;
- $line = trim($line);
- $this->setItemsHandled($num_read);
- // remove newlines
- $line = rtrim($line);
- // remove any special characters that may be hiding
- $line = preg_replace('/[^(\x20-\x7F)]*/', '', $line);
- // skip empty lines
- if (strcmp($line, '') == 0) {
- continue;
- }
- //remove comments from end of lines
- $line = preg_replace('/^(.*?)\!.*$/', '\1', $line); // TODO: if the explamation is escaped
-
- // Remove annotations surrounded by brackets. These are found
- // in the Trait Ontology (e.g. TO:1000023 {is_inferred="true"})
- // That construct has useful info, but it is not in the OBO 1.4 format
- // specifications.
- $line = preg_replace('/\{.*?\}/', '', $line);
- // at the first stanza we're out of header
- if (preg_match('/^\s*\[/', $line)) {
- $in_header = 0;
- // store the stanza we just finished reading
- if (sizeof($stanza) > 0) {
- // add the term to the temp table
- $values = array(
- 'id' => $stanza['id'][0],
- 'stanza' => base64_encode(serialize($stanza)),
- 'type' => $type,
- );
- $success = chado_insert_record('tripal_obo_temp', $values);
- if (!$success) {
- throw new Exception("Cannot insert stanza into temporary table.");
- }
- }
- // get the stanza type: Term, Typedef or Instance
- $type = preg_replace('/^\s*\[\s*(.+?)\s*\]\s*$/', '\1', $line);
- // start fresh with a new array
- $stanza = array();
- continue;
- }
- // break apart the line into the tag and value but ignore any escaped colons
- preg_replace("/\\:/", "|-|-|", $line); // temporarily replace escaped colons
- $pair = explode(":", $line, 2);
- $tag = $pair[0];
- $value = ltrim(rtrim($pair[1]));// remove surrounding spaces
- // if this is the ID then look for the default DB
- $matches = array();
- if ($tag == 'id' and preg_match('/^(.+?):.*$/', $value, $matches)) {
- $default_db = $matches[1];
- }
- $tag = preg_replace("/\|-\|-\|/", "\:", $tag); // return the escaped colon
- $value = preg_replace("/\|-\|-\|/", "\:", $value);
- if ($in_header) {
- if (!array_key_exists($tag, $header)) {
- $header[$tag] = array();
- }
- $header[$tag][] = $value;
- }
- else {
- if (!array_key_exists($tag, $stanza)) {
- $stanza[$tag] = array();
- }
- $stanza[$tag][] = $value;
- }
- }
- // now add the last term in the file
- if (sizeof($stanza) > 0) {
- $values = array(
- 'id' => $stanza['id'][0],
- 'stanza' => base64_encode(serialize($stanza)),
- 'type' => $type,
- );
- chado_insert_record('tripal_obo_temp', $values);
- if (!$success) {
- throw new Exception("Cannot insert stanza into temporary table.");
- }
- $this->setItemsHandled($num_read);
- }
- return $default_db;
- }
- /**
- * Adds a database reference to a cvterm
- *
- * @param cvterm
- * The database object of the cvterm to which the synonym will be added.
- * @param xref
- * The cross refernce. It should be of the form from the OBO specification
- *
- * @ingroup tripal_obo_loader
- */
- private function addCvtermDbxref($cvterm, $xref) {
- $dbname = preg_replace('/^(.+?):.*$/', '$1', $xref);
- $accession = preg_replace('/^.+?:\s*(.*?)(\{.+$|\[.+$|\s.+$|\".+$|$)/', '$1', $xref);
- $description = preg_replace('/^.+?\"(.+?)\".*?$/', '$1', $xref);
- $dbxrefs = preg_replace('/^.+?\[(.+?)\].*?$/', '$1', $xref);
- if (!$accession) {
- throw new Exception("Cannot add a dbxref without an accession: '$xref'");
- }
- // if the xref is a database link, handle that specially
- if (strcmp($dbname, 'http') == 0) {
- $accession = $xref;
- $dbname = 'URL';
- }
- // add the database
- $db = tripal_insert_db(array('name' => $dbname));
- if (!$db) {
- throw new Exception("Cannot find database '$dbname' in Chado.");
- }
- // now add the dbxref
- $dbxref = $this->addDbxref($db->db_id, $accession, '', $description);
- if (!$dbxref) {
- throw new Exception("Cannot find or add the database reference (dbxref)");
- }
- // finally add the cvterm_dbxref but first check to make sure it exists
- $values = array(
- 'cvterm_id' => $cvterm->cvterm_id,
- 'dbxref_id' => $dbxref->dbxref_id,
- );
- $result = chado_select_record('cvterm_dbxref', array('*'), $values);
- if (count($result) == 0) {
- $ins_options = array('return_record' => FALSE);
- $result = chado_insert_record('cvterm_dbxref', $values, $ins_options);
- if (!$result) {
- throw new Exception("Cannot add cvterm_dbxref: $xref");
- }
- }
- return TRUE;
- }
- /**
- * Adds a property to a cvterm
- *
- * @param cvterm
- * A database object for the cvterm to which properties will be added
- * @param $property
- * The name of the property to add
- * @param $value
- * The value of the property
- * @param rank
- * The rank of the property
- *
- * @ingroup tripal_obo_loader
- */
- private function addCvtermProp($cvterm, $property, $value, $rank) {
- // make sure the 'cvterm_property_type' CV exists
- $cv = tripal_insert_cv('cvterm_property_type', '');
- if (!$cv) {
- throw new Exception("Cannot add/find cvterm_property_type cvterm");
- }
- // get the property type cvterm. If it doesn't exist then we want to add it
- $values = array(
- 'name' => $property,
- 'cv_id' => $cv->cv_id,
- );
- $results = chado_select_record('cvterm', array('*'), $values);
- if (count($results) == 0) {
- $term = array(
- 'name' => $property,
- 'id' => "internal:$property",
- 'definition' => '',
- 'is_obsolete' => 0,
- 'cv_name' => $cv->name,
- 'is_relationship' => FALSE,
- );
- $cvproptype = tripal_insert_cvterm($term, array('update_existing' => FALSE));
- if (!$cvproptype) {
- throw new Exception("Cannot add cvterm property: internal:$property");
- }
- }
- else {
- $cvproptype = $results[0];
- }
- // remove any properties that currently exist for this term. We'll reset them
- if ($rank == 0) {
- $values = array('cvterm_id' => $cvterm->cvterm_id);
- $success = chado_delete_record('cvtermprop', $values);
- if (!$success) {
- throw new Exception("Could not remove existing properties to update property $property for term\n");
- }
- }
- // now add the property
- $values = array(
- 'cvterm_id' => $cvterm->cvterm_id,
- 'type_id' => $cvproptype->cvterm_id,
- 'value' => $value,
- 'rank' => $rank,
- );
- $options = array('return_record' => FALSE);
- $result = chado_insert_record('cvtermprop', $values, $options);
- if (!$result) {
- throw new Exception("Could not add property $property for term\n");
- }
- return TRUE;
- }
- /**
- * Adds a database cross reference to a cvterm
- *
- * @param db_id
- * The database ID of the cross reference
- * @param accession
- * The cross reference's accession
- * @param $version
- * The version of the dbxref
- * @param $description
- * The description of the cross reference
- *
- * @ingroup tripal_obo_loader
- */
- private function addDbxref($db_id, $accession, $version='', $description='') {
- // check to see if the dbxref exists if not, add it
- $values = array(
- 'db_id' => $db_id,
- 'accession' => $accession,
- );
- $result = chado_select_record('dbxref', array('dbxref_id'), $values);
- if (count($result) == 0) {
- $ins_values = array(
- 'db_id' => $db_id,
- 'accession' => $accession,
- 'version' => $version,
- 'description' => $description,
- );
- $ins_options = array('return_record' => FALSE);
- $result = chado_insert_record('dbxref', $ins_values, $ins_options);
- if (!$result) {
- throw new Exception("Failed to insert the dbxref record $accession");
- }
- $result = chado_select_record('dbxref', array('dbxref_id'), $values);
- }
- return $result[0];
- }
- /**
- * API call to Ontology Lookup Service provided by
- * https://www.ebi.ac.uk/ols/docs/api#resources-terms
- *
- * @param accession
- * Accession term for query
- * @param type_of_search
- * Either ontology, term, query, or query-non-local
- *
- * @ingroup tripal_obo_loader
- */
- private function oboEbiLookup($accession, $type_of_search) {
- //Grab just the ontology from the $accession.
- $parts = explode(':', $accession);
- $ontology = strtolower($parts[0]);
- $ontology = preg_replace('/\s+/', '', $ontology);
- if ($type_of_search == 'ontology') {
- $options = array();
- $full_url = 'http://www.ebi.ac.uk/ols/api/ontologies/' . $ontology;
- $response = drupal_http_request($full_url, $options);
- if(!empty($response)){
- $response = drupal_json_decode($response->data);
- }
- }
- elseif ($type_of_search == 'term') {
- //The IRI of the terms, this value must be double URL encoded
- $iri = urlencode(urlencode("http://purl.obolibrary.org/obo/" . str_replace(':' , '_', $accession)));
- $options = array();
- $full_url = 'http://www.ebi.ac.uk/ols/api/ontologies/' . $ontology . '/' . 'terms/' . $iri;
- $response = drupal_http_request($full_url, $options);
- if(!empty($response)){
- $response = drupal_json_decode($response->data);
- }
- }
- elseif($type_of_search == 'query') {
- $options = array();
- $full_url = 'http://www.ebi.ac.uk/ols/api/search?q=' . $accession . '&queryFields=obo_id&local=true';
- $response = drupal_http_request($full_url, $options);
- if(!empty($response)){
- $response = drupal_json_decode($response->data);
- }
- }
- elseif($type_of_search == 'query-non-local') {
- $options = array();
- $full_url = 'http://www.ebi.ac.uk/ols/api/search?q=' . $accession . '&queryFields=obo_id';
- $response = drupal_http_request($full_url, $options);
- if(!empty($response)){
- $response = drupal_json_decode($response->data);
- }
- }
- return $response;
- }
- }
- /**
- * Ajax callback for the OBOImporter::form() function.
- */
- function tripal_cv_obo_form_ajax_callback($form, $form_state) {
- return $form['obo_existing'];
- }
|