| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647 | 
							- <?php
 
- /**
 
-  * Form to initialize an align library tripal job
 
-  */
 
- function tripal_gbrowse_align_features_form ($form_state) {
 
-   $form = array();
 
-   
 
-   // compile all analysis' as options
 
-   $analysis_options = array();
 
-   $results = tripal_core_chado_select('analysis',array('analysis_id','name', 'program'), array());
 
-   foreach ($results as $r) {
 
-     $analysis_options[ 'A'.$r->analysis_id ] = $r->name .' --'.$r->program;
 
-   }
 
-   
 
-   // compile all libraries as options
 
-   $library_options = array();
 
-   $results = tripal_core_chado_select('library',array('library_id','name', 'uniquename'), array());
 
-   foreach ($results as $r) {
 
-     $library_options[ 'L'.$r->library_id ] = $r->name .' --'.$r->uniquename;
 
-   }  
 
-   
 
-   $form['description'] = array(
 
-     '#type' => 'item',
 
-     '#value' => 'This form allows you to select a query library/analysis and align the '
 
-       .'features that are part of that query library/analysis against those from a database '
 
-       .'library/analysis using BLAST. Depending upon the Alignment Criteria, the top BLAST '
 
-       .'result(s) for each query feature will be used to determine the location of the query '
 
-       .'feature on a database feature.',
 
-   );
 
-   
 
-   $form['q'] = array(
 
-     '#type' => 'fieldset',
 
-     '#title' => 'Features to be Aligned (Query)',
 
-     '#description' => 'Please select the library or analysis below which groups the features you '
 
-       .'want aligned together.',
 
-   );
 
-   
 
-   $form['q']['query'] = array(
 
-     '#type' => 'select',
 
-     '#title' => 'Query Features',
 
-     '#options' => array(
 
-       'Libraries' => $library_options,
 
-       "Analaysis'" => $analysis_options
 
-     ),
 
-     '#default_value' => $form_state['values']['query'],
 
-   );
 
-   
 
-   $form['d'] = array(
 
-     '#type' => 'fieldset',
 
-     '#title' => 'Features to Align To (Database)',
 
-     '#description' => 'Please select the library of analysis below, which contains the features '
 
-       .'you want to align the query features selected above to. Only features in the selected '
 
-       .'library/analysis with sequence data will be used.',
 
-   );
 
-   $form['d']['database'] = array(
 
-     '#type' => 'select',
 
-     '#title' => 'Database Features',
 
-     '#options' => array(
 
-       'Libraries' => $library_options,
 
-       "Analaysis'" => $analysis_options
 
-     ),
 
-     '#default_value' => $form_state['values']['database'],
 
-   );
 
-   
 
-   $form['b'] = array(
 
-     '#type' => 'fieldset',
 
-     '#title' => 'Alignment Criteria',
 
-   );
 
-   
 
-   $form['b']['program'] = array(
 
-   	'#type' => 'radios',
 
-   	'#title' => 'Alignment Program',
 
-   	'#options' => array(
 
-   		'blast' => 'BLAST',
 
-   		'blat' => 'BLAT',
 
-   	),
 
-   	'#default_value' => 'blat',
 
-   );
 
-   $form['b']['blat'] = array(
 
-   	'#type' => 'fieldset',
 
-   	'#title' => 'BLAT Options',
 
-   	'#collapsible' => TRUE,
 
- 		'#collapsed' => TRUE,
 
-   );
 
-   
 
-   $form['b']['blat']['min_identity'] = array(
 
-   	'#type' => 'textfield',
 
-   	'#title' => 'Minimum Identity',
 
-   	'#default_value' => '90',
 
-   );
 
-   
 
-   $form['b']['blast'] = array(
 
-   	'#type' => 'fieldset',
 
-   	'#title' => 'BLAST Options',
 
-   	'#collapsible' => TRUE,
 
- 		'#collapsed' => TRUE,
 
-   );
 
-   
 
-   $form['b']['blast']['gapped_alignment'] = array(
 
-   	'#type' => 'checkbox',
 
-   	'#title' => 'Gapped Alignment?',
 
-   	'#default_value' => TRUE,
 
-   );
 
-   
 
-   $form['b']['blast']['evalue'] = array(
 
-   	'#type' => 'textfield',
 
-   	'#title' => 'Expectation Values (E-value) Cutoff',
 
-   	'#description' => 'To enter in scientific notation (ie: 5 x 10-6), enter [base number]e[power] (ie: 5e-6)',
 
-   	'#default_value' => 10.0
 
-   );
 
-   
 
-   $form['g'] = array(
 
-   	'#type' => 'fieldset',
 
-   	'#title' => 'GBrowse Information',
 
-   );
 
-   
 
-   $form['g']['source'] = array(
 
-   	'#type' => 'textfield',
 
-   	'#title' => 'Source of Features',
 
-   	'#description' => 'The source of the features grouped by the selected query library'
 
-   );
 
-   
 
-   //Sending query to the database
 
-   $resource = db_query('SELECT * FROM {tripal_gbrowse_instances}');
 
- 	$items = array();
 
- 	while($record = db_fetch_object($resource)){
 
- 		$items[$record->gbrowse_id]= $record->gbrowse_name;
 
- 	}
 
-    
 
-   //GBrowse Instances
 
-   $form['g']['gbrowse_id'] = array(
 
-     '#type' => 'select',
 
-     '#title' => t('GBrowse Instances'),
 
-     '#options' => $items,
 
-     '#description' => t('Selected GBrowse Instances to load the query features into.'),
 
-   );
 
-   
 
-   $form['submit'] = array(
 
-     '#type' => 'submit',
 
-     '#name' => 'align',
 
-     '#value' => 'Align Features',
 
-   );
 
-   
 
-   return $form;
 
- }
 
- /**
 
-  * Form submit to initialize an align library tripal job
 
-  */
 
- function tripal_gbrowse_align_features_form_submit ($form, &$form_state) {
 
-   
 
-   switch($form_state['clicked_button']['#name']) {
 
-     case 'align':
 
-       $options = array();
 
-       // Query
 
-       if (preg_match('/(L|A)(\d+)/',$form_state['values']['query'], $matches)) {
 
-         if ($matches[1] == 'L') {
 
-           $options['query_type'] = 'library';
 
-         } else {
 
-           $options['query_type'] = 'analysis';
 
-         }
 
-         $options['query_id'] = $matches[2];
 
-       }
 
-       
 
-       // Database
 
-       if (preg_match('/(L|A)(\d+)/',$form_state['values']['database'], $matches)) {
 
-         if ($matches[1] == 'L') {
 
-           $options['db_type'] = 'library';
 
-         } else {
 
-           $options['db_type'] = 'analysis';
 
-         }
 
-         $options['db_id'] = $matches[2];
 
-       } 
 
-       
 
-       $options['source'] = $form_state['values']['source'];
 
-       
 
-       // db options
 
-       $sql = 'SELECT * FROM {tripal_gbrowse_instances} WHERE gbrowse_id = %d';
 
-       $r = db_fetch_object(db_query($sql,$form_state['values']['gbrowse_id']));
 
-       $options['dbname'] = $r->database_name;
 
-       $options['dbuser'] = $r->database_user;
 
-       $options['dbpass'] = $r->user_password;
 
- 			if ($form_state['values']['program'] == 'blat') { 
 
- 				// blat options
 
- 				$options['min_identity'] = $form_state['values']['min_identity'];
 
- 				
 
- 				global $user;
 
- 				tripal_add_job(
 
- 					'Align '.$options['query_type'].' features ('.$options['query_type'].'_id='.$options['query_id'].')',
 
- 					'tripal_gbrowse',
 
- 					'tripal_gbrowse_align_features_by_blat',
 
- 					array(serialize($options)),
 
- 					$user->uid
 
- 				);			
 
- 			} elseif ($form_state['values']['program'] == 'blast') {      
 
- 				// blast options
 
- 				$options['evalue'] = $form_state['values']['evalue'];
 
- 				$options['gapped_alignment'] = $form_state['values']['gapped_alignment'];
 
- 			
 
- 				global $user;
 
- 				tripal_add_job(
 
- 					'Align '.$options['query_type'].' features ('.$options['query_type'].'_id='.$options['query_id'].')',
 
- 					'tripal_gbrowse',
 
- 					'tripal_gbrowse_align_features_by_blast',
 
- 					array(serialize($options)),
 
- 					$user->uid
 
- 				);
 
-       }
 
-       
 
-     break;
 
-   }
 
- }
 
- /**
 
-  * Aligns feature from a query library/analysis to a database library/analysis,
 
-  * saving the results as a GFF3 file and then loading it into the selected gbrowse instance
 
-  *
 
-  * @param $options
 
-  *   An array containing options needed to align features and create featurelocs
 
-  *    -query_type: the type of chado grouping containing query features (either library or analysis)
 
-  *    -query_id: the library_id/analysis_id containing the query features
 
-  *    -db_type: the type of chado grouping containing database features (either library or analysis)
 
-  *    -db_id: the library_id/analysis_id containing the database features
 
-  *    -dbname: name of the MySQL GBrowse database to load into
 
-  *    -dbuser: name of the user with permission to load into the above database
 
-  *    -dbpass: the password for the above user
 
-  */
 
- function tripal_gbrowse_align_features_by_blast ($options) {
 
-   $options = unserialize($options);
 
-   print 'Query: '.$options['query_type'].' where '.$options['query_type'].'_id='.$options['query_id']."\n";
 
-   print 'Database: '.$options['db_type'].' where '.$options['db_type'].'_id='.$options['db_id']."\n";
 
-   
 
-   // Generate FASTA ---------------------------------------
 
-   print "\nGenerating fasta files for query and database...\n";
 
-   $query_file = tripal_gbrowse_export_fasta_for_features( $options['query_type'], $options['query_id'], TRUE );
 
-   print "\t".$query_file['file']."\n";
 
-   
 
-   $db_file = tripal_gbrowse_export_fasta_for_features( $options['db_type'], $options['db_id'], TRUE, TRUE );
 
-   print "\t".$db_file['file']."\n";
 
-   
 
-   // Align using BLAST ------------------------------------
 
-   print "\nAligning features using BLAST...\n";
 
-   
 
-   print "\tFormating Database FASTA into BLASTdb...\n";
 
-   $db = '/tmp/exported_'.$options['db_type'].'_'.$options['db_id'];
 
-   $formatdb_cmd = 'formatdb -n '.$db.' -p F -i '.$db_file['file'];
 
- 	print "\t\t".$formatdb_cmd."\n";  
 
-   exec($formatdb_cmd);
 
- 	
 
- 	print "\tExecuting BLAST...\n";
 
- 	$blast_outfile = $db.'_by_'.$options['query_type'].'_'.$options['query_id'].'.blast.xml';
 
- 	$blastall_cmd = 'blastall -p blastn -d '.$db.' -i '.$query_file['file'].' -m 7 -o '.$blast_outfile.' -e '.$options['evalue'];
 
- 	if ($options['gapped_alignment']) {
 
- 		$blastall_cmd .= ' -g';
 
- 	}
 
- 	print "\t\t".$blastall_cmd."\n";
 
- 	exec($blastall_cmd);
 
-   
 
-   // Parse BLAST results ----------------------------------
 
-   print "\nParsing Blast Results into GFF3...\n";
 
-   $gff3_file = $db.'_by_'.$options['query_type'].'_'.$options['query_id'].'.gff3';
 
-   $fgff3 = fopen($gff3_file, 'w');
 
-   fwrite($fgff3, "##gff-version 3\n");
 
-   $iteration = tripal_gbrowse_get_next_xml_record ($blast_outfile, "<Iteration>");
 
-   while ($iteration) {
 
-   	//print "Record:".$iteration['record']->asXML()."\n";
 
-   	//print "Query: ".$iteration['record']->{'Iteration_query-def'}."\n";
 
- 		
 
- 		// Find the best Hit by looking at the bit scores of the hsps
 
- 		// the larger the bit score the better the alignment
 
- 		$hits = array();
 
- 		$scores = array();
 
-   	foreach ($iteration['record']->Iteration_hits->Hit as $hit) {
 
-   		$score = 0;
 
-   		$num = 0;
 
-   		foreach ($hit->{'Hit_hsps'}->{'Hsp'} as $hsp) {
 
-   			//print 'HSP:'.$hsp->asXML()."\n";
 
-   			$score = $score + $hsp->{'Hsp_bit-score'};
 
-   			$num++;
 
-   		}
 
-   		$avg = round($score / $num,2);
 
-   		$hit->{'Hit_bit-score'} = $avg;
 
-   		$hits[] = array('score' => $avg, 'hit' => $hit);
 
-   	}
 
-   	usort($hits, 'tripal_gbrowse_sort_by_score');
 
-   	$best_hit = $hits[0]['hit'];
 
-   	//print "\tBest Hit:".$best_hit->Hit_def.' ('.$best_hit->{'Hit_bit-score'}.")\n";
 
-   	
 
-   	// generate gff3 for the best hit 
 
-   	$query_name = $iteration['record']->{'Iteration_query-def'};
 
-   	$db_name = $best_hit->Hit_def;  
 
-   	if (isset($db_file['noseq_features'][$db_name])) {
 
-   	  $db_offset = $db_file['noseq_features'][$db_name]['start'];
 
-   	  $db_name = $db_file['noseq_features'][$db_name]['parent']['uniquename'];
 
-   	} else {
 
-   	  $db_offset = 0;
 
-   	}
 
- 		$lines = array();
 
- 		$hit_start = 99999999999999999999;
 
- 		$hit_end = 0;
 
-   	foreach ($best_hit->{'Hit_hsps'}->{'Hsp'} as $hsp) {
 
-   		if ($hit_start > (int) $hsp->{'Hsp_hit-from'}[0]) { $hit_start = (int) $hsp->{'Hsp_hit-from'}[0]; } 
 
-   		if ($hit_end < (int) $hsp->{'Hsp_hit-to'}[0]) { $hit_end = (int) $hsp->{'Hsp_hit-to'}; }
 
-   		$lines[] = implode("\t", array(
 
-   			$db_name, 
 
-   			$options['source'],
 
-   			'match_part',
 
-   			$hsp->{'Hsp_hit-from'} + $db_offset,
 
-   			$hsp->{'Hsp_hit-to'} + $db_offset,
 
-   			$hsp->{'Hsp_bit-score'},
 
-   			'.',
 
-   			'.',
 
-   			'ID='.$query_name.'_'.$hsp->{'Hsp_num'}.';Parent='.$query_name
 
-   		))."\n";
 
-   	}
 
-   	fwrite($fgff3, implode("\t", array(
 
- 			$db_name, 
 
- 			$options['source'],
 
- 			'match',
 
- 			$hit_start + $db_offset,
 
- 			$hit_end + $db_offset,
 
- 			$best_hit->{'Hit_bit-score'},
 
- 			'.',
 
- 			'.',
 
- 			'ID='.$query_name.';Name='.$query_name
 
- 		))."\n");
 
- 		fwrite($fgff3,implode('',$lines));
 
-   	
 
-   	// get next iteration xml record
 
-   	$last_iteration = $iteration;
 
-   	//print "Getting Iteration...\n";
 
-   	$iteration = tripal_gbrowse_get_next_xml_record ($blast_outfile, "<Iteration>", $last_iteration['start_line_num']);
 
-   }
 
-   
 
-   print "\nLoading GFF3 into GBrowse...\n";
 
-   //The loading script: bp_seqfeature_load.pl, allows loading of data to specific file 
 
-   $command= "bp_seqfeature_load.pl -u '" .$options['dbuser']. "' -p '" .$options['dbpass']. "' -d " .$options['dbname']. " " . $gff3_file;
 
-   print "\t".$command."\n";
 
-   exec($command);
 
- }
 
- /**
 
-  * Aligns feature from a query library/analysis to a database library/analysis,
 
-  * saving the results as a GFF3 file and then loading it into the selected gbrowse instance
 
-  *
 
-  * @param $options
 
-  *   An array containing options needed to align features and create featurelocs
 
-  *    -query_type: the type of chado grouping containing query features (either library or analysis)
 
-  *    -query_id: the library_id/analysis_id containing the query features
 
-  *    -db_type: the type of chado grouping containing database features (either library or analysis)
 
-  *    -db_id: the library_id/analysis_id containing the database features
 
-  *    -dbname: name of the MySQL GBrowse database to load into
 
-  *    -dbuser: name of the user with permission to load into the above database
 
-  *    -dbpass: the password for the above user
 
-  */
 
- function tripal_gbrowse_align_features_by_blat ($options,$job_id) {
 
-   $options = unserialize($options);
 
-   print 'Query: '.$options['query_type'].' where '.$options['query_type'].'_id='.$options['query_id']."\n";
 
-   print 'Database: '.$options['db_type'].' where '.$options['db_type'].'_id='.$options['db_id']."\n";
 
-   
 
-   // Generate FASTA ---------------------------------------
 
-   print "\nGenerating fasta files for query and database...\n";
 
-   $query_file = tripal_gbrowse_export_fasta_for_features( $options['query_type'], $options['query_id'], TRUE );
 
-   print "\t".$query_file['file']."\n";
 
-   tripal_job_set_progress($job_id, 12);
 
-   
 
-   $db_file = tripal_gbrowse_export_fasta_for_features( $options['db_type'], $options['db_id'], TRUE, TRUE );
 
-   print "\t".$db_file['file']."\n";
 
-   tripal_job_set_progress($job_id, 25);
 
-   
 
-   // Align using BLAT ------------------------------------
 
-   print "\nAligning features using BLAT...\n";
 
- 	$blat_outfile = '/tmp/alignment_'.$options['db_type'].'-'.$options['db_id'].'_by_'.$options['query_type'].'-'.$options['query_id'].'.psl';
 
- 	$blat_cmd = 'blat '.$db_file['file'].' '.$query_file['file'].' -q=dnax -t=dnax -noHead -minIdentity='.$options['min_identity'].' '.$blat_outfile;
 
- 	print "\t\t".$blat_cmd."\n";
 
- 	exec($blat_cmd);
 
- 	tripal_job_set_progress($job_id, 50);
 
- 	
 
- 	// Parse BLAST results ----------------------------------
 
- 	$total_lines = trim(`wc --lines < $blat_outfile`);
 
- 	$interval = intval($total_lines/5);
 
- 	$percent_per_line = 25/$total_lines;
 
- 	$num_lines = 0;
 
- 	$query_seq = array();
 
- 	
 
- 	print "\nParsing BLAT results into GFF3 (".$total_lines." lines)...\n";
 
- 	$gff3_file = '/tmp/alignment_'.$options['db_type'].'-'.$options['db_id'].'_by_'.$options['query_type'].'-'.$options['query_id'].'.gff3';
 
-   $fgff3 = fopen($gff3_file, 'w');
 
-   fwrite($fgff3, "##gff-version 3\n");
 
- 	$bh = fopen($blat_outfile, 'r');
 
- 	while (!feof($bh)) {
 
- 		$line = explode("\t", fgets($bh));
 
- 		$num_lines++;
 
- 		if (($num_lines%$interval) == 0) { tripal_job_set_progress($job_id, intval($percent_per_line * $num_lines)); }
 
- 		
 
- 		$print_match = TRUE;
 
-     $db_name = $line[13];
 
-   	if (isset($db_file['noseq_features'][$db_name])) {
 
-   	  $db_offset = $db_file['noseq_features'][$db_name]['start'];
 
-   	  $db_name = $db_file['noseq_features'][$db_name]['parent']['uniquename'];
 
-   	} else {
 
-   	  $db_offset = 0;
 
-   	}
 
-   	
 
-   	$query_id = $line[9];
 
-   	if (!isset($query_seq[ $line[9] ])) {
 
-   		$query_seq[ $line[9] ]['id'] = 0;
 
-   		$query_seq[ $line[9] ]['start'] = $line[15] + $db_offset;
 
-   		$query_seq[ $line[9] ]['end'] = $line[16] + $db_offset;
 
-   		$query_id .= '_0';
 
-   	} elseif ( abs($line[15]+$db_offset-$query_seq[ $line[9] ]['start']) < 5 ) {
 
-   		$print_match = FALSE;
 
-   		$query_id .= '_' . $query_seq[ $line[9] ]['id'];
 
-   	}else {
 
-   		$query_seq[ $line[9] ]['id']++;
 
-   		$query_id .= '_' . $query_seq[ $line[9] ]['id'];
 
-   	}
 
-   	
 
- 		// match line
 
- 		if ($print_match) {
 
- 			fwrite($fgff3, implode("\t", array(
 
- 				$db_name, 
 
- 				$options['source'],
 
- 				'match',
 
- 				$line[15] + $db_offset,
 
- 				$line[16] + $db_offset,
 
- 				'.',
 
- 				$line[8][1],
 
- 				'.',
 
- 				'ID='.$query_id.';Name='.$line[9]
 
- 			))."\n");
 
- 		}
 
- 		
 
- 		// match parts
 
- 		$parts_size = explode(',',trim($line[18]));
 
- 		$parts_start = explode(',',trim($line[20]));
 
- 		foreach ($parts_size as $k => $length) {
 
- 			if (!empty($parts_start[$k])) {
 
- 				fwrite($fgff3, implode("\t", array(
 
- 					$db_name, 
 
- 					$options['source'],
 
- 					'match_part',
 
- 					$parts_start[$k] + $db_offset,
 
- 					$parts_start[$k] + $length + $db_offset,
 
- 					'.',
 
- 					$line[8][1],
 
- 					'.',
 
- 					'ID='.$query_id.'_'.$k.';Parent='.$query_id
 
- 				))."\n");
 
-   		}
 
-   		
 
- 		}
 
- 	}
 
- 	tripal_job_set_progress($job_id, 75);
 
- 	
 
- 	// Load into GBrowse ------------------------------------
 
-   print "\nLoading GFF3 into GBrowse...\n";
 
-   //The loading script: bp_seqfeature_load.pl, allows loading of data to specific file 
 
-   $command= "bp_seqfeature_load.pl -u '" .$options['dbuser']. "' -p '" .$options['dbpass']. "' -d " .$options['dbname']. " " . $gff3_file;
 
-   print "\t".$command."\n";
 
- 	exec($command);
 
- }
 
- /**
 
-  * Creates a fasta file for a given chado grouping of features
 
-  *
 
-  * @param $type
 
-  *   The type of chado grouping. Allowed values are either library or analysis
 
-  * @param $id
 
-  *   The library_id/analysis_id of the chado grouping
 
-  * @return
 
-  *   The name of the multi-fasta file containing records for all features with residues
 
-  *   in the supplied library/analysis
 
-  */
 
- function tripal_gbrowse_export_fasta_for_features ($type, $id, $use_parent_seq = FALSE, $save_offset = FALSE) {
 
-   $fasta_file = '/tmp/exported_fasta-'.$type.'-'.$id.'.fasta';
 
-   $noseq_features = array();
 
-   
 
-   $fh = fopen($fasta_file,'w');
 
-   
 
-   $sql = 'SELECT f.uniquename, f.residues, fl.fmin, fl.fmax, fl.srcfeature_id as parent_feature_id FROM feature f '
 
-   	.'LEFT JOIN featureloc fl ON fl.feature_id=f.feature_id ';
 
-   $parent_sql = 'SELECT p.feature_id as parent_feature_id, p.uniquename as parent_uniquename, count(fl.feature_id) FROM feature p '
 
-   	.'LEFT JOIN featureloc fl ON fl.srcfeature_id=p.feature_id '
 
-   	."WHERE fl.feature_id IN (SELECT feature_id FROM feature WHERE residues='') AND ";
 
-   if ($type == 'library') { 
 
-   	$sql .= 'LEFT JOIN library_feature lf ON f.feature_id=lf.feature_id WHERE lf.library_id=%d';
 
-   	$parent_sql .= 'fl.feature_id IN (SELECT feature_id FROM library_feature WHERE library_id=%d) GROUP BY p.uniquename, p.feature_id';
 
-     
 
-   } elseif ($type == 'analysis') {
 
-   	$sql .= 'LEFT JOIN analysisfeature af ON f.feature_id=af.feature_id WHERE af.analysis_id=%d';
 
- 		$parent_sql .= 'fl.feature_id IN (SELECT feature_id FROM analysisfeature WHERE analysis_id=%d) GROUP BY p.uniquename, p.feature_id';
 
-     $resource = db_query($sql, $id);
 
-   } else {
 
-     print "ERROR: Unable to generate FASTA due to unrecognized type -".$type."!\n";
 
-     return FALSE;
 
-   }
 
-   
 
-   // check if some don't have sequence but are aligned on a parent who does
 
- 	//print "SQL: ".$parent_sql."\n";
 
-   $resource = db_query($parent_sql, $id);
 
- 	$parent_seq = array();
 
- 	$residues_seq = 'SELECT residues FROM feature WHERE feature_id=%d';
 
-   while ($r = db_fetch_object($resource)) {
 
-   	//print 'Creating index for '.$r->parent_feature_id. " (".$r->parent_uniquename.")\n";
 
-   	$seq = db_fetch_object(db_query($residues_seq, $r->parent_feature_id));
 
-   	//print "Residues:".$seq->residues."\n";
 
-   	if (!empty($seq->residues)) {
 
- 	  	//print "\tGot Seq!\n";
 
- 	  }
 
- 		$parent_seq[ $r->parent_feature_id ] = array(
 
- 			'residues' => $seq->residues,
 
- 			'uniquename' => $r->parent_uniquename
 
- 		);
 
-   }
 
-   
 
- 	$resource = db_query($sql, $id);
 
-   while ($r = db_fetch_object($resource)) {
 
-     if (!empty($r->residues)) {
 
-       fwrite($fh, '>'.$r->uniquename."\n");
 
-       fwrite($fh, wordwrap($r->residues,80,"\n",TRUE)."\n");
 
-     } else {
 
- 	    //print $r->uniquename." (based on ".$r->parent_feature_id.' -'.$parent_seq[$r->parent_feature_id]['uniquename'].")\n";
 
-       if (!empty($parent_seq[$r->parent_feature_id]['residues'])) {
 
-       	//print "\tHave Seq\n";
 
-       	fwrite($fh, '>'.$r->uniquename." (based on ".$parent_seq[$r->parent_feature_id]['uniquename'].")\n");
 
-         $seq = substr($parent_seq[$r->parent_feature_id]['residues'], $r->fmin, $r->fmax - $r->fmin);
 
-         fwrite($fh, wordwrap($seq,80,"\n",TRUE)."\n");
 
-         if ($save_offset) {
 
-           $noseq_features[ $r->uniquename ] = array(
 
-             'start' => $r->fmin,
 
-             'end' => $r->fmax,
 
-             'parent' => array(
 
-               'uniquename' => $parent_seq[$r->parent_feature_id]['uniquename'],
 
-             ),
 
-           );
 
-         }
 
-       }
 
-     }
 
-   }
 
-   
 
-   fclose($fh);
 
-   return array(
 
-     'file' => $fasta_file,
 
-     'noseq_features' => $noseq_features
 
-   );
 
- }
 
- /**
 
-  * Retrieves the next xml record with $record_identifier
 
-  *
 
-  * Assumption: the end tag for $record_identifier is one line before the next opening tag
 
-  * @param $xml_file
 
-  *   The file containing the xml records; must supply the full path
 
-  * @param $record_identifier
 
-  *   The opening tag enclosing a record (ie: <Iteration>)
 
-  * @param $last_record_line_num
 
-  *   The line number of the openin tag for the last record
 
-  * 
 
-  * @return
 
-  *   An array describing the next xml record
 
-  *    -record: the simpleXML record
 
-  *    -start_line_num: the line number in the file that this record starts at
 
-  *    -end_line_num: the line number in the file that this record ends at
 
-  */
 
- function tripal_gbrowse_get_next_xml_record ($xml_file, $record_identifier, $last_record_line_num = NULL) {
 
- 	// If first record ------------------------------------------------
 
- 	if (!$last_record_line_num) {
 
- 		$cmd = 'grep -n "'.$record_identifier.'" -m 2 '.$xml_file;
 
- 		exec($cmd, $line_num_raw);
 
- 		// get start of next record
 
- 		if (preg_match('/(\d+):.*/',$line_num_raw[0],$matches)) {
 
- 			$start = $matches[1];
 
- 		} else {
 
- 			return FALSE;
 
- 		}
 
- 		// get end of next record
 
- 		if (preg_match('/(\d+):.*/',$line_num_raw[1],$matches)) {
 
- 			$end = $matches[1] -1;
 
- 		} else {
 
- 			return FALSE;
 
- 		}
 
- 	// If not first record --------------------------------------------
 
- 	} else {
 
- 		$cmd = 'tail --lines=+'.($last_record_line_num+1).' '.$xml_file.' 2>/dev/null | grep -n "'.$record_identifier.'" -m 2 2>/dev/null ';
 
- 		exec($cmd, $line_num_raw);
 
- 		// get start of next record
 
- 		if (preg_match('/(\d+):.*/',$line_num_raw[0],$matches)) {
 
- 			$start = $matches[1] + $last_record_line_num;
 
- 		} else {
 
- 			return FALSE;
 
- 		}
 
- 		// get end of next record
 
- 		if (preg_match('/(\d+):.*/',$line_num_raw[1],$matches)) {
 
- 			$end = $matches[1] + $last_record_line_num -1;
 
- 		} else {
 
- 			return FALSE;
 
- 		}
 
- 		
 
- 	}
 
- 	
 
- 	$cmd = 'tail --lines=+'.$start.' '.$xml_file.' 2>/dev/null | head -n '.($end-$start+1).' 2>/dev/null';
 
- 	exec($cmd, $xml);
 
- 	
 
- 	//print "XML:".implode("\n",$xml)."\n";
 
- 	if (!$xml) {
 
- 		return FALSE;
 
- 	}
 
- 	
 
- 	$xml_record = new SimpleXMLElement(implode("\n",$xml));
 
- 	return array(
 
- 		'record' => $xml_record,
 
- 		'start_line_num' => $start,
 
- 		'end_line_num' => $end,
 
- 	);
 
- }
 
- /**
 
-  * Custom sort function to be used with usort
 
-  * Sorts an array( 'score' => \d+, 'hit' => simplexml obj)
 
-  */
 
- function tripal_gbrowse_sort_by_score ($a, $b) {
 
- 	if ($a['score'] == $b['score']) {
 
- 		return 0;
 
- 	} elseif ($a['score'] < $b['score']) {
 
- 		return 1;
 
- 	} else {
 
- 		return -1;
 
- 	}
 
- }
 
 
  |