123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083 |
- <?php
- function tripal_bulk_loader_add_loader_job_form($form_state, $node) {
- $form = array();
-
- if ($node->job_status == 'Loading...') {
- $progress = tripal_bulk_loader_progess_file_get_progress($node->job_id);
- drupal_set_message(t("The Loading Summary only updates at the end of each constant set.
- %num records have already been inserted; however, they won't be available until the
- current constant set is full loaded and no errors are encountered.", array('%num' => $progress->num_records)), 'warning');
- }
- $form['nid'] = array(
- '#type' => 'hidden',
- '#value' => $node->nid,
- );
- $form['file'] = array(
- '#type' => 'hidden',
- '#value' => $node->file
- );
- $form['job_id'] = array(
- '#type' => 'hidden',
- '#value' => $node->job_id,
- );
- $form['submit'] = array(
- '#type' => 'submit',
- '#value' => ($node->job_id) ? 'Re-Submit Job' : 'Submit Job',
- );
- $form['submit-cancel'] = array(
- '#type' => ($node->job_id)? 'submit' : 'hidden',
- '#value' => 'Cancel Job',
- );
- if ($node->keep_track_inserted) {
- $form['submit-revert'] = array(
- '#type' => ($node->job_id) ? 'submit' : 'hidden',
- '#value' => 'Revert',
- );
- }
- return $form;
- }
- function tripal_bulk_loader_add_loader_job_form_submit($form, $form_state) {
- global $user;
- if (preg_match('/Submit Job/', $form_state['values']['op'])) {
-
- $job_args[1] = $form_state['values']['nid'];
- if (is_readable($form_state['values']['file'])) {
- $fname = basename($form_state['values']['file']);
- $job_id = tripal_add_job("Bulk Loading Job: $fname", 'tripal_bulk_loader', 'tripal_bulk_loader_load_data', $job_args, $user->uid);
-
- $success = db_query("UPDATE {tripal_bulk_loader} SET job_id=%d WHERE nid=%d", $job_id, $form_state['values']['nid']);
-
- db_query("UPDATE {tripal_bulk_loader} SET job_status='%s' WHERE nid=%d", 'Submitted to Queue', $form_state['values']['nid']);
- }
- else {
- drupal_set_message(t("Can not open %file. Job not scheduled.", array('%file' => $form_state['values']['file'])));
- }
- }
- elseif (preg_match('/Re-Submit Job/', $form_state['values']['op'])) {
- tripal_jobs_rerun($form_state['values']['job_id']);
- db_query("UPDATE {tripal_bulk_loader} SET job_status='%s' WHERE nid=%d", 'Submitted to Queue', $form_state['values']['nid']);
- }
- elseif (preg_match('/Cancel Job/', $form_state['values']['op'])) {
- db_query("UPDATE {tripal_bulk_loader} SET job_status='%s' WHERE nid=%d", 'Job Cancelled', $form_state['values']['nid']);
- tripal_jobs_cancel($form_state['values']['job_id']);
- }
- elseif (preg_match('/Revert/', $form_state['values']['op'])) {
-
- $resource = db_query('SELECT * FROM {tripal_bulk_loader_inserted} WHERE nid=%d ORDER BY tripal_bulk_loader_inserted_id DESC', $form_state['values']['nid']);
- while ($r = db_fetch_object($resource)) {
- $ids = preg_split('/,/', $r->ids_inserted);
- db_query('DELETE FROM %s WHERE %s IN (%s)', $r->table_inserted_into, $r->table_primary_key, $r->ids_inserted);
- $result = db_fetch_object(db_query('SELECT true as present FROM %s WHERE %s IN (%s)', $r->table_inserted_into, $r->table_primary_key, $r->ids_inserted));
- if (!$result->present) {
- drupal_set_message(t('Successfully Removed data Inserted into the %tableto table.', array('%tableto' => $r->table_inserted_into)));
- db_query('DELETE FROM {tripal_bulk_loader_inserted} WHERE tripal_bulk_loader_inserted_id=%d', $r->tripal_bulk_loader_inserted_id);
- }
- else {
- drupal_set_message(t('Unable to remove data Inserted into the %tableto table!', array('%tableto' => $r->table_inserted_into)), 'error');
- }
- }
-
- db_query("UPDATE {tripal_bulk_loader} SET job_status='%s' WHERE nid=%d", 'Reverted -Data Deleted', $form_state['values']['nid']);
- }
- }
- function tripal_bulk_loader_load_data($nid, $job_id) {
-
- set_time_limit(0);
-
- db_query("UPDATE {tripal_bulk_loader} SET job_status='%s' WHERE nid=%d", 'Loading...', $nid);
- $node = node_load($nid);
- print "Template: " . $node->template->name . " (" . $node->template_id . ")\n";
- $total_lines = trim(`wc --lines < $node->file`);
- print "File: " . $node->file . " (" . $total_lines . " lines)\n";
-
- print "\nPreparing to load...\n";
- $loaded_without_errors = TRUE;
-
- $default_data = array();
- $field2column = array();
- $record2priority = array();
- $tables = array();
- $template_array = $node->template->template_array;
-
- foreach ($template_array as $priority => $record_array) {
- $record2priority[$record_array['record_id']] = $priority;
- }
-
- foreach ($template_array as $priority => $record_array) {
- if (!is_array($record_array)) {
- continue;
- }
-
-
- if (preg_match('/insert/', $record_array['mode'])) {
- $tables[$record_array['table']] = $record_array['table'];
- }
-
-
- foreach ($record_array['fields'] as $field_index => $field_array) {
- $default_data[$priority]['table'] = $record_array['table'];
- $default_data[$priority]['mode'] = ($record_array['mode']) ? $record_array['mode'] : 'insert';
- $default_data[$priority]['select_if_duplicate'] = ($record_array['select_if_duplicate']) ? $record_array['select_if_duplicate'] : 0;
- $default_data[$priority]['update_if_duplicate'] = ($record_array['update_if_duplicate']) ? $record_array['update_if_duplicate'] : 0;
- $default_data[$priority]['disabled'] = ($record_array['disable']) ? $record_array['disable'] : 0;
- $default_data[$priority]['optional'] = ($record_array['optional']) ? $record_array['optional'] : 0;
- $default_data[$priority]['select_optional'] = ($record_array['select_optional']) ? $record_array['select_optional'] : 0;
- $default_data[$priority]['record_id'] = $record_array['record_id'];
- $default_data[$priority]['required'][$field_array['field']] = $field_array['required'];
- $one = $default_data[$priority];
- if (isset($field_array['regex'])) {
- $default_data[$priority]['regex_transform'][$field_array['field']] = $field_array['regex'];
- }
- $two = $default_data[$priority];
- if (preg_match('/table field/', $field_array['type'])) {
- $default_data[$priority]['values_array'][$field_array['field']] = '';
- $default_data[$priority]['need_further_processing'] = TRUE;
- $field2column[$priority][$field_array['field']] = $field_array['spreadsheet column'];
- }
- elseif (preg_match('/constant/', $field_array['type'])) {
- $default_data[$priority]['values_array'][$field_array['field']] = $field_array['constant value'];
- }
- elseif (preg_match('/foreign key/', $field_array['type'])) {
- $default_data[$priority]['values_array'][$field_array['field']] = array();
- $default_data[$priority]['need_further_processing'] = TRUE;
- $default_data[$priority]['values_array'][$field_array['field']]['foreign record']['record'] = $field_array['foreign key'];
-
- $fk_priority = $record2priority[$field_array['foreign key']];
- $fk_table = $template_array[$fk_priority]['table'];
- $default_data[$priority]['values_array'][$field_array['field']]['foreign record']['table'] = $fk_table;
-
-
-
-
- if (!array_key_exists('foreign field', $field_array)) {
- $tbl_description = tripal_core_get_chado_table_schema($record_array['table']);
- foreach ($tbl_description['foreign keys'] as $key_table => $key_array) {
- if ($key_table == $fk_table) {
- foreach ($key_array['columns'] as $left_field => $right_field) {
- if ($left_field == $field_array['field']) {
- $field_array['foreign field'] = $right_field;
- }
- }
- }
- }
- }
- $default_data[$priority]['values_array'][$field_array['field']]['foreign record']['field'] = $field_array['foreign field'];
- }
- else {
- print 'WARNING: Unsupported type: ' . $field_array['type'] . ' for ' . $table . '.' . $field_array['field'] . "!\n";
- }
- $three = $default_data[$priority];
- }
- }
-
-
-
- print "Loading...\n";
- $original_default_data = $default_data;
- $group_index = 0;
- $total_num_groups = sizeof($node->constants);
- foreach ($node->constants as $group_id => $set) {
-
- $default_data = $original_default_data;
- $group_index++;
-
- if (!empty($set)) {
- print "Constants:\n";
- foreach ($set as $priority => $record) {
- foreach ($record as $field_id => $field) {
- print "\t- " . $field['chado_table'] . '.' . $field['chado_field'] . ' = ' . $field['value'] . "\n";
- if ($default_data[$priority]['table'] == $field['chado_table']) {
- if (isset($default_data[$priority]['values_array'][$field['chado_field']])) {
- if (isset($field2column[$priority][$field['chado_field']])) {
- $field2column[$priority][$field['chado_field']] = $field['value'];
- }
- else {
- $default_data[$priority]['values_array'][$field['chado_field']] = $field['value'];
- }
- }
- else {
- print "ERROR: Template has changed after constants were assigned!\n";
- watchdog('T_bulk_loader', 'Template has changed after constants were assigned', array(), WATCHDOG_NOTICE);
- exit(1);
- }
- }
- else {
- print "ERROR: Template has changed after constants were assigned!\n";
- watchdog('T_bulk_loader', 'Template has changed after constants were assigned', array(), WATCHDOG_NOTICE);
- exit(1);
- }
- }
- }
- }
-
- print "\tPreparing to load the current constant set...\n";
- print "\t\tOpen File...\n";
- $file = new SplFileObject($node->file, 'r');
- if (!$file) {
- watchdog('T_bulk_loader', 'Could not open file %file',
- array($node->file), WATCHDOG_ERROR);
- return;
- }
-
- $header = '';
- if (preg_match('/(t|true|1)/', $node->file_has_header)) {
- $file->next();
- $header = $file->current();
- }
- $num_records = 0;
- $num_lines = 0;
- $num_errors = 0;
- $interval = intval($total_lines * 0.0001);
- if ($interval == 0) {
- $interval = 1;
- }
-
- $savepoint = '';
- switch (variable_get('tripal_bulk_loader_transactions', 'row')) {
- case "none":
- break;
- case "all":
- print "\t\tStart Transaction...\n";
- tripal_db_start_transaction();
- $transactions = TRUE;
- $savepoint = "";
- break;
- case "row":
- print "\t\tStart Transaction...\n";
- tripal_db_start_transaction();
- $transactions = TRUE;
- $savepoint = "last_row_complete";
- break;
- }
-
- $triggers_disabled = FALSE;
- if ($transactions AND variable_get('tripal_bulk_loader_disable_triggers', TRUE)) {
- print "\t\tDefer Constraints...\n";
- $triggers_disabled = TRUE;
- chado_query("SET CONSTRAINTS ALL DEFERRED");
- }
-
- if ($transactions) {
- print "\t\tAcquiring Table Locks...\n";
- $lockmode = variable_get('tripal_bulk_loader_lock', 'ROW EXCLUSIVE');
- foreach ($tables as $table) {
- print "\t\t\t$lockmode for $table\n";
- chado_query("LOCK TABLE %s IN %s MODE", $table, $lockmode);
- }
- }
- print "\tLoading the current constant set...\n";
- tripal_bulk_loader_progress_bar(0, $total_lines);
- while (!$file->eof()) {
- $file->next();
- $raw_line = $file->current();
- $raw_line = trim($raw_line);
- if (empty($raw_line)) {
- continue;
- }
- $line = explode("\t", $raw_line);
- $num_lines++;
-
- if ($node->job_id and $num_lines % $interval == 0) {
-
- $group_progress = round(($num_lines / $total_lines) * 100);
- tripal_bulk_loader_progress_bar($num_lines, $total_lines);
-
-
-
-
-
-
-
- $job_progress = round(((($group_index - 1) * 100) + $group_progress) / $total_num_groups);
- tripal_job_set_progress($node->job_id, $job_progress);
- }
- $data = $default_data;
-
- $data_keys = array_keys($data);
- foreach ($data_keys as $priority) {
- $options = array(
- 'field2column' => $field2column,
- 'record2priority' => $record2priority,
- 'line' => $line,
- 'line_num' => $num_lines,
- 'group_index' => $group_index,
- 'node' => $node,
- 'nid' => $node->nid,
- );
-
- $no_errors = FALSE;
- if (array_key_exists($priority, $data) and
- array_key_exists('disabled', $data[$priority]) and
- $data[$priority]['disabled'] == 0) {
- $no_errors = process_data_array_for_line($priority, $data, $default_data, $options);
- }
- else {
-
- $no_errors = TRUE;
- }
- tripal_bulk_loader_progress_file_track_job($job_id, $no_errors);
- $failed = FALSE;
- if ( !$no_errors ) {
-
- if ($transactions) {
- tripal_db_rollback_transaction($savepoint);
- }
- $failed = TRUE;
- break;
- }
- }
- tripal_bulk_loader_progress_file_track_job($job_id, FALSE, TRUE);
- if ($failed) {
- break;
- }
- else {
-
-
- if ($savepoint) {
- if ($num_lines == 1) {
- tripal_db_set_savepoint_transaction($savepoint);
- }
- else {
-
- tripal_db_set_savepoint_transaction($savepoint, TRUE);
- }
- }
- }
- }
-
- if ($transactions) {
-
- tripal_db_commit_transaction();
- }
- if ($failed) {
- $loaded_without_errors = FALSE;
- break;
- }
- tripal_bulk_loader_progress_bar($total_lines, $total_lines);
- tripal_bulk_loader_progress_file_track_job($job_id, FALSE, FALSE, TRUE);
- }
-
- if ($loaded_without_errors) {
- $status = 'Loading Completed Successfully';
- }
- else {
- $status = 'Errors Encountered';
- }
- db_query("UPDATE {tripal_bulk_loader} SET job_status='%s' WHERE nid=%d", $status, $nid);
- }
- function process_data_array_for_line($priority, &$data, &$default_data, $addt) {
- $table_data = $data[$priority];
- $addt = (object) $addt;
- $no_errors = TRUE;
- $table = $table_data['table'];
- $values = $table_data['values_array'];
-
-
- if (array_key_exists('need_further_processing', $table_data) and $table_data['need_further_processing']) {
- if (array_key_exists($priority, $addt->field2column)) {
- $values = tripal_bulk_loader_add_spreadsheetdata_to_values($values, $addt->line, $addt->field2column[$priority]);
- }
- $values = tripal_bulk_loader_add_foreignkey_to_values($table_data, $values, $data, $addt->record2priority, $addt->nid, $priority, $default_data);
- }
- $values = tripal_bulk_loader_regex_tranform_values($values, $table_data, $addt->line);
- if (!$values) {
-
- }
-
- $table_desc = tripal_core_get_chado_table_schema($table);
-
-
-
- $skip_optional = 0;
- foreach ($table_data['required'] as $field => $required) {
- if ($required) {
-
- if (!isset($values[$field]) or
- (is_array($values[$field]) and count($values[$field]) == 0)) {
-
-
- if ($table_data['optional'] or preg_match('/optional/', $table_data['mode']) or
- $table_data['select_optional']) {
- $skip_optional = 1;
-
-
-
- $values = array();
- }
- else {
- $msg = "\nLine " . $addt->line_num . ' "' . $table_data['record_id'] .
- '" (' . $table_data['mode'] . ') Missing template required value: ' . $table . '.' . $field;
- watchdog('T_bulk_loader', $msg, array(), WATCHDOG_WARNING);
- $data[$priority]['error'] = TRUE;
- $no_errors = FALSE;
- }
- }
- }
- }
-
-
-
- if (!$skip_optional and (preg_match('/insert/', $table_data['mode']) or
- preg_match('/optional/', $table_data['mode']))) {
-
- $fields = $table_desc['fields'];
- foreach ($fields as $field => $def) {
-
-
- if (array_key_exists('not null', $def) and $def['not null'] == 1 and
- !array_key_exists($field, $values) and
- !array_key_exists('default', $def) and
- strcmp($def['type'], 'serial') != 0) {
- $msg = "\nLine " . $addt->line_num . ' ' . $table_data['record_id'] .
- ' (' . $table_data['mode'] . ') Missing Database Required Value: ' . $table . '.' . $field;
- watchdog('T_bulk_loader', $msg, array(), WATCHDOG_ERROR);
- $data[$priority]['error'] = TRUE;
- }
- }
- }
-
- $data[$priority]['values_array'] = $values;
-
- if (array_key_exists('error', $data[$priority]) and $data[$priority]['error']) {
- watchdog('T_bulk_loader','Skipping processing of %table due to previous errors',array('%table'=>$table),WATCHDOG_NOTICE);
- return $no_errors;
- }
-
- if ($skip_optional) {
- watchdog('T_bulk_loader','Skipping an optional record (%record)',array('%record'=>$table_data['record_id']),WATCHDOG_NOTICE);
- return $no_errors;
- }
-
- if (array_key_exists('inserted', $table_data) and $table_data['inserted']) {
- watchdog('T_bulk_loader','Skipping %record since it is already inserted',array('%record'=>$table_data['record_id']),WATCHDOG_NOTICE);
- return $no_errors;
- }
-
-
- if (array_key_exists('selected', $table_data) and $table_data['selected']) {
- $data[$priority]['values_array'] = $default_data[$priority]['values_array'];
- watchdog('T_bulk_loader','%record was already selected thus we are just returning the values previously selected.',array('%record'=>$table_data['record_id']),WATCHDOG_NOTICE);
- return $no_errors;
- }
-
- if (!array_key_exists('select_if_duplicate', $table_data)) {
- $table_data['select_if_duplicate'] = 0;
- }
- if (!array_key_exists('update_if_duplicate', $table_data)) {
- $table_data['update_if_duplicate'] = 0;
- }
-
-
-
- $data[$priority]['is_duplicate'] = 0;
- if (preg_match('/insert_unique/', $table_data['mode']) or
- $table_data['select_if_duplicate'] == 1 or $table_data['update_if_duplicate'] == 1) {
- $options = array('is_duplicate' => TRUE);
- $duplicate = tripal_core_chado_select($table, array_keys($table_desc['fields']), $values, $options);
-
-
- if ($duplicate and is_array($duplicate) and count($duplicate) == 1) {
- $dup_record = $duplicate[0];
-
-
- $data[$priority]['is_duplicate'] = (array) $dup_record;
-
-
-
-
- if (count((array) $dup_record) == 1) {
- foreach ($dup_record as $key => $value) {
- $data[$priority]['values_array'] = $value;
- }
- }
-
-
- else {
-
- $new_values = array();
- foreach ($dup_record as $key => $value) {
- $new_values[$key] = $value;
- }
- $data[$priority]['values_array'] = $new_values;
- }
-
- if ($table_data['select_if_duplicate'] == 1) {
- watchdog('T_bulk_loader','Simply returning values for %record since it was already inserted',array('%record'=>$table_data['record_id']),WATCHDOG_NOTICE);
- return $no_errors;
- }
- }
- }
- else {
-
-
- }
- if (!preg_match('/select/', $table_data['mode'])) {
-
- if (variable_get('tripal_bulk_loader_prepare', TRUE)) {
- $options = array('statement_name' => 'record_' . $addt->nid . '_' . $priority);
- if (($addt->line_num > 1 && $addt->group_index == 1) OR $addt->group_index > 1) {
-
- }
- }
- else {
- $options = array();
- }
-
- if (variable_get('tripal_bulk_loader_skip_validation', FALSE)) {
- $options['skip_validation'] = TRUE;
- }
- if ($table_data['update_if_duplicate'] == 1) {
- if (array_key_exists('statement_name', $options)) {
- $options['statement_name'] = 'upd_' . $options['statement_name'];
- }
- $match = $data[$priority]['is_duplicate'];
- $record = tripal_core_chado_update($table, $match, $values, $options);
- }
- else {
- $record = tripal_core_chado_insert($table, $values, $options);
- }
-
- if (!$record) {
- $msg = "\nLine " . $addt->line_num . ' ' . $table_data['record_id'] . ' (' .
- $table_data['mode'] . ') Unable to insert record into ' . $table .
- ' where values:' . print_r($values, TRUE);
- watchdog('T_bulk_loader', $msg, array(), WATCHDOG_ERROR);
- $data[$priority]['error'] = TRUE;
- $no_errors = FALSE;
- }
-
- else {
-
- if (preg_match('/insert_once/', $table_data['mode'])) {
- $default_data[$priority]['inserted'] = TRUE;
- }
-
- if ($addt->node->keep_track_inserted) {
- $insert_record = db_fetch_object(db_query(
- "SELECT * FROM {tripal_bulk_loader_inserted} WHERE table_inserted_into='%s' AND nid=%d",
- $table,
- $addt->nid
- ));
- if ($insert_record) {
- $insert_record->ids_inserted .= ',' . $record[$table_desc['primary key'][0] ];
- drupal_write_record('tripal_bulk_loader_inserted', $insert_record, 'tripal_bulk_loader_inserted_id');
-
-
- }
- else {
- $insert_record = array(
- 'nid' => $addt->nid,
- 'table_inserted_into' => $table,
- 'table_primary_key' => $table_desc['primary key'][0],
- 'ids_inserted' => $record[ $table_desc['primary key'][0] ],
- );
-
- $success = drupal_write_record('tripal_bulk_loader_inserted', $insert_record);
-
- }
- }
-
-
- if (array_key_exists('primary key', $table_desc)) {
- if (count($table_desc['primary key']) == 1) {
- $pkey_field = $table_desc['primary key'][0];
- $data[$priority]['values_array'] = $record[$pkey_field];
- }
- }
- else {
-
- $data[$priority]['values_array'] = $record;
- $values = $record;
- }
- }
- }
-
- else {
-
- $matches = array();
- if (is_array($values) and count($values) > 0) {
- $matches = tripal_core_chado_select($table, array_keys($table_desc['fields']), $values);
- }
-
- if (count($matches) == 0) {
-
- if ($table_data['select_optional'] != 1) {
- $msg = "\nLine " . $addt->line_num . ' ' . $table_data['record_id'] . ' (' . $table_data['mode'] . ') No Matching record in ' . $table . ' where values:' . print_r($values, TRUE);
- watchdog('T_bulk_loader', $msg, array(), WATCHDOG_ERROR);
- $data[$priority]['error'] = TRUE;
- $no_errors = FALSE;
- }
-
-
- else {
- $data[$priority]['values_array'] = NULL;
- }
- }
-
- if (count($matches) > 1) {
- if ($table_data['select_optional'] != 1) {
- $msg = "\nLine " . $addt->line_num . ' ' . $table_data['record_id'] . ' (' . $table_data['mode'] . ') Too many matching records in ' . $table . ' where values:' . print_r($values, TRUE);
- watchdog('T_bulk_loader', $msg, array(), WATCHDOG_WARNING);
- $data[$priority]['error'] = TRUE;
- $no_errors = FALSE;
- }
-
-
- else {
- $data[$priority]['values_array'] = NULL;
- }
- }
-
- if (preg_match('/select_once/', $table_data['mode'])) {
- $default_data[$priority]['selected'] = TRUE;
-
- if (array_key_exists('primary key', $table_desc)) {
- $new_values = array();
- foreach ($matches[0] as $key => $value) {
- $new_values[$key] = $value;
- }
- $default_data[$priority]['values_default'] = $new_values;
- }
- }
- }
- return $no_errors;
- }
- function tripal_bulk_loader_add_spreadsheetdata_to_values($values, $line, $field2column) {
- foreach ($values as $field => $value) {
- if (is_array($value)) {
- continue;
- }
- $column = $field2column[$field] - 1;
- if ($column < 0) {
- continue;
- }
- if (preg_match('/\S+/', $line[$column])) {
- $values[$field] = $line[$column];
- }
- else {
- unset($values[$field]);
- }
- }
- return $values;
- }
- function tripal_bulk_loader_add_foreignkey_to_values($table_array, $values, $data, $record2priority, $nid,
- $priority, $default_data) {
-
-
- foreach ($values as $field => $value) {
-
- if (is_array($value)) {
-
- $foreign_record = $value['foreign record']['record'];
- $foreign_priority = $record2priority[$foreign_record];
- $foreign_table = $value['foreign record']['table'];
- $foreign_field = $value['foreign record']['field'];
-
- $foreign_values = $data[$foreign_priority]['values_array'];
-
-
-
- if (array_key_exists($foreign_priority, $default_data) and
- array_key_exists('values_default', $default_data[$foreign_priority]) and
- array_key_exists($foreign_field, $default_data[$foreign_priority]['values_default'])) {
- $values[$field] = $default_data[$foreign_priority]['values_default'][$foreign_field];
- continue;
- }
-
-
- $tbl_description = tripal_core_get_chado_table_schema($table_array['table']);
- if ($tbl_description and
- array_key_exists('foreign keys', $tbl_description) and
- array_key_exists($foreign_table, $tbl_description['foreign keys']) and
- array_key_exists($field, $tbl_description['foreign keys'][$foreign_table]['columns']) and
- $foreign_field == $tbl_description['foreign keys'][$foreign_table]['columns'][$field]) {
- $values[$field] = $foreign_values;
- }
-
-
-
- else {
-
-
- $fk_description = tripal_core_get_chado_table_schema($foreign_table);
- if (!is_array($foreign_values)) {
-
- if ($foreign_values) {
- $fvalues = array($fk_description['primary key'][0] => $foreign_values);
- $columns = array($foreign_field);
- $options = array('statement_name' => 'pk_' . $foreign_table);
- $record = tripal_core_chado_select($foreign_table, $columns, $fvalues, $options);
- if ($record) {
- $values[$field] = $record[0]->$foreign_field;
- }
- else {
- unset($values[$field]);
- }
- }
-
-
- else {
- unset($values[$field]);
- }
- }
-
-
- else {
- $fvalues = $foreign_values;
- $columns = array($foreign_field);
- $options = array('statement_name' => 'blk_' . $nid . $priority . $foreign_table);
- $record = tripal_core_chado_select($foreign_table, $columns, $fvalues, $options);
- if ($record) {
- $values[$field] = $record[0]->$foreign_field;
- }
- else {
- unset($values[$field]);
- }
- }
- }
- }
- }
-
- return $values;
- }
- function tripal_bulk_loader_regex_tranform_values($values, $table_data, $line) {
- if (!array_key_exists('regex_transform', $table_data) or
- empty($table_data['regex_transform']) or
- !array_key_exists('regex_transform', $table_data) or
- !is_array($table_data['regex_transform'])) {
- return $values;
- }
-
- foreach ($table_data['regex_transform'] as $field => $regex_array) {
- if (!array_key_exists('replace', $regex_array) or
- !array_key_exists('pattern', $regex_array) or
- !is_array($regex_array['replace'])) {
- continue;
- }
-
-
- foreach ($regex_array['replace'] as $key => $replace) {
- if (preg_match_all('/<#column:(\d+)#>/', $replace, $matches)) {
- foreach ($matches[1] as $k => $column_num) {
- $replace = preg_replace('/' . $matches[0][$k] .'/', $line[$column_num-1], $replace);
- }
- $regex_array['replace'][$key] = $replace;
- }
- }
-
- $old_value = $values[$field];
- $new_value = preg_replace($regex_array['pattern'], $regex_array['replace'], $old_value);
- $values[$field] = $new_value;
- if ($values[$field] === '') {
- unset($values[$field]);
- }
-
- }
- return $values;
- }
- function tripal_bulk_loader_flatten_array($values) {
- $flattened_values = array();
- foreach ($values as $k => $v) {
- if (is_array($v)) {
- $vstr = array();
- foreach ($v as $vk => $vv) {
- if (drupal_strlen($vv) > 20) {
- $vstr[] = $vk . '=>' . drupal_substr($vv, 0, 20) . '...';
- }
- else {
- $vstr[] = $vk . '=>' . $vv;
- }
- }
- $v = '{' . implode(',', $vstr) . '}';
- }
- elseif (drupal_strlen($v) > 20) {
- $v = drupal_substr($v, 0, 20) . '...';
- }
- $flattened_values[] = $k . '=>' . $v;
- }
- return implode(', ', $flattened_values);
- }
- function tripal_bulk_loader_progress_bar($current=0, $total=100, $size=50) {
- $new_bar = FALSE;
- $mem = memory_get_usage();
-
- if ($current == 0) {
- $new_bar = TRUE;
- fputs(STDOUT, "Progress:\n");
- }
-
- $percent = sprintf("%.02f", round(($current/$total) * 100, 2));
-
- for ($i = strlen($percent); $i <= 4; $i++) {
- $percent = ' ' . $percent;
- }
- $total_size = $size + $i + 3 + 2;
- $place = 0;
-
- if (!$new_bar) {
- for ($place = $total_size; $place > 0; $place--) {
-
-
- }
- }
-
-
- echo '[';
- for ($place = 0; $place <= $size; $place++) {
-
- if ($place <= ($current / $total * $size)) {
- echo '|';
- }
- else {
-
- echo '-';
- }
- }
-
- echo ']';
-
- echo " $percent%. ($current of $total) Memory: $mem\r";
-
- if ($current == $total) {
- echo "\n";
- }
- }
- function tripal_bulk_loader_progress_file_track_job($job_id, $record_added, $line_complete = FALSE, $close = FALSE) {
-
- $file_handle = variable_get('tripal_bulk_loader_progress_file_handle', NULL);
-
- if (!$file_handle) {
- $file_handle = fopen('/tmp/tripal_bulk_loader_progress-'. $job_id . '.out', 'w');
- variable_set('tripal_bulk_loader_progress_file_handle', $file_handle);
- }
- if ($record_added) {
- fwrite($file_handle, '.');
- }
- if ($line_complete) {
- fwrite($file_handle, "\n");
- }
-
- if ($close) {
- fclose($file_handle);
- variable_set('tripal_bulk_loader_progress_file_handle', NULL);
- }
- }
|