tripal_bulk_loader.module 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572
  1. <?php
  2. include('tripal_bulk_loader.loader.inc');
  3. include('tripal_bulk_loader.constants.inc');
  4. include('tripal_bulk_loader.admin.inc');
  5. include('tripal_bulk_loader.admin.templates.inc');
  /**
   * Implements hook_init().
   *
   * Queues the bulk loader stylesheet and javascript file, both located under
   * the 'tripal' theme directory, so they are added to the page header.
   */
  function tripal_bulk_loader_init() {
    $theme_dir = drupal_get_path('theme', 'tripal');

    drupal_add_css($theme_dir . '/css/tripal_bulk_loader.css');
    drupal_add_js($theme_dir . '/js/tripal_bulk_loader.js');
  }
  /**
   * Implements hook_menu().
   *
   * Registers the constant-set edit/delete forms that hang off a bulk loading
   * job node, the bulk loader administration pages, the template
   * create/edit/delete/import/export forms and the two AHAH callbacks.
   *
   * Every route requires the 'administer site configuration' permission.
   *
   * @return
   *   An array of menu items keyed by path.
   */
  function tripal_bulk_loader_menu() {
    $admin = 'admin/tripal/tripal_bulk_loader_template';
    $manage = $admin . '/manage_templates';

    // Shared tail of every item. The union operator appends these keys after
    // the item-specific ones, so each item keeps the key order
    // title, description, page callback, page arguments, access arguments, type.
    $restricted = array('access arguments' => array('administer site configuration'));
    $hidden = $restricted + array('type' => MENU_CALLBACK);
    $listed = $restricted + array('type' => MENU_NORMAL_ITEM);

    return array(
      // Bulk Loading Job Node
      'node/%node/constants/%/edit' => array(
        'title' => 'Edit Constant Set',
        'description' => 'Edit a group of constants associated with the current bulk loader',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_edit_constant_set_form', 1, 3),
      ) + $hidden,
      'node/%node/constants/%/delete' => array(
        'title' => 'Delete Constant Set',
        'description' => 'Delete a group of constants associated with the current bulk loader',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_delete_constant_set_form', 1, 3),
      ) + $hidden,

      // Admin pages
      $admin => array(
        'title' => 'Bulk Loader',
        'description' => 'Templates for loading tab-delimited data',
        'page callback' => 'tripal_bulk_loader_admin_template',
      ) + $listed,
      $admin . '/configure' => array(
        'title' => 'Configure',
        'description' => 'Configuration of global options related to bulk loading jobs',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_configuration_form'),
      ) + $listed,
      $manage => array(
        'title' => 'Manage Templates',
        'description' => 'Create/Update/Delete/Import/Export Templates',
        'page callback' => 'tripal_bulk_loader_admin_manage_templates',
      ) + $listed,
      $admin . '/jobs' => array(
        'title' => 'Bulk Loader Jobs',
        'description' => 'Listing of Bulk Loading Jobs',
        'page callback' => 'tripal_bulk_loader_admin_jobs',
      ) + $listed,

      // Create/Edit Template
      $manage . '/create' => array(
        'title' => 'Create Template',
        'description' => 'Create loader template for loading tab-delimited data',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_modify_template_base_form', 'create'),
      ) + $listed,
      $manage . '/edit' => array(
        'title' => 'Edit Template',
        'description' => 'Edit loader template for loading tab-delimited data',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_modify_template_base_form', 'edit'),
      ) + $listed,
      $admin . '/edit_record' => array(
        'title' => 'Edit Template Record',
        'description' => 'Edit a record in an existing tripal bulk loader template.',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_edit_template_record_form'),
      ) + $hidden,
      $admin . '/add_field' => array(
        'title' => 'Add Template Field',
        'description' => 'Add a template field to an existing tripal bulk loader template.',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_add_template_field_form'),
      ) + $hidden,
      $admin . '/edit_field' => array(
        'title' => 'Edit Template Field',
        'description' => 'Edit an existing field from a tripal bulk loader template.',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_edit_template_field_form'),
      ) + $hidden,

      // Delete Template
      $manage . '/delete' => array(
        'title' => 'Delete Template',
        'description' => 'Delete bulk loader template',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_delete_template_base_form'),
      ) + $listed,

      // Import/Export
      $manage . '/import' => array(
        'title' => 'Import Template',
        'description' => 'Import Loaders',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_import_export_template_form', 'import'),
      ) + $listed,
      $manage . '/export' => array(
        'title' => 'Export Template',
        'description' => 'Export Loaders',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_import_export_template_form', 'export'),
      ) + $listed,

      // AHAH
      $admin . '/add_field_ahah' => array(
        'page callback' => 'tripal_bulk_loader_add_field_ahah',
      ) + $hidden,
      $admin . '/edit_field_ahah' => array(
        'page callback' => 'tripal_bulk_loader_edit_field_ahah',
      ) + $hidden,
    );
  }
  /**
   * Implements hook_theme().
   *
   * Declares the theme hooks of this module: the constants form (no template
   * file), the template display, and three forms that are each rendered
   * through a template file named after the form.
   *
   * @return
   *   An array of theme hook definitions keyed by hook name.
   */
  function tripal_bulk_loader_theme() {
    $hooks = array();

    $hooks['tripal_bulk_loader_set_constants_form'] = array(
      'arguments' => array('form' => NULL),
    );
    $hooks['tripal_bulk_loader_template'] = array(
      'arguments' => array('template_id' => NULL),
      'template' => 'tripal_bulk_loader_template',
    );

    // These forms all take the form array and use a same-named template file.
    $templated_forms = array(
      'tripal_bulk_loader_modify_template_base_form',
      'tripal_bulk_loader_edit_template_field_form',
      'tripal_bulk_loader_add_template_field_form',
    );
    foreach ($templated_forms as $form_id) {
      $hooks[$form_id] = array(
        'arguments' => array('form' => NULL),
        'template' => $form_id,
      );
    }

    return $hooks;
  }
  /**
   * Implements hook_access().
   *
   * Denies an operation when the account lacks the matching
   * tripal_bulk_loader permission; otherwise expresses no opinion.
   *
   * @param $op
   *   The operation being checked: 'create', 'update', 'delete' or 'view'.
   * @param $node
   *   The node (or node type) the operation applies to. Not inspected here.
   * @param $account
   *   The user account whose permissions are checked.
   *
   * @return
   *   FALSE when the required permission is missing, NULL in every other case.
   */
  function tripal_bulk_loader_access($op, $node, $account) {
    // Operation => permission required to perform it.
    $required = array(
      'create' => 'create tripal_bulk_loader',
      'update' => 'edit tripal_bulk_loader',
      'delete' => 'delete tripal_bulk_loader',
      'view' => 'access tripal_bulk_loader',
    );

    foreach ($required as $operation => $permission) {
      if ($op == $operation && !user_access($permission, $account)) {
        return FALSE;
      }
    }

    return NULL;
  }
  /**
   * Implements hook_perm().
   *
   * @return
   *   The list of permissions defined by this module: access, create, delete
   *   and edit, each suffixed with ' tripal_bulk_loader'.
   */
  function tripal_bulk_loader_perm() {
    $permissions = array();
    foreach (array('access', 'create', 'delete', 'edit') as $action) {
      $permissions[] = $action . ' tripal_bulk_loader';
    }
    return $permissions;
  }
  210. //////////////////////////////////////////////////////////////////////////////////////////////
  211. // Node Functions
  212. //////////////////////////////////////////////////////////////////////////////////////////////
  /**
   * Implements hook_node_info().
   *
   * Declares the single 'tripal_bulk_loader' content type (a bulk loading job),
   * which has a title, no body and is locked.
   *
   * @return
   *   An array of node type definitions keyed by type name.
   */
  function tripal_bulk_loader_node_info() {
    return array(
      'tripal_bulk_loader' => array(
        'name' => t('Bulk Loading Job'),
        'module' => 'tripal_bulk_loader',
        'description' => t('A bulk loader for inserting tab-delimited data into chado database'),
        'has_title' => TRUE,
        'has_body' => FALSE,
        'locked' => TRUE,
      ),
    );
  }
  /**
   * Implements hook_form().
   *
   * Builds the node form used to gather the extra details stored with a Bulk
   * Loading Job node: job name, template, data file, whether the file has a
   * header and whether inserted record IDs should be tracked.
   *
   * When no loader template exists yet, the form only contains a notice asking
   * for one to be created first.
   *
   * @param $node
   *   The node being added or edited.
   * @param $form_state
   *   The form state array; submitted values, when present, override the
   *   corresponding node properties.
   *
   * @return
   *   The form array.
   */
  function tripal_bulk_loader_form($node, $form_state) {
    $form = array();

    // On a rebuild the submitted values take precedence over the stored node.
    if (isset($form_state['values'])) {
      $node = $form_state['values'] + (array) $node;
      $node = (object) $node;
    }

    // Collect the available templates as template_id => name.
    $templates = array();
    $results = db_query("SELECT * FROM {tripal_bulk_loader_template}");
    while ($template = db_fetch_object($results)) {
      $templates[$template->template_id] = $template->name;
    }

    if (!$templates) {
      $form['label'] = array(
        '#type' => 'item',
        '#description' => t("Loader template needs to be created before any bulk loader can be added. Go to 'Tripal Management > Bulk Loader Template' to create the template."),
        '#weight' => -10,
      );
      return $form;
    }

    // The form element is named 'has_header' while the stored column (and thus
    // the loaded node property) is 'file_has_header'. Prefer the submitted
    // value so the user's choice survives a form rebuild, then fall back to
    // the stored one.
    $has_header = NULL;
    if (isset($node->has_header)) {
      $has_header = $node->has_header;
    }
    elseif (isset($node->file_has_header)) {
      $has_header = $node->file_has_header;
    }

    $form['loader'] = array(
      '#type' => 'fieldset',
      '#title' => t('Basic Details'),
    );

    // isset() guards: none of these properties exist on a brand new node.
    $form['loader']['loader_name'] = array(
      '#type' => 'textfield',
      '#title' => t('Loading Job Name'),
      '#weight' => -10,
      '#required' => TRUE,
      '#default_value' => isset($node->loader_name) ? $node->loader_name : NULL,
    );

    $form['loader']['template_id'] = array(
      '#type' => 'select',
      '#title' => t('Template'),
      '#description' => t('Please specify a template for this loader'),
      '#options' => $templates,
      '#weight' => -9,
      '#required' => TRUE,
      '#default_value' => isset($node->template_id) ? $node->template_id : NULL,
    );

    $form['loader']['file'] = array(
      '#type' => 'textfield',
      '#title' => t('Data File'),
      '#description' => t('Please specify the data file to be loaded. This must be a tab-delimited text file with UNIX line endings.'),
      '#weight' => -8,
      '#default_value' => isset($node->file) ? $node->file : NULL,
      '#maxlength' => 1024,
    );

    // Note the stored values: 1 means the file has a header, 2 means it does not.
    $form['loader']['has_header'] = array(
      '#type' => 'radios',
      '#title' => t('File has a Header'),
      '#options' => array(1 => t('Yes'), 2 => t('No')),
      '#weight' => -7,
      '#default_value' => $has_header,
    );

    $form['loader']['keep_track_inserted'] = array(
      '#type' => 'radios',
      '#title' => t('Keep track of inserted record IDs'),
      '#description' => t('This enables the ability to revert an entire loading job even if '
        . 'it completed successfully. Furthermore, it displays the number of records '
        . 'successfully inserted into each table.'),
      '#options' => array(1 => t('Yes'), 0 => t('No')),
      '#weight' => -7,
      // Falls back to the site-wide setting when the node has no value yet.
      '#default_value' => (isset($node->keep_track_inserted)) ? $node->keep_track_inserted : variable_get('tripal_bulk_loader_keep_track_inserted', FALSE),
    );

    return $form;
  }
  /**
   * Implements hook_load().
   *
   * Loads the tripal_bulk_loader row for the node and attaches to it:
   *  - title: 'Bulk Loading Job: ' followed by the loader name
   *  - job: the tripal_jobs row for the loader's job_id
   *  - template: the template row, with template_array unserialized
   *  - inserted_records: one entry per table, keyed by table_inserted_into,
   *    each with num_inserted set (only present when such rows exist)
   *  - exposed_fields: record_id/field_id/title of each exposed template field
   *  - constants: nested array keyed by group_id, record_id, field_id
   *
   * @param $node
   *   The node being loaded; only its nid is read.
   *
   * @return
   *   An object holding the properties described above.
   */
  function tripal_bulk_loader_load($node) {
    $nid = $node->nid;

    $loader = db_fetch_object(db_query("SELECT * FROM {tripal_bulk_loader} WHERE nid = %d", $nid));
    if (!$loader) {
      // No loader row for this node: continue with an explicit empty object
      // instead of relying on PHP implicitly creating one from FALSE.
      $loader = new stdClass();
    }
    $loader_name = isset($loader->loader_name) ? $loader->loader_name : '';
    $job_id = isset($loader->job_id) ? $loader->job_id : NULL;
    $template_id = isset($loader->template_id) ? $loader->template_id : NULL;

    $loader->title = 'Bulk Loading Job: ' . $loader_name;

    // Add job details. The progress function is called for its side effect
    // (with its default arguments it may update the job progress), so it runs
    // before the job row is read; its return value is not needed here.
    tripal_bulk_loader_progess_file_get_progress($job_id);
    $loader->job = db_fetch_object(db_query("SELECT * FROM {tripal_jobs} WHERE job_id=%d", $job_id));

    // Add the loader template.
    // NOTE(review): template_array is unserialize()d straight from the
    // database; this assumes only this module writes that column.
    $template = FALSE;
    $template_row = db_fetch_object(db_query("SELECT * FROM {tripal_bulk_loader_template} WHERE template_id=%d", $template_id));
    if ($template_row) {
      $template = unserialize($template_row->template_array);
    }
    else {
      // The referenced template no longer exists.
      $template_row = new stdClass();
    }
    $template_row->template_array = $template;
    $loader->template = $template_row;

    // Add inserted records.
    $resource = db_query('SELECT * FROM {tripal_bulk_loader_inserted} WHERE nid=%d', $nid);
    while ($r = db_fetch_object($resource)) {
      // ids_inserted is a comma-separated list of ids.
      $r->num_inserted = count(explode(',', $r->ids_inserted));
      // Create the container on first use so the property stays unset when
      // there are no rows, without assigning a property on an undefined value.
      if (!isset($loader->inserted_records)) {
        $loader->inserted_records = new stdClass();
      }
      $loader->inserted_records->{$r->table_inserted_into} = $r;
    }

    // Add exposed field list.
    $loader->exposed_fields = array();
    if ($template) {
      foreach ($template as $record_id => $record) {
        if (empty($record['fields'])) {
          continue;
        }
        foreach ($record['fields'] as $field_id => $field) {
          if (!empty($field['exposed'])) {
            $loader->exposed_fields[] = array(
              'record_id' => $record_id,
              'field_id' => $field_id,
              'title' => $field['title'],
            );
          }
        }
      }
      // Keep a single empty placeholder entry when nothing is exposed.
      if (empty($loader->exposed_fields)) {
        $loader->exposed_fields[] = array();
      }
    }

    // Add constants.
    $loader->constants = array();
    $resource = db_query('SELECT * FROM {tripal_bulk_loader_constants} WHERE nid=%d ORDER BY group_id, record_id, field_id', $nid);
    while ($r = db_fetch_object($resource)) {
      $loader->constants[$r->group_id][$r->record_id][$r->field_id] = array(
        'constant_id' => $r->constant_id,
        'group_id' => $r->group_id,
        'chado_table' => $r->chado_table,
        'chado_field' => $r->chado_field,
        'record_id' => $r->record_id,
        'field_id' => $r->field_id,
        'value' => $r->value,
      );
    }
    // Keep a single empty placeholder entry when there are no constants.
    if (!$loader->constants) {
      $loader->constants[] = array();
    }

    return $loader;
  }
  /**
   * Implements hook_insert().
   *
   * Stores the bulk loader details submitted through the node form, then sets
   * the node title to the loader name and tells the user how to proceed.
   *
   * @param $node
   *   The node being inserted, carrying the submitted form values
   *   (loader_name, template_id, file, has_header, keep_track_inserted).
   */
  function tripal_bulk_loader_insert($node) {
    // Insert into tripal_bulk_loader. New jobs start in the 'Initialized' state.
    $sql = "INSERT INTO {tripal_bulk_loader} (nid, loader_name, template_id, file, file_has_header, job_status, keep_track_inserted) VALUES (%d, '%s', %d, '%s', %d, '%s', %d)";
    db_query($sql, $node->nid, $node->loader_name, $node->template_id, $node->file, $node->has_header, 'Initialized', $node->keep_track_inserted);

    // Update title on the node and on its current revision.
    $node->title = $node->loader_name;
    drupal_write_record('node', $node, 'nid');
    // The Drupal 6 revision table is {node_revisions}, keyed by vid; writing to
    // 'node_revision' matched no table and left the revision title untouched.
    // Only the title column is updated so no other revision data is altered.
    db_query("UPDATE {node_revisions} SET title = '%s' WHERE vid = %d", $node->title, $node->vid);

    drupal_set_message(t('After reviewing the details, please Submit this Job (by clicking the "Submit Job" button below). No data will be loaded until the submitted job is reached in the queue.'));
  }
  /**
   * Implements hook_delete().
   *
   * Removes the tripal_bulk_loader row belonging to the node being deleted.
   *
   * @param $node
   *   The node being deleted; only its nid is read.
   */
  function tripal_bulk_loader_delete($node) {
    db_query("DELETE FROM {tripal_bulk_loader} WHERE nid = %d", $node->nid);
  }
  /**
   * Implements hook_update().
   *
   * Saves the details submitted through the node edit form and, when the node
   * carries a 'job' value, schedules a tripal job that loads the data file.
   *
   * @param $node
   *   The node being updated, carrying the submitted form values
   *   (loader_name, template_id, file, has_header, keep_track_inserted).
   */
  function tripal_bulk_loader_update($node) {
    global $user;

    // Update tripal_bulk_loader. file_has_header uses the %d placeholder, as
    // in the insert query, so an empty radios value is stored as 0 rather
    // than as a quoted empty string.
    $sql = "UPDATE {tripal_bulk_loader} SET nid = %d, loader_name = '%s', template_id = %d, file = '%s', file_has_header = %d, keep_track_inserted = %d WHERE nid = %d";
    db_query($sql, $node->nid, $node->loader_name, $node->template_id, $node->file, $node->has_header, $node->keep_track_inserted, $node->nid);

    // Add a job if the user wants to load the data.
    if (empty($node->job)) {
      return;
    }

    $job_args = array($node->loader_name, $node->template_id, $node->file);

    if (is_readable($node->file)) {
      // Keep only the part of the path after the last slash for the job name.
      $fname = preg_replace("/.*\/(.*)/", "$1", $node->file);
      tripal_add_job("Bulk Load: $fname", 'tripal_bulk_loader', 'tripal_bulk_loader_load_data', $job_args, $user->uid);
    }
    else {
      drupal_set_message(t("Can not open %file. Job not scheduled.", array('%file' => $node->file)));
    }
  }
  405. ///////////////////////////////////////////////////////////
  /**
   * Preprocess function for the tripal_bulk_loader_template theme hook.
   *
   * Looks up the template row identified by $variables['template_id'],
   * unserializes its template_array and exposes the row to the template file
   * as $variables['template'].
   *
   * @param $variables
   *   The theme variables, passed by reference.
   */
  function tripal_bulk_loader_preprocess_tripal_bulk_loader_template(&$variables) {
    $result = db_query(
      "SELECT * FROM {tripal_bulk_loader_template} WHERE template_id=%d",
      $variables['template_id']
    );
    $row = db_fetch_object($result);

    $definition = unserialize($row->template_array);
    $row->template_array = $definition;

    $variables['template'] = $row;
  }
  /**
   * Get the progress of the current constant set from the progress file
   *
   * When transactions are used, database updates to drupal cannot be made. Thus a separate
   * method to keep track of progress was implemented: save a period to the file for each
   * record successfully inserted; each line in the file represents a processed line.
   *
   * @param $job_id
   *   The id of the tripal job to check the progress of
   * @param $update_progress
   *   Whether to also store the computed overall percentage on the tripal job
   *   (defaults to TRUE). Nothing is stored while the current constant set is
   *   at exactly 0% or 100%.
   *
   * @return
   *   An empty object when no progress file exists for the job. Otherwise an
   *   object with the following properties (the ones marked * are NULL when
   *   they could not be computed, e.g. the job has no constant sets, all sets
   *   are already loaded, or the input file has no countable lines):
   *     num_lines = the number of lines in the file processed so far
   *     total_lines = the total number of lines in the input file *
   *     percent_file = the percent the input file has been loaded *
   *     num_constant_sets_loaded = the number of fully loaded constant sets *
   *     total_percent = the percent of the whole job that has been loaded *
   *     num_records = the number of records successfully inserted
   */
  function tripal_bulk_loader_progess_file_get_progress($job_id, $update_progress = TRUE) {
    $filename = '/tmp/tripal_bulk_loader_progress-' . $job_id . '.out';
    if (!file_exists($filename)) {
      return (object) array();
    }

    // Paths are escaped before being handed to the shell.
    $progress_file = escapeshellarg($filename);
    // One line per processed input line ...
    $num_lines = trim((string) shell_exec('wc --lines < ' . $progress_file));
    // ... and one character per inserted record.
    $num_records = trim((string) shell_exec('grep -o "." ' . $progress_file . ' | wc --lines'));

    // These stay NULL unless a constant set is currently being loaded.
    $total_lines = NULL;
    $percent = NULL;
    $num_constant_sets_loaded = NULL;
    $total_percent = NULL;

    $job = db_fetch_object(db_query("SELECT j.*, b.file, b.file_has_header, c.num as num_constant_sets
      FROM {tripal_jobs} j
      LEFT JOIN {tripal_bulk_loader} b ON b.job_id=j.job_id
      LEFT JOIN (
        SELECT nid, count(distinct(group_id)) as num
        FROM {tripal_bulk_loader_constants}
        GROUP BY nid
      ) c ON c.nid=b.nid
      WHERE j.job_id=%d", $job_id));

    if ($job && $job->num_constant_sets) {
      $num_constant_sets_loaded = round($job->progress / (100 / $job->num_constant_sets), 4);

      // If the next constant set has started loading
      if ($job->num_constant_sets != $num_constant_sets_loaded) {

        // total lines in input file; the path comes from the node form, so it
        // must be escaped. An unreadable file yields 0.
        $total_lines = (int) trim((string) shell_exec('wc --lines < ' . escapeshellarg($job->file)));
        // The node form stores 1 for "has a header" and 2 for "no header", so
        // a plain truthiness check would also discount a line for 2.
        if ($job->file_has_header == 1) {
          $total_lines--;
        }

        // Without any data lines there is nothing to compute (and nothing to
        // divide by).
        if ($total_lines > 0) {
          // percent of the current constant set loaded
          $percent = round($num_lines / $total_lines * 100, 2);

          // percent of the total job = (<# fully loaded constant sets> * 100 )
          //                           + <percent of current constant set>
          //                           / <total number of constant sets>
          $total_percent = (($num_constant_sets_loaded * 100) + $percent) / $job->num_constant_sets;

          // update the progress of the job, but not at the boundaries of a
          // constant set: at 100% the set would be counted once here and again
          // once the job progress reflects it as fully loaded.
          if ($update_progress AND $percent != 0 AND $percent != 100) {
            tripal_job_set_progress($job_id, round($total_percent, 0));
          }
        }
      }
    }

    return (object) array(
      'num_lines' => $num_lines,
      'total_lines' => $total_lines,
      'percent_file' => $percent,
      'num_constant_sets_loaded' => $num_constant_sets_loaded,
      'total_percent' => $total_percent,
      'num_records' => $num_records,
    );
  }
  /**
   * Implements hook_job_describe_args()
   * Specifically to make viewing past tripal jobs more readable for jobs registered by this module
   *
   * @param $callback
   *   The callback passed into tripal_add_job()
   * @param $args
   *   The arguments passed into tripal_add_job()
   *
   * @return
   *   An array where keys are the human readable headers describing each argument
   *   and the value is the argument passed in after formatting. The array is
   *   empty when the callback is not 'tripal_bulk_loader_load_data' or when the
   *   first argument does not identify a loadable node.
   */
  function tripal_bulk_loader_job_describe_args($callback, $args) {
    $new_args = array();

    if ($callback == 'tripal_bulk_loader_load_data' && isset($args[0])) {
      // 1st arg is the nid for a bulk loader node
      $node = node_load($args[0]);
      // Only describe the argument when the node could actually be loaded.
      if ($node) {
        $new_args['Bulk Loading Job'] = l($node->title, 'node/' . $args[0]);
      }
    }

    // Always hand back an array, as documented, even for other callbacks.
    return $new_args;
  }
  /**
   * Implements hook_coder_ignore().
   *
   * Points coder at this module's directory, where the ignore rules file
   * (tripal_bulk_loader.coder_ignores.txt) is stored.
   *
   * @return
   *   An array with the keys 'path' and 'line prefix', both set to the path of
   *   this module.
   */
  function tripal_bulk_loader_coder_ignore() {
    $module_dir = drupal_get_path('module', 'tripal_bulk_loader');

    $rules = array();
    $rules['path'] = $module_dir;
    $rules['line prefix'] = $module_dir;

    return $rules;
  }
  510. }