tripal_bulk_loader.module 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571
  1. <?php
  2. include('tripal_bulk_loader.loader.inc');
  3. include('tripal_bulk_loader.constants.inc');
  4. include('tripal_bulk_loader.admin.inc');
  5. include('tripal_bulk_loader.admin.templates.inc');
  /**
   * Implements hook_init().
   *
   * Queues the bulk loader stylesheet and javascript file. Both files are
   * looked up relative to the path Drupal reports for the 'tripal' theme.
   */
  function tripal_bulk_loader_init() {
    $theme_dir = drupal_get_path('theme', 'tripal');

    drupal_add_css($theme_dir . '/css/tripal_bulk_loader.css');
    drupal_add_js($theme_dir . '/js/tripal_bulk_loader.js');
  }
  /**
   * Implements hook_menu().
   *
   * Registers the constant-set edit/delete forms that hang off a bulk loading
   * job node, the administrative pages for templates and jobs, and the AHAH
   * callbacks used by the template field forms. Every item requires the
   * 'administer site configuration' permission.
   *
   * @return
   *   An array of menu items keyed by path.
   */
  function tripal_bulk_loader_menu() {
    $admin_only = array('administer site configuration');
    $base = 'admin/tripal/tripal_bulk_loader_template';
    $manage = $base . '/manage_templates';

    $items = array();

    // Bulk Loading Job Node: edit or delete one set of constants. The node
    // (path argument 1) and the constant group (path argument 3) are handed
    // to the form builder.
    foreach (array('edit' => 'Edit', 'delete' => 'Delete') as $action => $label) {
      $items['node/%node/constants/%/' . $action] = array(
        'title' => $label . ' Constant Set',
        'description' => $label . ' a group of constants associated with the current bulk loader',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_' . $action . '_constant_set_form', 1, 3),
        'access arguments' => $admin_only,
        'type' => MENU_CALLBACK,
      );
    }

    // Admin pages.
    $items[$base] = array(
      'title' => 'Bulk Loader',
      'description' => 'Templates for loading tab-delimited data',
      'page callback' => 'tripal_bulk_loader_admin_template',
      'access arguments' => $admin_only,
      'type' => MENU_NORMAL_ITEM,
    );
    $items[$base . '/configure'] = array(
      'title' => 'Configure',
      'description' => 'Configuration of global options related to bulk loading jobs',
      'page callback' => 'drupal_get_form',
      'page arguments' => array('tripal_bulk_loader_configuration_form'),
      'access arguments' => $admin_only,
      'type' => MENU_NORMAL_ITEM,
    );
    $items[$manage] = array(
      'title' => 'Manage Templates',
      'description' => 'Create/Update/Delete/Import/Export Templates',
      'page callback' => 'tripal_bulk_loader_admin_manage_templates',
      'access arguments' => $admin_only,
      'type' => MENU_NORMAL_ITEM,
    );
    $items[$base . '/jobs'] = array(
      'title' => 'Jobs',
      'description' => 'Listing of Bulk Loading Jobs',
      'page callback' => 'tripal_bulk_loader_admin_jobs',
      'access arguments' => $admin_only,
      'type' => MENU_NORMAL_ITEM,
    );

    // Create/Edit Template: one shared form, told which mode it is in.
    foreach (array('create' => 'Create', 'edit' => 'Edit') as $mode => $label) {
      $items[$manage . '/' . $mode] = array(
        'title' => $label . ' Template',
        'description' => $label . ' loader template for loading tab-delimited data',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_modify_template_base_form', $mode),
        'access arguments' => $admin_only,
        'type' => MENU_NORMAL_ITEM,
      );
    }

    // Record/field forms for an existing template.
    $items[$base . '/edit_record'] = array(
      'title' => 'Edit Template Record',
      'description' => 'Edit a record in an existing tripal bulk loader template.',
      'page callback' => 'drupal_get_form',
      'page arguments' => array('tripal_bulk_loader_edit_template_record_form'),
      'access arguments' => $admin_only,
      'type' => MENU_CALLBACK,
    );
    $items[$base . '/add_field'] = array(
      'title' => 'Add Template Field',
      'description' => 'Add a template field to an existing tripal bulk loader template.',
      'page callback' => 'drupal_get_form',
      'page arguments' => array('tripal_bulk_loader_add_template_field_form'),
      'access arguments' => $admin_only,
      'type' => MENU_CALLBACK,
    );
    $items[$base . '/edit_field'] = array(
      'title' => 'Edit Template Field',
      'description' => 'Edit an existing field from a tripal bulk loader template.',
      'page callback' => 'drupal_get_form',
      'page arguments' => array('tripal_bulk_loader_edit_template_field_form'),
      'access arguments' => $admin_only,
      'type' => MENU_CALLBACK,
    );

    // Delete Template.
    $items[$manage . '/delete'] = array(
      'title' => 'Delete Template',
      'description' => 'Delete bulk loader template',
      'page callback' => 'drupal_get_form',
      'page arguments' => array('tripal_bulk_loader_delete_template_base_form'),
      'access arguments' => $admin_only,
      'type' => MENU_NORMAL_ITEM,
    );

    // Import/Export: one shared form, told which direction it is working in.
    foreach (array('import' => 'Import', 'export' => 'Export') as $direction => $label) {
      $items[$manage . '/' . $direction] = array(
        'title' => $label . ' Template',
        'description' => $label . ' Loaders',
        'page callback' => 'drupal_get_form',
        'page arguments' => array('tripal_bulk_loader_import_export_template_form', $direction),
        'access arguments' => $admin_only,
        'type' => MENU_NORMAL_ITEM,
      );
    }

    // AHAH callbacks for the add/edit field forms.
    foreach (array('add', 'edit') as $op) {
      $items[$base . '/' . $op . '_field_ahah'] = array(
        'page callback' => 'tripal_bulk_loader_' . $op . '_field_ahah',
        'access arguments' => $admin_only,
        'type' => MENU_CALLBACK,
      );
    }

    return $items;
  }
  /**
   * Implements hook_theme().
   *
   * Declares the theme hooks of this module: the constants form (no template
   * file), the template display (takes a template_id) and three forms that
   * are each rendered through a template file named after the form.
   *
   * @return
   *   An array of theme hook definitions keyed by hook name.
   */
  function tripal_bulk_loader_theme() {
    $hooks = array();

    $hooks['tripal_bulk_loader_set_constants_form'] = array(
      'arguments' => array('form' => NULL),
    );

    $hooks['tripal_bulk_loader_template'] = array(
      'arguments' => array('template_id' => NULL),
      'template' => 'tripal_bulk_loader_template',
    );

    // Forms whose template file shares the name of the form itself.
    $templated_forms = array(
      'tripal_bulk_loader_modify_template_base_form',
      'tripal_bulk_loader_edit_template_field_form',
      'tripal_bulk_loader_add_template_field_form',
    );
    foreach ($templated_forms as $form_id) {
      $hooks[$form_id] = array(
        'arguments' => array('form' => NULL),
        'template' => $form_id,
      );
    }

    return $hooks;
  }
  /**
   * Implements hook_access().
   *
   * Each node operation is paired with one module permission. When the account
   * lacks the permission for the requested operation, access is denied.
   *
   * @param $op
   *   The operation being performed: 'create', 'update', 'delete' or 'view'.
   * @param $node
   *   The node (or node type) the operation applies to; not inspected here.
   * @param $account
   *   The user account whose permissions are checked.
   *
   * @return
   *   FALSE when the account lacks the matching permission, NULL otherwise.
   */
  function tripal_bulk_loader_access($op, $node, $account) {
    $required_permission = array(
      'create' => 'create tripal_bulk_loader',
      'update' => 'edit tripal_bulk_loader',
      'delete' => 'delete tripal_bulk_loader',
      'view' => 'access tripal_bulk_loader',
    );

    foreach ($required_permission as $operation => $permission) {
      if ($op == $operation && !user_access($permission, $account)) {
        return FALSE;
      }
    }

    return NULL;
  }
  /**
   * Implements hook_perm().
   *
   * @return
   *   The list of permission names defined by this module: one each for
   *   accessing, creating, deleting and editing bulk loaders.
   */
  function tripal_bulk_loader_perm() {
    $permissions = array();
    foreach (array('access', 'create', 'delete', 'edit') as $verb) {
      $permissions[] = $verb . ' tripal_bulk_loader';
    }
    return $permissions;
  }
  210. //////////////////////////////////////////////////////////////////////////////////////////////
  211. // Node Functions
  212. //////////////////////////////////////////////////////////////////////////////////////////////
  /**
   * Implements hook_node_info().
   *
   * @return
   *   The definition of the single 'tripal_bulk_loader' node type: it has a
   *   title, no body, and is flagged as locked.
   */
  function tripal_bulk_loader_node_info() {
    return array(
      'tripal_bulk_loader' => array(
        'name' => t('Bulk Loading Job'),
        'module' => 'tripal_bulk_loader',
        'description' => t('A bulk loader for inserting tab-delimited data into chado database'),
        'has_title' => TRUE,
        'has_body' => FALSE,
        'locked' => TRUE,
      ),
    );
  }
  /**
   * Implements hook_form().
   *
   * Builds the fields used to gather the extra details stored with a Bulk
   * Loading Job node: job name, template, data file, header flag and whether
   * inserted record IDs are tracked.
   *
   * @param $node
   *   The node being created or edited. On a new node none of the loader
   *   properties are set yet.
   * @param $form_state
   *   The form state; when it carries 'values' (form rebuild) those values
   *   override the properties of $node.
   *
   * @return
   *   The form array. When no loader template exists, only an informational
   *   'label' item is returned.
   */
  function tripal_bulk_loader_form($node, $form_state) {
    $form = array();

    // On a rebuild the submitted values take precedence over the node values.
    if (isset($form_state['values'])) {
      $node = (object) ($form_state['values'] + (array) $node);
    }

    // Collect the available templates as template_id => name.
    $templates = array();
    $results = db_query("SELECT * FROM {tripal_bulk_loader_template}");
    while ($template = db_fetch_object($results)) {
      $templates[$template->template_id] = $template->name;
    }

    // A job cannot be described without a template to pick from.
    if (!$templates) {
      $form['label'] = array(
        '#type' => 'item',
        '#description' => t("Loader template needs to be created before any bulk loader can be added. Go to 'Tripal Management > Bulk Loader Template' to create the template."),
        '#weight' => -10,
      );
      return $form;
    }

    // The header flag is submitted as 'has_header' but stored/loaded as
    // 'file_has_header'; prefer the submitted value so a rebuilt form keeps
    // the user's selection.
    $has_header = NULL;
    if (isset($node->has_header)) {
      $has_header = $node->has_header;
    }
    elseif (isset($node->file_has_header)) {
      $has_header = $node->file_has_header;
    }

    $form['loader'] = array(
      '#type' => 'fieldset',
      '#title' => t('Basic Details'),
    );

    // isset() guards: these properties do not exist on a brand new node.
    $form['loader']['loader_name'] = array(
      '#type' => 'textfield',
      '#title' => t('Loading Job Name'),
      '#weight' => -10,
      '#required' => TRUE,
      '#default_value' => isset($node->loader_name) ? $node->loader_name : NULL,
    );

    $form['loader']['template_id'] = array(
      '#type' => 'select',
      '#title' => t('Template'),
      '#description' => t('Please specify a template for this loader'),
      '#options' => $templates,
      '#weight' => -9,
      '#required' => TRUE,
      '#default_value' => isset($node->template_id) ? $node->template_id : NULL,
    );

    $form['loader']['file'] = array(
      '#type' => 'textfield',
      '#title' => t('Data File'),
      '#description' => t('Please specify the data file to be loaded. This must be a tab-delimited text file with UNIX line endings.'),
      '#weight' => -8,
      '#default_value' => isset($node->file) ? $node->file : NULL,
    );

    // Note the stored values: 1 means "Yes" and 2 (not 0) means "No".
    $form['loader']['has_header'] = array(
      '#type' => 'radios',
      '#title' => t('File has a Header'),
      '#options' => array(1 => t('Yes'), 2 => t('No')),
      '#weight' => -7,
      '#default_value' => $has_header,
    );

    // Weight -6 (was -7, tied with the header flag) keeps this element after
    // the header flag regardless of how ties are sorted.
    $form['loader']['keep_track_inserted'] = array(
      '#type' => 'radios',
      '#title' => t('Keep track of inserted record IDs'),
      '#description' => t('This enables the ability to revert an entire loading job even if '
        . 'it completed successfully. Furthermore, it displays the number of records '
        . 'successfully inserted into each table.'),
      '#options' => array(1 => t('Yes'), 0 => t('No')),
      '#weight' => -6,
      '#default_value' => isset($node->keep_track_inserted)
        ? $node->keep_track_inserted
        : variable_get('tripal_bulk_loader_keep_track_inserted', FALSE),
    );

    return $form;
  }
  /**
   * Implements hook_load().
   *
   * Loads the {tripal_bulk_loader} record for the node and decorates it with
   * the associated tripal job, the loader template (with its template array
   * unserialized), per-table inserted-record summaries, the list of exposed
   * template fields and the constants grouped by group/record/field.
   *
   * @param $node
   *   The node being loaded; only its nid is read.
   *
   * @return
   *   The loader record object with these properties added: title, job,
   *   template, inserted_records (only when records were inserted),
   *   exposed_fields and constants.
   */
  function tripal_bulk_loader_load($node) {
    // NOTE(review): assumes a {tripal_bulk_loader} row exists for this nid;
    // the record replaces the incoming $node for the rest of the function.
    $sql = "SELECT * FROM {tripal_bulk_loader} WHERE nid = %d";
    $node = db_fetch_object(db_query($sql, $node->nid));
    $node->title = 'Bulk Loading Job: ' . $node->loader_name;

    // Add job details. The progress helper is called only for its side effect
    // (it may update the stored job progress); its return value is not used.
    tripal_bulk_loader_progess_file_get_progress($node->job_id);
    $sql = "SELECT * FROM {tripal_jobs} WHERE job_id=%d";
    $node->job = db_fetch_object(db_query($sql, $node->job_id));

    // Add the loader template.
    // NOTE(review): unserialize() is applied to data read from this module's
    // own table; confirm nothing untrusted can be written there.
    $sql = "SELECT * FROM {tripal_bulk_loader_template} WHERE template_id=%d";
    $template_record = db_fetch_object(db_query($sql, $node->template_id));
    $template = FALSE;
    if ($template_record) {
      $template = unserialize($template_record->template_array);
    }
    else {
      // No such template: expose an empty template object rather than
      // assigning a property on FALSE (a fatal error on PHP 8).
      $template_record = new stdClass();
    }
    $node->template = $template_record;
    $node->template->template_array = $template;

    // Add inserted records, keyed by the table they were inserted into.
    $sql = 'SELECT * FROM {tripal_bulk_loader_inserted} WHERE nid=%d';
    $resource = db_query($sql, $node->nid);
    while ($r = db_fetch_object($resource)) {
      // ids_inserted is a comma-separated list of ids.
      $r->num_inserted = count(explode(',', $r->ids_inserted));
      // Create the container on first use so the property stays unset when
      // nothing was inserted.
      if (!isset($node->inserted_records)) {
        $node->inserted_records = new stdClass();
      }
      $node->inserted_records->{$r->table_inserted_into} = $r;
    }

    // Add exposed field list.
    $node->exposed_fields = array();
    if ($template) {
      foreach ($template as $record_id => $record) {
        foreach ($record['fields'] as $field_id => $field) {
          if (!empty($field['exposed'])) {
            $node->exposed_fields[] = array(
              'record_id' => $record_id,
              'field_id' => $field_id,
              'title' => $field['title'],
            );
          }
        }
      }
      // A template without exposed fields still yields one (empty) entry.
      if (empty($node->exposed_fields)) {
        $node->exposed_fields[] = array();
      }
    }

    // Add constants.
    $sql = 'SELECT * FROM {tripal_bulk_loader_constants} WHERE nid=%d ORDER BY group_id, record_id, field_id';
    $resource = db_query($sql, $node->nid);
    while ($r = db_fetch_object($resource)) {
      $node->constants[$r->group_id][$r->record_id][$r->field_id] = array(
        'constant_id' => $r->constant_id,
        'group_id' => $r->group_id,
        'chado_table' => $r->chado_table,
        'chado_field' => $r->chado_field,
        'record_id' => $r->record_id,
        'field_id' => $r->field_id,
        'value' => $r->value,
      );
    }
    // Without constants the property still holds one (empty) group.
    if (empty($node->constants)) {
      $node->constants[] = array();
    }

    return $node;
  }
  /**
   * Implements hook_insert().
   *
   * Stores the data from the node form when a Bulk Loading Job is created and
   * sets the node title to the loader name.
   *
   * @param $node
   *   The node being inserted. Reads nid, vid, loader_name, template_id, file,
   *   has_header and keep_track_inserted.
   */
  function tripal_bulk_loader_insert($node) {
    // Insert into tripal_bulk_loader. A new job always starts as 'Initialized'.
    $sql = "INSERT INTO {tripal_bulk_loader} (nid, loader_name, template_id, file, file_has_header, job_status, keep_track_inserted) VALUES (%d, '%s', %d, '%s', %d, '%s', %d)";
    db_query($sql, $node->nid, $node->loader_name, $node->template_id, $node->file, $node->has_header, 'Initialized', $node->keep_track_inserted);

    // Update title on the node and on its current revision.
    $node->title = $node->loader_name;
    drupal_write_record('node', $node, 'nid');
    // The Drupal 6 revision table is {node_revisions}, keyed by vid; the
    // previous write to 'node_revision' matched no schema and changed nothing.
    // A targeted UPDATE is used so that only the title of this revision is
    // touched.
    db_query("UPDATE {node_revisions} SET title = '%s' WHERE vid = %d", $node->title, $node->vid);

    drupal_set_message(t('After reviewing the details, please Submit this Job (by clicking the "Submit Job" button below). No data will be loaded until the submitted job is reached in the queue.'));
  }
  /**
   * Implements hook_delete().
   *
   * Removes the {tripal_bulk_loader} record that belongs to the node being
   * deleted.
   *
   * @param $node
   *   The node being deleted; only its nid is read.
   */
  function tripal_bulk_loader_delete($node) {
    db_query("DELETE FROM {tripal_bulk_loader} WHERE nid = %d", $node->nid);
  }
  /**
   * Implements hook_update().
   *
   * Writes the values submitted through the node edit form back to the
   * {tripal_bulk_loader} record. When the node carries a truthy 'job'
   * property, a loading job is additionally scheduled for the current user,
   * provided the data file is readable; otherwise a message is shown and no
   * job is scheduled.
   *
   * @param $node
   *   The node being updated. Reads nid, loader_name, template_id, file,
   *   has_header, keep_track_inserted and job.
   */
  function tripal_bulk_loader_update($node) {
    global $user;

    // Update tripal_bulk_loader.
    db_query(
      "UPDATE {tripal_bulk_loader} SET nid = %d, loader_name = '%s', template_id = %d, file = '%s', file_has_header = '%s', keep_track_inserted = %d WHERE nid = %d",
      $node->nid,
      $node->loader_name,
      $node->template_id,
      $node->file,
      $node->has_header,
      $node->keep_track_inserted,
      $node->nid
    );

    // Nothing more to do unless the user wants to load the data.
    if (!$node->job) {
      return;
    }

    if (!is_readable($node->file)) {
      drupal_set_message(t("Can not open %file. Job not scheduled.", array('%file' => $node->file)));
      return;
    }

    // The job is labelled with the file name only (everything after the last
    // slash of the path).
    $job_args = array($node->loader_name, $node->template_id, $node->file);
    $fname = preg_replace("/.*\/(.*)/", "$1", $node->file);
    tripal_add_job("Bulk Load: $fname", 'tripal_bulk_loader', 'tripal_bulk_loader_load_data', $job_args, $user->uid);
  }
  404. ///////////////////////////////////////////////////////////
  /**
   * Preprocess function for the tripal_bulk_loader_template theme hook.
   *
   * Looks up the template record identified by $variables['template_id'],
   * unserializes its template array and hands the record to the theme layer
   * as $variables['template'].
   *
   * @param $variables
   *   The theme variables, passed by reference. Must contain 'template_id'.
   */
  function tripal_bulk_loader_preprocess_tripal_bulk_loader_template(&$variables) {
    $record = db_fetch_object(db_query(
      "SELECT * FROM {tripal_bulk_loader_template} WHERE template_id=%d",
      $variables['template_id']
    ));

    // The template definition is stored serialized; expose it as an array.
    $record->template_array = unserialize($record->template_array);

    $variables['template'] = $record;
  }
  /**
   * Get the progress of the current constant set from the progress file.
   *
   * When transactions are used, database updates to drupal cannot be made.
   * Thus a separate method to keep track of progress was implemented: save a
   * period to the file for each record successfully inserted; each line in the
   * file represents a processed line.
   *
   * @param $job_id
   *   The id of the tripal job to check the progress of.
   * @param $update_progress
   *   (optional) When TRUE (the default) the computed overall percentage is
   *   written back through tripal_job_set_progress().
   *
   * @return
   *   An empty object when no progress file exists for the job. Otherwise an
   *   object with the following properties (the ones marked * are NULL unless
   *   the job has constant sets and is still part-way through them):
   *   - num_lines: number of lines in the progress file.
   *   - total_lines*: number of lines in the input file, minus the header
   *     line when the file has one.
   *   - percent_file*: percent of the input file loaded for the current
   *     constant set.
   *   - num_constant_sets_loaded*: constant sets loaded so far, derived from
   *     the stored job progress (NULL only when the job has no constant sets).
   *   - total_percent*: percent of the whole job that has been loaded.
   *   - num_records: number of non-empty lines in the progress file.
   *     NOTE(review): this counts lines containing at least one character,
   *     not individual periods — confirm which one callers expect.
   */
  function tripal_bulk_loader_progess_file_get_progress($job_id, $update_progress = TRUE) {
    $filename = '/tmp/tripal_bulk_loader_progress-' . $job_id . '.out';
    if (!file_exists($filename)) {
      return (object) array();
    }

    // Counted in PHP rather than through `wc`/`grep` so that no file path is
    // ever handed to a shell.
    $progress_counts = _tripal_bulk_loader_count_lines($filename);
    $num_lines = $progress_counts['lines'];
    $num_records = $progress_counts['non_empty'];

    // These stay NULL when the job has no constant sets or all sets are done.
    $total_lines = NULL;
    $percent = NULL;
    $num_constant_sets_loaded = NULL;
    $total_percent = NULL;

    $job = db_fetch_object(db_query("SELECT j.*, b.file, b.file_has_header, c.num as num_constant_sets
      FROM {tripal_jobs} j
      LEFT JOIN {tripal_bulk_loader} b ON b.job_id=j.job_id
      LEFT JOIN (
        SELECT nid, count(distinct(group_id)) as num
        FROM {tripal_bulk_loader_constants}
        GROUP BY nid
      ) c ON c.nid=b.nid
      WHERE j.job_id=%d", $job_id));

    if ($job && $job->num_constant_sets) {
      $num_constant_sets_loaded = round($job->progress / (100 / $job->num_constant_sets), 4);

      // If the next constant set has started loading
      if ($job->num_constant_sets != $num_constant_sets_loaded) {

        // total lines in input file
        $input_counts = _tripal_bulk_loader_count_lines($job->file);
        $total_lines = $input_counts['lines'];
        // The node form stores 1 for "Yes" and 2 for "No", so the flag must be
        // compared against 1 rather than tested for truthiness.
        if ($job->file_has_header == 1) {
          $total_lines--;
        }

        // percent of the current constant set loaded (0 when the input file
        // has no data lines, which would otherwise divide by zero)
        $percent = ($total_lines > 0) ? round($num_lines / $total_lines * 100, 2) : 0;

        // percent of the total job = (<# fully loaded constant sets> * 100 )
        //                           + <percent of current constant set>
        //                           / <total number of constant sets>
        $total_percent = (($num_constant_sets_loaded * 100) + $percent) / $job->num_constant_sets;

        // update the progress of the job
        // NOTE(review): the original also tested
        // ($percent != 0 OR $percent != 100), which is always true; confirm
        // whether updates at exactly 0% / 100% were meant to be skipped.
        if ($update_progress) {
          tripal_job_set_progress($job_id, round($total_percent, 0));
        }
      }
    }

    return (object) array(
      'num_lines' => $num_lines,
      'total_lines' => $total_lines,
      'percent_file' => $percent,
      'num_constant_sets_loaded' => $num_constant_sets_loaded,
      'total_percent' => $total_percent,
      'num_records' => $num_records,
    );
  }

  /**
   * Counts the lines of a file without invoking a shell.
   *
   * @param $path
   *   Path of the file to read.
   *
   * @return
   *   An array with two integer counts, both 0 when the file cannot be read:
   *   - lines: number of newline-terminated lines.
   *   - non_empty: number of lines that contain at least one character besides
   *     the terminating newline.
   */
  function _tripal_bulk_loader_count_lines($path) {
    $counts = array('lines' => 0, 'non_empty' => 0);

    if (!is_string($path) || $path === '' || !is_file($path) || !is_readable($path)) {
      return $counts;
    }
    $handle = fopen($path, 'rb');
    if (!$handle) {
      return $counts;
    }

    while (($line = fgets($handle)) !== FALSE) {
      // A trailing fragment without a newline is not counted as a line.
      if (substr($line, -1) === "\n") {
        $counts['lines']++;
      }
      if (rtrim($line, "\n") !== '') {
        $counts['non_empty']++;
      }
    }
    fclose($handle);

    return $counts;
  }
  /**
   * Implements hook_job_describe_args().
   *
   * Makes viewing past tripal jobs more readable for jobs registered by this
   * module: the first argument of a 'tripal_bulk_loader_load_data' job is
   * treated as the nid of a bulk loader node and is replaced by a link to
   * that node.
   *
   * @param $callback
   *   The callback passed into tripal_add_job().
   * @param $args
   *   The arguments passed into tripal_add_job().
   *
   * @return
   *   An array where keys are the human readable headers describing each
   *   argument and the values are the arguments after formatting. The array is
   *   empty for callbacks this module does not describe and when the node
   *   cannot be loaded.
   */
  function tripal_bulk_loader_job_describe_args($callback, $args) {
    $new_args = array();

    if ($callback == 'tripal_bulk_loader_load_data' && isset($args[0])) {
      // 1st arg is the nid for a bulk loader node
      $node = node_load($args[0]);
      // Skip the description when the node could not be loaded instead of
      // reading the title of a non-object.
      if ($node) {
        $new_args['Bulk Loading Job'] = l($node->title, 'node/' . $args[0]);
      }
    }

    return $new_args;
  }
  /**
   * Implements hook_coder_ignore().
   *
   * Points coder at this module's directory, which is where the file holding
   * the ignore rules (tripal_bulk_loader.coder_ignores.txt) is stored.
   *
   * @return
   *   An array with 'path' and 'line prefix', both set to the module path.
   */
  function tripal_bulk_loader_coder_ignore() {
    $module_dir = drupal_get_path('module', 'tripal_bulk_loader');

    return array(
      'path' => $module_dir,
      'line prefix' => $module_dir,
    );
  }
  509. }