TripalJob.inc 21 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665
  1. <?php
  /**
   * Represents a single job in the Tripal jobs queue (the {tripal_jobs} table).
   *
   * A new object is "empty"; it must be bound to a job record by calling either
   * load() (existing job) or create() (new job) before most other methods are
   * used. The getters simply read fields from the loaded record and therefore
   * require that a job has been loaded.
   *
   * The class also offers simple progress tracking for long running callbacks:
   * call setTotalItems() once, then setItemsHandled() or addItemsHandled() as
   * work proceeds. Progress is written to the database only when it has
   * advanced by at least the percentage configured with setInterval().
   */
  class TripalJob {

    /**
     * The ID of the job. Set by load().
     */
    protected $job_id = NULL;

    /**
     * Contains the job record for this job.
     */
    protected $job = NULL;

    /**
     * The number of items that this job needs to process. Progress is
     * calculated by dividing the number of items processed by this number.
     */
    private $total_items = 0;

    /**
     * The number of items that have been handled so far. This must never
     * be below 0 and never exceed $total_items.
     */
    private $num_handled = 0;

    /**
     * The interval when the job progress should be updated. Updating the job
     * progress incurs a database write which takes time and if it occurs too
     * frequently can slow down the loader. This should be a value between
     * 0 and 100 to indicate a percent interval (e.g. 1 means update the
     * progress every time the num_handled increases by 1%).
     *
     * Defaults to 1 so that a caller that never calls setInterval() does not
     * trigger a database write for every item handled.
     */
    private $interval = 1;

    /**
     * The percent complete that was reported at the last progress update. It
     * is used to calculate if the $interval has passed for the next update.
     */
    private $prev_update = 0;

    /**
     * The time stamp when the job begins.
     *
     * @var int
     */
    private $start_time;

    /**
     * The time stamp taken when setTotalItems() (or run()) was last called.
     * The duration printed with progress messages is measured from here.
     *
     * @var int
     */
    private $progress_start_time;

    /**
     * Instantiates a new TripalJob object.
     *
     * By default the job object is "empty". It must be associated with
     * job details either by calling the load() function or the
     * create() function.
     */
    public function __construct() {
    }

    /**
     * Loads a job for this object.
     *
     * @param $job_id
     *   The ID of the job. Another TripalJob object that already has a job
     *   loaded is also accepted, in which case its job ID is used.
     *
     * @throws Exception
     *   If no usable job ID is provided or no job with that ID exists. On
     *   failure the job previously held by this object is left untouched.
     */
    public function load($job_id) {
      // Make sure we have a numeric job_id.
      if (!$job_id or !is_numeric($job_id)) {
        // If we don't then do a quick double check in case this is a
        // TripalJob object in which case, we can still get the job_id.
        if (is_object($job_id) and $job_id instanceof TripalJob and $job_id->job) {
          $job_id = $job_id->job->job_id;
        }
        // Finally just throw an exception.
        // We can't load a job if we don't know which one.
        else {
          throw new Exception("You must provide the job_id to load the job.");
        }
      }

      $sql = 'SELECT j.* FROM {tripal_jobs} j WHERE j.job_id = :job_id';
      $args = array(':job_id' => $job_id);
      // Fetch into a local first so that a failed lookup does not clobber a
      // job that was loaded earlier.
      $job = db_query($sql, $args)->fetchObject();
      if (!$job) {
        throw new Exception("Cannot find a job with this ID provided.");
      }

      // Add human readable versions of the date/time fields.
      $job->submit_date_string = $job->submit_date ? format_date($job->submit_date) : '';
      $job->start_time_string = $job->start_time ? format_date($job->start_time) : '';
      $job->end_time_string = $job->end_time ? format_date($job->end_time) : '';

      // Unserialize the includes.
      // NOTE(review): unserialize() is applied to values read from the
      // {tripal_jobs} table; this presumes only create() writes that column.
      $job->includes = unserialize($job->includes);

      // Arguments for jobs used to be stored as plain string with a double
      // colon separating them. But as of Tripal v2.0 the arguments are stored
      // as a serialized array. To be backwards compatible, only try to
      // unserialize values that look like a serialized array and otherwise
      // split the ORIGINAL string the old way.
      $raw_arguments = $job->arguments;
      $arguments = FALSE;
      if (is_string($raw_arguments) and strpos($raw_arguments, 'a:') === 0) {
        $arguments = unserialize($raw_arguments);
      }
      if (!is_array($arguments)) {
        $arguments = explode('::', (string) $raw_arguments);
      }
      $job->arguments = $arguments;

      $this->job = $job;
      $this->job_id = $job->job_id;
    }

    /**
     * Creates a new job.
     *
     * @param $details
     *   An associative array of the job details. The following keys are
     *   allowed:
     *   - job_name: The human readable name for the job.
     *   - modulename: The name of the module adding the job.
     *   - callback: The name of a function to be called when the job is
     *     executed.
     *   - arguments: An array of arguments to be passed on to the callback.
     *   - uid: The uid of the user adding the job.
     *   - priority: (Optional). The priority at which to run the job where
     *     the highest priority is 10 and the lowest priority is 1. The
     *     default priority is 10.
     *   - includes: (Optional). An array of paths to files that should be
     *     included in order to execute the job. Use the module_load_include
     *     function to get a path for a given file.
     *   - ignore_duplicate: (Optional). Set to TRUE to ignore a job if it has
     *     the same name as another job which has not yet run. If TRUE and a
     *     job already exists then this object will reference the job already
     *     in the queue rather than a new submission. The default is FALSE.
     *
     * @throws Exception
     *   On failure an exception is thrown.
     *
     * @return
     *   Returns TRUE if the job was successfully created. Returns FALSE
     *   otherwise. A return of FALSE does not mean the job creation failed:
     *   if ignore_duplicate is set to TRUE and the job already is present in
     *   the queue then that job is loaded and the return value is FALSE.
     */
    public function create($details) {
      // Set some defaults.
      if (!array_key_exists('priority', $details)) {
        $details['priority'] = 10;
      }
      if (!array_key_exists('includes', $details)) {
        $details['includes'] = array();
      }
      if (!array_key_exists('ignore_duplicate', $details)) {
        $details['ignore_duplicate'] = FALSE;
      }

      // Make sure the arguments are correct. empty() is used so that a
      // missing key is reported as an exception rather than a PHP notice.
      if (empty($details['job_name'])) {
        throw new Exception("Must provide a 'job_name' to create a job.");
      }
      if (empty($details['modulename'])) {
        throw new Exception("Must provide a 'modulename' to create a job.");
      }
      if (empty($details['callback'])) {
        throw new Exception("Must provide a 'callback' to create a job.");
      }
      if (!is_bool($details['ignore_duplicate'])) {
        throw new Exception("Must provide either TRUE or FALSE for the ignore_duplicate option when creating a job.");
      }

      // Load the include files now so that the callback can be validated.
      $includes = $details['includes'];
      if ($includes and is_array($includes)) {
        foreach ($includes as $path) {
          if (empty($path)) {
            continue;
          }
          if (file_exists($path)) {
            require_once $path;
            continue;
          }
          // The path may be relative to the site root, so try that as well
          // and include the file from the location where it was found.
          $full_path = $_SERVER['DOCUMENT_ROOT'] . base_path() . $path;
          if (file_exists($full_path)) {
            require_once $full_path;
            continue;
          }
          throw new Exception("Included files for Tripal Job must exist. This path ($full_path) doesn't exist.");
        }
      }

      if (!function_exists($details['callback'])) {
        throw new Exception("Must provide a valid callback function to the tripal_add_job() function.");
      }
      if (!isset($details['uid']) or !is_numeric($details['uid'])) {
        throw new Exception("Must provide a numeric \$uid argument to the tripal_add_job() function.");
      }
      $priority = $details['priority'];
      if (!$priority or !is_numeric($priority) or $priority < 1 or $priority > 10) {
        throw new Exception("Must provide a numeric \$priority argument between 1 and 10 to the tripal_add_job() function.");
      }
      $arguments = isset($details['arguments']) ? $details['arguments'] : NULL;
      if (!is_array($arguments)) {
        throw new Exception("Must provide an array as the \$arguments argument to the tripal_add_job() function.");
      }

      // Convert the arguments into a string for storage in the database.
      $args = serialize($arguments);

      try {
        // Before inserting a new record, and if ignore_duplicate is TRUE then
        // check to see if a job with this name is already waiting to run.
        if ($details['ignore_duplicate'] === TRUE) {
          $query = db_select('tripal_jobs', 'tj');
          $query->fields('tj', array('job_id'));
          $query->condition('job_name', $details['job_name']);
          $query->isNull('start_time');
          $job_id = $query->execute()->fetchField();
          if ($job_id) {
            $this->load($job_id);
            return FALSE;
          }
        }

        $job_id = db_insert('tripal_jobs')
          ->fields(array(
            'job_name' => $details['job_name'],
            'modulename' => $details['modulename'],
            'callback' => $details['callback'],
            'status' => 'Waiting',
            'submit_date' => time(),
            'uid' => $details['uid'],
            'priority' => $priority,
            'arguments' => $args,
            'includes' => serialize($includes),
          ))
          ->execute();

        // Now load the job into this object.
        $this->load($job_id);
        return TRUE;
      }
      catch (Exception $e) {
        // Keep the original exception attached so the root cause is not lost.
        throw new Exception('Cannot create job: ' . $e->getMessage(), 0, $e);
      }
    }

    /**
     * Cancels the job and prevents it from running.
     *
     * Only a job that has not started can be cancelled. The record is marked
     * as 'Cancelled' with a progress of 0, both in the database and in this
     * object.
     *
     * @throws Exception
     *   If no job is loaded, if the job is running, completed, in an error
     *   state or already cancelled, or if the record cannot be written.
     */
    public function cancel() {
      if (!$this->job) {
        throw new Exception("There is no job associated with this object. Cannot cancel");
      }

      // Reasons why a job in a given state cannot be cancelled.
      $blocked = array(
        'Running' => "Job Cannot be cancelled it is currently running.",
        'Completed' => "Job Cannot be cancelled it has already finished.",
        'Error' => "Job Cannot be cancelled it is in an error state.",
        'Cancelled' => "Job Cannot be cancelled it is already cancelled.",
      );
      foreach ($blocked as $status => $reason) {
        if ($this->job->status == $status) {
          throw new Exception($reason);
        }
      }

      // Mark the job as cancelled, but only if it never started.
      try {
        if ($this->job->start_time == 0) {
          $record = new stdClass();
          $record->job_id = $this->job->job_id;
          $record->status = 'Cancelled';
          $record->progress = '0';
          drupal_write_record('tripal_jobs', $record, 'job_id');

          // Keep the in-memory record in step with the database.
          $this->job->status = 'Cancelled';
          $this->job->progress = '0';
        }
      }
      catch (Exception $e) {
        throw new Exception('Cannot cancel job: ' . $e->getMessage(), 0, $e);
      }
    }

    /**
     * Executes the job.
     *
     * Includes the files registered for the job, marks the job as 'Running',
     * invokes the callback and finally marks the job as 'Completed'. If the
     * callback throws an Exception the job is marked as 'Error' and a Drupal
     * error message is set; the exception is not re-thrown.
     *
     * @throws Exception
     *   If no job is associated with this object.
     */
    public function run() {
      $this->start_time = time();
      $this->progress_start_time = time();

      if (!$this->job) {
        throw new Exception('Cannot launch job as no job is associated with this object.');
      }

      try {
        // Include the necessary files needed to run the job.
        if (is_array($this->job->includes)) {
          foreach ($this->job->includes as $path) {
            if ($path) {
              require_once $path;
            }
          }
        }

        // Set the start time for this job.
        $record = new stdClass();
        $record->job_id = $this->job->job_id;
        $record->start_time = $this->start_time;
        $record->status = 'Running';
        $record->pid = getmypid();
        drupal_write_record('tripal_jobs', $record, 'job_id');

        // Callback functions need the job in order to update
        // progress. But prior to Tripal v3 the job callback functions
        // only accepted a $job_id as the final argument. So, we need
        // to see if the callback is Tv3 compatible or older. If older
        // we want to still support it and pass the job_id.
        $arguments = $this->job->arguments;
        $callback = $this->job->callback;
        $ref = new ReflectionFunction($callback);
        $refparams = $ref->getParameters();
        if (count($refparams) > 0) {
          $lastparam = $refparams[count($refparams) - 1];
          if ($lastparam->getName() == 'job_id') {
            $arguments[] = $this->job->job_id;
          }
          else {
            $arguments[] = $this;
          }
        }

        // Launch the job.
        call_user_func_array($callback, $arguments);

        // Set the end time for this job and store the log gathered by
        // logMessage() while the callback was running.
        $record = new stdClass();
        $record->job_id = $this->job->job_id;
        $record->end_time = time();
        $record->error_msg = $this->job->error_msg;
        $record->progress = 100;
        $record->status = 'Completed';
        $record->pid = '';
        drupal_write_record('tripal_jobs', $record, 'job_id');
        $this->load($this->job->job_id);
      }
      catch (Exception $e) {
        // Build a fresh record here rather than relying on one that may or
        // may not have been created inside the try block.
        $record = new stdClass();
        $record->job_id = $this->job->job_id;
        $record->end_time = time();
        $record->error_msg = $this->job->error_msg;
        $record->progress = $this->job->progress;
        $record->status = 'Error';
        $record->pid = '';
        drupal_write_record('tripal_jobs', $record, 'job_id');
        drupal_set_message('Job execution failed: ' . $e->getMessage(), 'error');
      }
    }

    /**
     * Indicates if the job is running.
     *
     * The check asks the operating system (via `ps`) whether a process with
     * the PID stored in the loaded job record exists.
     *
     * @throws Exception
     *   If no job is associated with this object.
     *
     * @return
     *   TRUE if the job is running, FALSE otherwise.
     */
    public function isRunning() {
      if (!$this->job) {
        throw new Exception('Cannot check running status as no job is associated with this object.');
      }

      // Without a PID there is no process to look for.
      if (!$this->job->pid) {
        return FALSE;
      }

      // `ps -o pid=` prints the PID when the process exists and nothing
      // otherwise.
      $status = shell_exec('ps -p ' . escapeshellarg($this->job->pid) . ' -o pid=');
      return trim((string) $status) !== '';
    }

    /**
     * Retrieve the job object as if from a database query.
     */
    public function getJob() {
      return $this->job;
    }

    /**
     * Retrieves the job ID.
     */
    public function getJobID() {
      return $this->job->job_id;
    }

    /**
     * Retrieves the user ID of the user that submitted the job.
     */
    public function getUID() {
      return $this->job->uid;
    }

    /**
     * Retrieves the job name.
     */
    public function getJobName() {
      return $this->job->job_name;
    }

    /**
     * Retrieves the name of the module that submitted the job.
     */
    public function getModuleName() {
      return $this->job->modulename;
    }

    /**
     * Retrieves the callback function for the job.
     */
    public function getCallback() {
      return $this->job->callback;
    }

    /**
     * Retrieves the array of arguments for the job.
     */
    public function getArguments() {
      return $this->job->arguments;
    }

    /**
     * Retrieves the current percent complete (i.e. progress) of the job.
     */
    public function getProgress() {
      return $this->job->progress;
    }

    /**
     * Sets the current percent complete of a job.
     *
     * The value is stored on the loaded record as given and written to the
     * database as an integer.
     *
     * @param $percent_done
     *   A value between 0 and 100 indicating the percentage complete of the
     *   job.
     *
     * @throws Exception
     *   If no job is associated with this object.
     */
    public function setProgress($percent_done) {
      if (!$this->job) {
        throw new Exception('Cannot set progress as no job is associated with this object.');
      }

      $this->job->progress = $percent_done;
      $progress = sprintf("%d", $percent_done);
      db_update('tripal_jobs')
        ->fields(array(
          'progress' => $progress,
        ))
        ->condition('job_id', $this->job->job_id)
        ->execute();
    }

    /**
     * Sets the total number of items to be processed.
     *
     * This should typically be called near the beginning of the loading
     * process to indicate the number of items that must be processed. It also
     * restarts the clock used for the reported duration and resets the
     * last-reported percentage so that a new phase starts reporting from 0.
     *
     * @param $total_items
     *   The total number of items to process.
     */
    public function setTotalItems($total_items) {
      $this->progress_start_time = time();
      $this->total_items = $total_items;
      $this->prev_update = 0;
    }

    /**
     * Adds to the count of the total number of items that have been handled.
     *
     * @param $num_handled
     *   The number of additional items handled since the last call.
     */
    public function addItemsHandled($num_handled) {
      $this->setItemsHandled($this->num_handled + $num_handled);
    }

    /**
     * Sets the number of items that have been processed.
     *
     * This should be called anytime the loader wants to indicate how many
     * items have been processed. The amount of progress will be
     * calculated using this number. If the progress has advanced by at least
     * the interval specified then the progress is printed and the job
     * progress is updated via setProgress().
     *
     * @param $total_handled
     *   The total number of items that have been processed.
     */
    public function setItemsHandled($total_handled) {
      // First set the number of items handled.
      $this->num_handled = $total_handled;

      if ($total_handled == 0) {
        // Starting (over): the next report is measured from 0% again.
        $this->prev_update = 0;
        $memory = number_format(memory_get_usage());
        print "Percent complete: 0%. Memory: " . $memory . " bytes.\r";
        return;
      }

      // A percentage cannot be calculated until setTotalItems() has been
      // called with a non-zero total.
      if (!$this->total_items) {
        return;
      }

      // Now see if we need to report to the user the percent done. A message
      // will be printed on the command-line if the job is run there.
      $percent = sprintf("%.2f", ($this->num_handled / $this->total_items) * 100);
      $diff = $percent - $this->prev_update;
      if ($diff >= $this->interval) {
        $duration = sprintf("%.2f", (time() - $this->progress_start_time) / 60);
        $fmemory = number_format(memory_get_usage());
        print "Percent complete: " . $percent . "%. Memory: " . $fmemory . " bytes. Duration: " . $duration . " mins\r";

        // Remember the percentage that was just reported so the next report
        // happens only after another full interval has passed.
        $this->prev_update = (float) $percent;
        $this->setProgress($percent);
      }
    }

    /**
     * Updates the percent interval when the job progress is updated.
     *
     * Updating the job progress incurs a database write which takes time and
     * if it occurs too frequently can slow down the loader. This should be a
     * value between 0 and 100 to indicate a percent interval (e.g. 1 means
     * update the progress every time the num_handled increases by 1%).
     *
     * @param $interval
     *   A number between 0 and 100.
     */
    public function setInterval($interval) {
      $this->interval = $interval;
    }

    /**
     * Retrieves the status of the job.
     */
    public function getStatus() {
      return $this->job->status;
    }

    /**
     * Retrieves the time the job was submitted.
     */
    public function getSubmitTime() {
      return $this->job->submit_date;
    }

    /**
     * Retrieves the time the job began execution (i.e. the start time).
     */
    public function getStartTime() {
      return $this->job->start_time;
    }

    /**
     * Retrieves the time the job completed execution (i.e. the end time).
     */
    public function getEndTime() {
      return $this->job->end_time;
    }

    /**
     * Retrieves the log for the job.
     *
     * @return
     *   A large string containing the text of the job log. It contains both
     *   status updates and errors.
     */
    public function getLog() {
      return $this->job->error_msg;
    }

    /**
     * Retrieves the process ID of the job.
     */
    public function getPID() {
      return $this->job->pid;
    }

    /**
     * Retrieves the priority that is currently set for the job.
     */
    public function getPriority() {
      return $this->job->priority;
    }

    /**
     * Get the MLock value of the job.
     *
     * The MLock value indicates if no other jobs from a given module
     * should be executed while this job is running.
     */
    public function getMLock() {
      return $this->job->mlock;
    }

    /**
     * Get the lock value of the job.
     *
     * The lock value indicates if no other jobs from any module
     * should be executed while this job is running.
     */
    public function getLock() {
      return $this->job->lock;
    }

    /**
     * Get the list of files that must be included prior to job execution.
     */
    public function getIncludes() {
      return $this->job->includes;
    }

    /**
     * Logs a message for the job.
     *
     * There is no distinction between status messages and error logs. Any
     * message that is intended for the user to review the status of the job
     * can be provided here.
     *
     * The translated message is printed to the terminal and appended to the
     * log held on the loaded job record; run() writes that log to the
     * database when the job ends. Messages that are of severity
     * TRIPAL_CRITICAL or TRIPAL_ERROR are also passed to
     * tripal_report_error() and set the in-memory job status to 'Error'.
     *
     * If a function can be executed by the Tripal job system (and hence the
     * job object is passed in) then you can directly use this function to
     * log messages. However, if the function can be run via drush on the
     * command-line, consider using the tripal_report_error() function which
     * can accept a job object as an $option and will print to both the
     * terminal and to the job object. If you use the tripal_report_error() be
     * sure to set the 'watchdog' option only if you need log messages also
     * going to the watchdog.
     *
     * @param $message
     *   The message to store in the log. Keep $message translatable by not
     *   concatenating dynamic values into it! Variables in the message should
     *   be added by using placeholder strings alongside the variables
     *   argument to declare the value of the placeholders. See t() for
     *   documentation on how $message and $variables interact.
     * @param $variables
     *   Array of variables to replace in the message on display.
     * @param $severity
     *   The severity of the message; one of the following values:
     *   - TRIPAL_CRITICAL: Critical conditions.
     *   - TRIPAL_ERROR: Error conditions.
     *   - TRIPAL_WARNING: Warning conditions.
     *   - TRIPAL_NOTICE: Normal but significant conditions.
     *   - TRIPAL_INFO: (default) Informational messages.
     *   - TRIPAL_DEBUG: Debug-level messages.
     *
     * @throws Exception
     *   If no job is associated with this object.
     */
    public function logMessage($message, $variables = array(), $severity = TRIPAL_INFO) {
      if (!$this->job) {
        throw new Exception('Cannot log a message as no job is associated with this object.');
      }

      // Generate a translated message.
      $tmessage = t($message, $variables);

      // For the sake of the command-line user, print the message to the
      // terminal.
      print $tmessage . "\n";

      // Add this message to the job's log.
      $this->job->error_msg .= "\n" . $tmessage;

      // Report this message to watchdog or set a message.
      if ($severity == TRIPAL_CRITICAL or $severity == TRIPAL_ERROR) {
        tripal_report_error('tripal_job', $severity, $message, $variables);
        $this->job->status = 'Error';
      }
    }

  }