From c01a3433271be59bd1920a49fe1f3390e6045cc0 Mon Sep 17 00:00:00 2001
From: Jessica Severin <jessica@ebi.ac.uk>
Date: Tue, 9 Aug 2005 16:04:49 +0000
Subject: [PATCH] added code to catch an exception at the job level, reset/fail
 that job yet allow the worker to continue working.  Previous design killed
 the worker when one of it's jobs fails.  This new design should be more
 efficient yet still provide some level of inter-job-mangle-proof-ness.

---
 modules/Bio/EnsEMBL/Hive/Worker.pm | 22 ++++++++++++++--------
 1 file changed, 14 insertions(+), 8 deletions(-)

diff --git a/modules/Bio/EnsEMBL/Hive/Worker.pm b/modules/Bio/EnsEMBL/Hive/Worker.pm
index 24f254f4a..35e9ba30d 100755
--- a/modules/Bio/EnsEMBL/Hive/Worker.pm
+++ b/modules/Bio/EnsEMBL/Hive/Worker.pm
@@ -418,15 +418,21 @@ sub run
     }
     
     foreach my $job (@{$jobs}) {
-    
-      $self->redirect_job_output($job);
-      $self->run_module_with_job($job);
-      $self->close_and_update_job_output($job);      
-            
-      $self->queen->worker_register_job_done($self, $job);
-
-      $self->{'_work_done'}++;
+      eval {
+        $self->redirect_job_output($job);
+        $self->run_module_with_job($job);
+        $self->close_and_update_job_output($job);      
+              
+        $self->queen->worker_register_job_done($self, $job);
+        $self->work_done($self->work_done + 1);
+      };
+      if($@) {
+        #job threw an exception so it had a problem
+        printf("job %d failed with exception: $@\n", $job->dbID);
+        $self->queen->db->get_AnalysisJobAdaptor->reset_dead_job_by_dbID($job->dbID);
+      }
     }
+    
     my $batch_end = time() * 1000;
     #printf("batch start:%f end:%f\n", $batch_start, $batch_end);
     $self->db->get_AnalysisStatsAdaptor->
-- 
GitLab