Better exception handling during autohold

Our autohold can linger longer than we requested if we get an
exception during node iteration. Let's handle that particular
exception better, and also handle ANY exceptions that may bubble
up by deleting the autohold if that occurs.

Change-Id: I9d64995406e86cbad7536b85a3206fda7faac253

commit: f21bb2893ab6c1650ef896e9144b22d5177fe900 [log] [tgz]
author: David Shrewsbury <shrewsbury.dave@gmail.com> Fri Oct 13 11:10:00 2017 -0400
committer: David Shrewsbury <shrewsbury.dave@gmail.com> Fri Oct 13 11:26:45 2017 -0400
tree: b978ba423ade18afd64bec77e7463c44dd6547eb
parent: 76fc525d1449b54d4ab63a77c4ba0631ad9734c0 [diff]
diff --git a/zuul/scheduler.py b/zuul/scheduler.py
index cfcd865..bca62dc 100644
--- a/zuul/scheduler.py
+++ b/zuul/scheduler.py

@@ -855,8 +855,12 @@
             try:
                 self.nodepool.holdNodeSet(nodeset, autohold_key)
             except Exception:
-                self.log.exception("Unable to process autohold for %s",
+                self.log.exception("Unable to process autohold for %s:",
                                    autohold_key)
+                if autohold_key in self.autohold_requests:
+                    self.log.debug("Removing autohold %s due to exception",
+                                   autohold_key)
+                    del self.autohold_requests[autohold_key]
 
             self.nodepool.returnNodeSet(nodeset)
         except Exception:

diff --git a/zuul/zk.py b/zuul/zk.py
index 2fca749..ede78be 100644
--- a/zuul/zk.py
+++ b/zuul/zk.py

@@ -269,6 +269,9 @@
         for nodeid in nodes:
             node_path = '%s/%s' % (self.NODE_ROOT, nodeid)
             node_data, node_stat = self.client.get(node_path)
+            if not node_data:
+                self.log.warning("Node ID %s has no data", nodeid)
+                continue
             node_data = self._strToDict(node_data)
             if (node_data['state'] == zuul.model.STATE_HOLD and
                     node_data.get('hold_job') == identifier):
commit	f21bb2893ab6c1650ef896e9144b22d5177fe900	[log] [tgz]
author	David Shrewsbury <shrewsbury.dave@gmail.com>	Fri Oct 13 11:10:00 2017 -0400
committer	David Shrewsbury <shrewsbury.dave@gmail.com>	Fri Oct 13 11:26:45 2017 -0400
tree	b978ba423ade18afd64bec77e7463c44dd6547eb
parent	76fc525d1449b54d4ab63a77c4ba0631ad9734c0 [diff]