jenkinsci · dbnicholson · Oct 31, 2019 · Oct 31, 2019 · res0nance · Nov 1, 2019
diff --git a/src/main/java/hudson/plugins/ec2/CloudHelper.java b/src/main/java/hudson/plugins/ec2/CloudHelper.java
@@ -16,11 +16,12 @@
 final class CloudHelper {
     private static final Logger LOGGER = LoggerFactory.getLogger(CloudHelper.class);
 
-    static Instance getInstanceWithRetry(String instanceId, EC2Cloud cloud) throws AmazonClientException, InterruptedException {
+    static Instance getInstanceWithRetry(String instanceId, EC2Cloud cloud, int timeout) throws AmazonClientException, InterruptedException {
         // Sometimes even after a successful RunInstances, DescribeInstances
         // returns an error for a few seconds. We do a few retries instead of
         // failing instantly. See [JENKINS-15319].
-        for (int i = 0; i < 5; i++) {
+        int waitCount = timeout / 5;
+        for (int i = 0; i < waitCount; i++) {
             try {
                 return getInstance(instanceId, cloud);
             } catch (AmazonServiceException e) {
@@ -36,6 +37,10 @@ static Instance getInstanceWithRetry(String instanceId, EC2Cloud cloud) throws A
         return getInstance(instanceId, cloud);
     }
 
+    static Instance getInstanceWithRetry(String instanceId, EC2Cloud cloud) throws AmazonClientException, InterruptedException { // Convenience overload for callers that do not pass a timeout.
+        return getInstanceWithRetry(instanceId, cloud, 25); // 25 / 5 = 5 loop iterations, the same bound the retry loop had before the timeout parameter was introduced.
+    }
+
     @CheckForNull
     static Instance getInstance(String instanceId, EC2Cloud cloud) throws AmazonClientException {
         if (StringUtils.isEmpty(instanceId) || cloud == null)

diff --git a/src/main/java/hudson/plugins/ec2/EC2AbstractSlave.java b/src/main/java/hudson/plugins/ec2/EC2AbstractSlave.java
@@ -162,7 +162,19 @@ public EC2AbstractSlave(String name, String instanceId, String templateDescripti
         this.amiType = amiType;
         this.maxTotalUses = maxTotalUses;
         readResolve();
-        fetchLiveInstanceData(true);
+        try {
+            // Wait up to 1 minute for the instance to show up
+            fetchLiveInstanceData(true, 60);
+        } catch (com.amazonaws.AmazonClientException e) {
+            /*
+             * If DescribeInstances didn't return any information about this
+             * instance, try to terminate it so that if it does come up later
+             * it doesn't affect capacity calculations.
+             */
+            LOGGER.log(Level.WARNING, "Failed to get instance data for new instance " + getInstanceId() + ", terminating");
+            terminateInstance();
+            throw e;
+        }
     }
 
     @Deprecated
@@ -541,7 +553,7 @@ protected boolean isAlive(boolean force) {
      * Much of the EC2 data is beyond our direct control, therefore we need to refresh it from time to time to ensure we
      * reflect the reality of the instances.
      */
-    private void fetchLiveInstanceData(boolean force) throws AmazonClientException {
+    private void fetchLiveInstanceData(boolean force, int timeout) throws AmazonClientException {
         /*
          * If we've grabbed the data recently, don't bother getting it again unless we are forced
          */
@@ -563,7 +575,7 @@ private void fetchLiveInstanceData(boolean force) throws AmazonClientException {
 
         Instance i = null;
         try {
-            i = CloudHelper.getInstanceWithRetry(getInstanceId(), getCloud());
+            i = CloudHelper.getInstanceWithRetry(getInstanceId(), getCloud(), timeout);
         } catch (InterruptedException e) {
             // We'll just retry next time we test for idleness.
             LOGGER.fine("InterruptedException while get " + getInstanceId()
@@ -594,6 +606,10 @@ private void fetchLiveInstanceData(boolean force) throws AmazonClientException {
         }
     }
 
+    private void fetchLiveInstanceData(boolean force) throws AmazonClientException { // Overload without an explicit timeout; keeps the original one-argument signature available.
+        fetchLiveInstanceData(force, 25); // 25 is forwarded as the timeout to CloudHelper.getInstanceWithRetry; presumably seconds (the constructor's 60 is commented as "1 minute") - TODO confirm.
+    }
+
     /*
      * Clears all existing tag data so that we can force the instance into a known state
      */