From 29f15bb14c9edd0bd1a4f485a299a3329a62c87b Mon Sep 17 00:00:00 2001 From: Clark Boylan Date: Tue, 24 Sep 2024 15:25:56 -0700 Subject: [PATCH] Set launch-timeout on nodepool providers The nodepool openstack provider implementation has a launch timeout default of 3600 seconds (one hour). This is problematic for us because a node request will be attempted three times by a provider before being passed on to the next provider. This means we may wait up to three hours per failed provider to launch a single node. Fix this by setting a timeout of 10 minutes on the three providers that didn't already set a lower timeout (raxflex and the two vexxhost providers). Looking at the grafana graphs for time to ready, this should be plenty of time under normal booting conditions, and it reduces the time we may wait from 3 hours per provider to 30 minutes. Change-Id: I0a4af9f5519ff2b64c737b1822590fbb2608e8bb --- nodepool/nl01.opendev.org.yaml | 1 + nodepool/nl03.opendev.org.yaml | 2 ++ 2 files changed, 3 insertions(+) diff --git a/nodepool/nl01.opendev.org.yaml b/nodepool/nl01.opendev.org.yaml index cfe47552c7..c1caad9f40 100644 --- a/nodepool/nl01.opendev.org.yaml +++ b/nodepool/nl01.opendev.org.yaml @@ -198,6 +198,7 @@ providers: # It should be changed carefully. cloud: raxflex boot-timeout: 120 + launch-timeout: 600 diskimages: *provider_diskimages pools: - name: main diff --git a/nodepool/nl03.opendev.org.yaml b/nodepool/nl03.opendev.org.yaml index 6b91faa9fd..fa2f4e0b74 100644 --- a/nodepool/nl03.opendev.org.yaml +++ b/nodepool/nl03.opendev.org.yaml @@ -107,6 +107,7 @@ providers: # It should be changed carefully. cloud: vexxhost boot-timeout: 120 + launch-timeout: 600 rate: 0.001 diskimages: &provider_diskimages - name: centos-9-stream @@ -214,6 +215,7 @@ providers: # It should be changed carefully. cloud: vexxhost boot-timeout: 120 + launch-timeout: 600 rate: 0.001 diskimages: *provider_diskimages pools: