container_manage: introduce create_retries and exec_retries vars

tripleo_container_manage_create_retries and
tripleo_container_manage_exec_retries (both default to 60) will allow a
timeout of 10 minutes for both podman exec and podman run commands.

Indeed, some containers (db-sync or when puppet runs) can take up to 10
minutes to execute and finish.

Change-Id: Iff752cd124546bdd7cf857b0dacfc7d33b9a71a6
This commit is contained in:
Emilien Macchi 2020-05-01 10:57:41 -04:00
parent 6cab1448db
commit 5a54d57fda
3 changed files with 8 additions and 2 deletions

View File

@ -26,6 +26,12 @@ tripleo_container_manage_config_id: tripleo
tripleo_container_manage_config_overrides: {}
tripleo_container_manage_config_patterns: '*.json'
tripleo_container_manage_debug: false
# Some containers in which Puppet runs can take up to 10 minutes to finish
# in slow environments.
tripleo_container_manage_create_retries: 60
# The default delay is 10s, so 60 retries give a timeout of 10 minutes, which
# we have observed to be necessary for nova and neutron db-sync execs.
tripleo_container_manage_exec_retries: 60
tripleo_container_manage_healthcheck_disabled: false
tripleo_container_manage_log_path: '/var/log/containers/stdouts'
tripleo_container_manage_systemd_order: false

View File

@ -91,7 +91,7 @@
loop_var: "create_async_result_item"
register: create_async_poll_results
until: create_async_poll_results.finished
retries: 60
retries: "{{ tripleo_container_manage_create_retries }}"
# We fail later if a container has failed to start
failed_when: false
when:

View File

@ -42,7 +42,7 @@
loop_var: "exec_async_result_item"
register: exec_async_poll_results
until: exec_async_poll_results.finished
retries: 30
retries: "{{ tripleo_container_manage_exec_retries }}"
when: not ansible_check_mode|bool
- name: Block for container commands