Skip to content

Commit

Permalink
Make AnsibleTower checkout/execute actions more resilient
Browse files Browse the repository at this point in the history
We've been seeing some issues with service interruptions in AAP under
high load. While the jobs do complete successfully, awxkit bails when
encountering the connection issue.
With this change, we simply enter a retry loop when monitoring job
status.
  • Loading branch information
JacobCallahan committed Jan 14, 2025
1 parent d0b1192 commit 4d1453f
Showing 1 changed file with 15 additions and 1 deletion.
16 changes: 15 additions & 1 deletion broker/providers/ansible_tower.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@
import click
from dynaconf import Validator
from logzero import logger
from requests.exceptions import ConnectionError

from broker import exceptions
from broker.helpers import eval_filter, find_origin, yaml
Expand Down Expand Up @@ -41,6 +42,19 @@ def convert_pseudonamespaces(attr_dict):
return out_dict


def resilient_job_wait(job, timeout=None, max_retries=None, retry_delay=5):
    """Wait for a job to complete, retrying when the connection drops.

    Calls ``job.wait_until_completed`` and, if it raises ``ConnectionError``,
    logs the failure and waits again. Each retry restarts the wait with the
    full ``timeout``.

    Args:
        job: Object exposing ``wait_until_completed(timeout=...)``.
        timeout: Timeout passed to each wait call. Falls back to
            ``settings.ANSIBLETOWER.workflow_timeout`` when falsy.
        max_retries: Maximum number of retries after the first attempt.
            ``None`` (the default) retries indefinitely.
        retry_delay: Seconds to pause before each retry, so that an already
            struggling server is not polled in a tight loop. A falsy value
            disables the pause.

    Raises:
        ConnectionError: If ``max_retries`` is set and has been exhausted.
    """
    # Imported locally so this helper does not depend on a module-level import.
    import time

    timeout = timeout or settings.ANSIBLETOWER.workflow_timeout
    retries = 0
    while True:
        try:
            job.wait_until_completed(timeout=timeout)
        except ConnectionError as err:
            logger.error(f"Error occurred while waiting for job: {err}")
            if max_retries is not None and retries >= max_retries:
                # Retry budget spent: surface the original connection error.
                raise
            retries += 1
            logger.info("Retrying job wait...")
            if retry_delay:
                time.sleep(retry_delay)
        else:
            # The wait returned without a connection error; we are done.
            return


class JobExecutionError(exceptions.ProviderError):
"""Raised when a job execution fails."""

Expand Down Expand Up @@ -605,7 +619,7 @@ def execute(self, **kwargs): # noqa: PLR0912,PLR0915 - Possible TODO refactor
job_ui_url = url_parser.urljoin(self.url, f"/#/{subject}s/{job_number}")
helpers.emit(api_url=job_api_url, ui_url=job_ui_url)
logger.info(f"Waiting for job: \nAPI: {job_api_url}\nUI: {job_ui_url}")
job.wait_until_completed(timeout=settings.ANSIBLETOWER.workflow_timeout)
resilient_job_wait(job)
if job.status != "successful":
message_data = {
f"{subject.capitalize()} Status": job.status,
Expand Down

0 comments on commit 4d1453f

Please sign in to comment.