Add retry for salttimeout errors and ceph sporadic
Related-Prod:PROD-37137
Change-Id: I217d09db4be27e68f2bd7c23fd2e7dfbd253b857
diff --git a/tcp_tests/utils/run_jenkins_job.py b/tcp_tests/utils/run_jenkins_job.py
index bf3bb01..403cc00 100755
--- a/tcp_tests/utils/run_jenkins_job.py
+++ b/tcp_tests/utils/run_jenkins_job.py
@@ -127,24 +127,39 @@
if job_parameters is not None: # job_parameters = {}
job_params.update(job_parameters)
- build = jenkins.run_build(job_name,
- job_params,
- verbose=verbose,
- timeout=start_timeout)
- if verbose:
- print_build_header(build, job_params, build_timeout)
+ job_attempts = 2
+ count = 1
+ while (job_attempts != 0):
+ print('Attempt ' + str(count))
+ count += 1
+ job_attempts -= 1
+ build = jenkins.run_build(job_name,
+ job_params,
+ verbose=verbose,
+ timeout=start_timeout)
- try:
- jenkins.wait_end_of_build(
- name=build[0],
- build_id=build[1],
- timeout=build_timeout,
- interval=1,
- verbose=verbose,
- job_output_prefix=job_output_prefix)
- except Exception as e:
- print(str(e))
- raise
+ if verbose:
+ print_build_header(build, job_params, build_timeout)
+
+ try:
+ jenkins.wait_end_of_build(
+ name=build[0],
+ build_id=build[1],
+ timeout=build_timeout,
+ interval=1,
+ verbose=verbose,
+ job_output_prefix=job_output_prefix)
+ except Exception as e:
+ print(str(e))
+ raise
+ job_log = jenkins.get_build_output(job_name, build[1])
+ # Workaround for restart jobs that failed by salt-timeout errors
+ # or by sporadic fail in attach disks
+ if ('SaltReqTimeoutError' not in job_log and
+ 'not a block device' not in job_log):
+ break
+ else:
+ print('Job returns known infra fail!')
result = jenkins.build_info(name=build[0],
build_id=build[1])['result']