blob: b20cb5adecf9bcb442648065be21604374627ce0 [file] [log] [blame]
#!/usr/bin/env python
import getopt
import logging
import os
import sys
import time
import random
from kubernetes import client
# extract env variables.
namespace = os.environ['NAMESPACE']
cert = os.environ['CERT']
host = os.environ['KUBERNETES_SERVICE_HOST']
token_path = os.environ['TOKEN']
with open(token_path, 'r') as token_file:
token = token_file.read().replace('\n', '')
# setup logging
log = logging.getLogger(__name__)
handler = logging.StreamHandler(sys.stdout)
handler.setFormatter(logging.Formatter('%(asctime)s - %(levelname)s - %(message)s'))
handler.setLevel(logging.INFO)
log.addHandler(handler)
log.setLevel(logging.INFO)
configuration = client.Configuration()
configuration.host = "https://" + host
configuration.ssl_ca_cert = cert
configuration.api_key['authorization'] = token
configuration.api_key_prefix['authorization'] = 'Bearer'
batchV1Api = client.BatchV1Api(client.ApiClient(configuration))
def is_job_complete(job_name):
complete = False
log.info("Checking if " + job_name + " is complete")
response = ""
try:
response = batchV1Api.read_namespaced_job_status(job_name, namespace)
if response.status.succeeded == 1:
job_status_type = response.status.conditions[0].type
if job_status_type == "Complete":
complete = True
else:
log.info(job_name + " is not complete")
else:
log.info(job_name + " has not succeeded yet")
return complete
except Exception as e:
log.error("Exception when calling read_namespaced_job_status: %s\n" % e)
DEF_TIMEOUT = 10
DESCRIPTION = "Kubernetes container job complete check utility"
USAGE = "Usage: job_complete.py [-t <timeout>] -j <job_name> [-j <job_name> ...]\n" \
"where\n" \
"<timeout> - wait for container job complete timeout in min, default is " + str(DEF_TIMEOUT) + "\n" \
"<job_name> - name of the job to wait for\n"
def main(argv):
# args are a list of job names
job_names = []
timeout = DEF_TIMEOUT
try:
opts, args = getopt.getopt(argv, "hj:t:", ["job-name=", "timeout=", "help"])
for opt, arg in opts:
if opt in ("-h", "--help"):
print("%s\n\n%s" % (DESCRIPTION, USAGE))
sys.exit()
elif opt in ("-j", "--job-name"):
job_names.append(arg)
elif opt in ("-t", "--timeout"):
timeout = float(arg)
except (getopt.GetoptError, ValueError) as e:
print("Error parsing input parameters: %s\n" % e)
print(USAGE)
sys.exit(2)
if job_names.__len__() == 0:
print("Missing required input parameter(s)\n")
print(USAGE)
sys.exit(2)
for job_name in job_names:
timeout = time.time() + timeout * 60
while True:
complete = is_job_complete(job_name)
if complete is True:
break
elif time.time() > timeout:
log.warning("timed out waiting for '" + job_name + "' to be completed")
exit(1)
else:
# spread in time potentially parallel execution in multiple containers
time.sleep(random.randint(5, 11))
if __name__ == "__main__":
main(sys.argv[1:])