# Copyright 2015 gRPC authors. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Helpers to run docker instances as jobs.""" from __future__ import print_function import tempfile import time import uuid import os import subprocess import json import jobset _DEVNULL = open(os.devnull, 'w') def random_name(base_name): """Randomizes given base name.""" return '%s_%s' % (base_name, uuid.uuid4()) def docker_kill(cid): """Kills a docker container. Returns True if successful.""" return subprocess.call( ['docker', 'kill', str(cid)], stdin=subprocess.PIPE, stdout=_DEVNULL, stderr=subprocess.STDOUT) == 0 def docker_mapped_port(cid, port, timeout_seconds=15): """Get port mapped to internal given internal port for given container.""" started = time.time() while time.time() - started < timeout_seconds: try: output = subprocess.check_output( 'docker port %s %s' % (cid, port), stderr=_DEVNULL, shell=True) return int(output.split(':', 2)[1]) except subprocess.CalledProcessError as e: pass raise Exception('Failed to get exposed port %s for container %s.' % (port, cid)) def docker_ip_address(cid, timeout_seconds=15): """Get port mapped to internal given internal port for given container.""" started = time.time() while time.time() - started < timeout_seconds: cmd = 'docker inspect %s' % cid try: output = subprocess.check_output(cmd, stderr=_DEVNULL, shell=True) json_info = json.loads(output) assert len(json_info) == 1 out = json_info[0]['NetworkSettings']['IPAddress'] if not out: continue return out except subprocess.CalledProcessError as e: pass raise Exception( 'Non-retryable error: Failed to get ip address of container %s.' % cid) def wait_for_healthy(cid, shortname, timeout_seconds): """Wait timeout_seconds for the container to become healthy""" started = time.time() while time.time() - started < timeout_seconds: try: output = subprocess.check_output( [ 'docker', 'inspect', '--format="{{.State.Health.Status}}"', cid ], stderr=_DEVNULL) if output.strip('\n') == 'healthy': return except subprocess.CalledProcessError as e: pass time.sleep(1) raise Exception('Timed out waiting for %s (%s) to pass health check' % (shortname, cid)) def finish_jobs(jobs, suppress_failure=True): """Kills given docker containers and waits for corresponding jobs to finish""" for job in jobs: job.kill(suppress_failure=suppress_failure) while any(job.is_running() for job in jobs): time.sleep(1) def image_exists(image): """Returns True if given docker image exists.""" return subprocess.call( ['docker', 'inspect', image], stdin=subprocess.PIPE, stdout=_DEVNULL, stderr=subprocess.STDOUT) == 0 def remove_image(image, skip_nonexistent=False, max_retries=10): """Attempts to remove docker image with retries.""" if skip_nonexistent and not image_exists(image): return True for attempt in range(0, max_retries): if subprocess.call( ['docker', 'rmi', '-f', image], stdin=subprocess.PIPE, stdout=_DEVNULL, stderr=subprocess.STDOUT) == 0: return True time.sleep(2) print('Failed to remove docker image %s' % image) return False class DockerJob: """Encapsulates a job""" def __init__(self, spec): self._spec = spec self._job = jobset.Job( spec, newline_on_success=True, travis=True, add_env={}) self._container_name = spec.container_name def mapped_port(self, port): return docker_mapped_port(self._container_name, port) def ip_address(self): return docker_ip_address(self._container_name) def wait_for_healthy(self, timeout_seconds): wait_for_healthy(self._container_name, self._spec.shortname, timeout_seconds) def kill(self, suppress_failure=False): """Sends kill signal to the container.""" if suppress_failure: self._job.suppress_failure_message() return docker_kill(self._container_name) def is_running(self): """Polls a job and returns True if given job is still running.""" return self._job.state() == jobset._RUNNING