| #! /usr/bin/env python |
| # -*- coding: utf-8 -*- |
| |
| # COPYRIGHT NOTICE STARTS HERE |
| |
| # Copyright 2019 © Samsung Electronics Co., Ltd. |
| # |
| # Licensed under the Apache License, Version 2.0 (the "License"); |
| # you may not use this file except in compliance with the License. |
| # You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| |
| # COPYRIGHT NOTICE ENDS HERE |
| |
| import concurrent.futures |
| import logging |
| from abc import ABC, abstractmethod |
| |
| from downloader import AbstractDownloader |
| |
| log = logging.getLogger(__name__) |
| |
| |
class ConcurrentDownloader(AbstractDownloader, ABC):
    """
    Abstract downloader that processes its items in a thread pool.

    Subclasses implement ``_download_item``; ``download`` feeds every entry
    of ``self._missing`` to it through ``run_concurrent``.
    NOTE(review): ``_missing``, ``_list_type`` and ``_initial_log`` are not
    defined here - presumably provided by AbstractDownloader; confirm there.
    """

    def __init__(self, list_type, *list_args, workers=None):
        """
        :param list_type: forwarded unchanged to AbstractDownloader.__init__
        :param list_args: forwarded unchanged to AbstractDownloader.__init__
        :param workers: ``max_workers`` handed to ThreadPoolExecutor;
                        None leaves the choice to the executor
        """
        super().__init__(list_type, *list_args)
        self._workers = workers

    @abstractmethod
    def _download_item(self, item):
        """
        Download item from list
        :param item: item to be downloaded; ``download`` passes one element
                     of ``self._missing.items()``
        """

    def download(self):
        """
        Download images concurrently from data lists.

        Returns immediately when ``_initial_log()`` is falsy. Otherwise logs
        the remaining count after every successful item.
        :raises RuntimeError: when at least one item failed; the number of
                              items not downloaded is logged before re-raising
        """
        if not self._initial_log():
            return
        items_left = len(self._missing)
        try:
            for _ in self.run_concurrent(self._download_item, self._missing.items()):
                items_left -= 1
                log.info('{} {} left to download.'.format(items_left, self._list_type))
        except RuntimeError:
            log.error('{} {} were not downloaded.'.format(items_left, self._list_type))
            # Bare raise re-raises the active exception with its traceback
            # and cause untouched.
            raise

    def run_concurrent(self, fn, iterable, *args):
        """
        Run function concurrently for iterable

        This is a generator: nothing is submitted until iteration starts.
        It yields ``None`` once for every call that completed without an
        exception, in completion order.
        :param fn: function to run
        :param iterable: iterable to process
        :param args: arguments for function (fn)
        :raises RuntimeError: after all calls have completed, if any of them
                              raised; the first failure seen is attached as
                              ``__cause__`` and every failure is logged
        """
        with concurrent.futures.ThreadPoolExecutor(max_workers=self._workers) as executor:
            futures = [executor.submit(fn, item, *args) for item in iterable]
            first_error = None

            for future in concurrent.futures.as_completed(futures):
                error = future.exception()
                if error is None:
                    yield
                    continue
                # Previously the exception was dropped here, leaving no trace
                # of why a task failed. Log it with its traceback and keep
                # the first one to chain onto the summary error below.
                log.error('Concurrent task failed: %s', error,
                          exc_info=(type(error), error, error.__traceback__))
                if first_error is None:
                    first_error = error
            if first_error is not None:
                raise RuntimeError('One or more errors occurred') from first_error