Refactor http files download

Original download scripts got out of hand. This series of commits improves style of code (code duplicates, etc.) Issue-ID: OOM-1803 Change-Id: I7b82c1711d27fe450430fbe6d962a450301b0be0 Signed-off-by: Milan Verespej <m.verespej@partner.samsung.com>
author: Milan Verespej <m.verespej@partner.samsung.com> 2019-06-18 13:40:08 +0200
committer: Milan Verespej <m.verespej@partner.samsung.com> 2019-06-18 18:41:41 +0200
commit: 2e1328a8867190f203043fb5758dc8117ba3d673 (patch)
tree: 485de0595f1dcd275f8c7d9d14a1137bbe3e04f6 /build/download/concurrent_downloader.py
parent: f2f06700b7b9ad99c9c182fc01ee5cc0782ead78 (diff)
1 files changed, 77 insertions, 0 deletions
diff --git a/build/download/concurrent_downloader.py b/build/download/concurrent_downloader.py
new file mode 100644
index 00000000..c84dac86
--- /dev/null
+++ b/build/download/concurrent_downloader.py
@@ -0,0 +1,77 @@
+#! /usr/bin/env python
+# -*- coding: utf-8 -*-
+
+#   COPYRIGHT NOTICE STARTS HERE
+
+#   Copyright 2019 © Samsung Electronics Co., Ltd.
+#
+#   Licensed under the Apache License, Version 2.0 (the "License");
+#   you may not use this file except in compliance with the License.
+#   You may obtain a copy of the License at
+#
+#       http://www.apache.org/licenses/LICENSE-2.0
+#
+#   Unless required by applicable law or agreed to in writing, software
+#   distributed under the License is distributed on an "AS IS" BASIS,
+#   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#   See the License for the specific language governing permissions and
+#   limitations under the License.
+
+#   COPYRIGHT NOTICE ENDS HERE
+
+import concurrent.futures
+import logging
+from abc import ABC, abstractmethod
+
+from downloader import AbstractDownloader
+
+log = logging.getLogger(__name__)
+
+
+class ConcurrentDownloader(AbstractDownloader, ABC):
+    def __init__(self, list_type, *list_args, workers=None):
+        super().__init__(list_type, *list_args)
+        self._workers = workers
+
+    @abstractmethod
+    def _download_item(self, item):
+        """
+        Download item from list
+        :param item: item to be downloaded
+        """
+        pass
+
+    def download(self):
+        """
+        Download images concurrently from data lists.
+        """
+        if not self._initial_log():
+            return
+        items_left = len(self._missing)
+        try:
+            for _ in self.run_concurrent(self._download_item, self._missing.items()):
+                items_left -= 1
+                log.info('{} {} left to download.'.format(items_left, self._list_type))
+        except RuntimeError as err:
+            log.error('{} {} were not downloaded.'.format(items_left, self._list_type))
+            raise err
+
+    def run_concurrent(self, fn, iterable, *args):
+        """
+        Run function concurrently for iterable
+        :param fn: function to run
+        :param iterable: iterable to process
+        :param args: arguments for function (fn)
+        """
+        with concurrent.futures.ThreadPoolExecutor(max_workers=self._workers) as executor:
+            futures = [executor.submit(fn, item, *args) for item in iterable]
+            error_occurred = False
+
+            for future in concurrent.futures.as_completed(futures):
+                error = future.exception()
+                if error:
+                    error_occurred = True
+                else:
+                    yield
+            if error_occurred:
+                raise RuntimeError('One or more errors occurred')
author	Milan Verespej <m.verespej@partner.samsung.com>	2019-06-18 13:40:08 +0200
committer	Milan Verespej <m.verespej@partner.samsung.com>	2019-06-18 18:41:41 +0200
commit	2e1328a8867190f203043fb5758dc8117ba3d673 (patch)
tree	485de0595f1dcd275f8c7d9d14a1137bbe3e04f6 /build/download/concurrent_downloader.py
parent	f2f06700b7b9ad99c9c182fc01ee5cc0782ead78 (diff)