From 4a9608f31c247b5b1284844609703f3ea4f95423 Mon Sep 17 00:00:00 2001
From: "Antoine R. Dumont (@ardumont)" <antoine.romain.dumont@gmail.com>
Date: Mon, 2 Dec 2019 15:49:38 +0100
Subject: [PATCH] lister/tasks: Standardize return statements

The following commit adapts the return statements from both lister and their
associated tasks. This standardizes on what other modules (e.g. both dvcs and
package loaders) do.
---
 swh/lister/bitbucket/tasks.py          |  5 +++--
 swh/lister/cgit/lister.py              |  4 ++++
 swh/lister/cgit/tasks.py               |  2 +-
 swh/lister/core/indexing_lister.py     |  3 +++
 swh/lister/core/page_by_page_lister.py |  4 ++++
 swh/lister/core/simple_lister.py       |  5 +++++
 swh/lister/cran/tasks.py               |  2 +-
 swh/lister/debian/lister.py            | 12 +++++++-----
 swh/lister/debian/tasks.py             |  2 +-
 swh/lister/github/tasks.py             |  5 +++--
 swh/lister/gitlab/tasks.py             |  5 +++--
 swh/lister/gnu/tasks.py                |  4 ++--
 swh/lister/npm/tasks.py                |  4 ++--
 swh/lister/phabricator/tasks.py        |  4 ++--
 swh/lister/pypi/tasks.py               |  2 +-
 15 files changed, 42 insertions(+), 21 deletions(-)

diff --git a/swh/lister/bitbucket/tasks.py b/swh/lister/bitbucket/tasks.py
index 28b29d64..3b64de01 100644
--- a/swh/lister/bitbucket/tasks.py
+++ b/swh/lister/bitbucket/tasks.py
@@ -14,13 +14,13 @@ GROUP_SPLIT = 10000
 def list_bitbucket_incremental(**lister_args):
     '''Incremental update of the BitBucket forge'''
     lister = BitBucketLister(**lister_args)
-    lister.run(min_bound=lister.db_last_index(), max_bound=None)
+    return lister.run(min_bound=lister.db_last_index(), max_bound=None)
 
 
 @shared_task(name=__name__ + '.RangeBitBucketLister')
 def _range_bitbucket_lister(start, end, **lister_args):
     lister = BitBucketLister(**lister_args)
-    lister.run(min_bound=start, max_bound=end)
+    return lister.run(min_bound=start, max_bound=end)
 
 
 @shared_task(name=__name__ + '.FullBitBucketRelister', bind=True)
@@ -44,6 +44,7 @@ def list_bitbucket_full(self, split=None, **lister_args):
         promise.save()  # so that we can restore the GroupResult in tests
     except (NotImplementedError, AttributeError):
         self.log.info('Unable to call save_group with current result backend.')
+    # FIXME: what to do in terms of return here?
     return promise.id
 
 
diff --git a/swh/lister/cgit/lister.py b/swh/lister/cgit/lister.py
index 37464c08..a8da6c6a 100644
--- a/swh/lister/cgit/lister.py
+++ b/swh/lister/cgit/lister.py
@@ -78,6 +78,7 @@ class CGitLister(ListerBase):
         }
 
     def run(self):
+        status = 'uneventful'
         total = 0
         for repos in grouper(self.get_repos(), 10):
             models = list(filter(None, (self.build_model(repo)
@@ -87,6 +88,9 @@ class CGitLister(ListerBase):
             self.db_session.commit()
             total += len(injected_repos)
             logger.debug('Scheduled %s tasks for %s', total, self.url)
+            status = 'eventful'
+
+        return {'status': status}
 
     def get_repos(self):
         """Generate git 'project' URLs found on the current CGit server
diff --git a/swh/lister/cgit/tasks.py b/swh/lister/cgit/tasks.py
index 12952485..2d60e36d 100644
--- a/swh/lister/cgit/tasks.py
+++ b/swh/lister/cgit/tasks.py
@@ -10,7 +10,7 @@ from .lister import CGitLister
 @shared_task(name=__name__ + '.CGitListerTask')
 def list_cgit(**lister_args):
     '''Lister task for CGit instances'''
-    CGitLister(**lister_args).run()
+    return CGitLister(**lister_args).run()
 
 
 @shared_task(name=__name__ + '.ping')
diff --git a/swh/lister/core/indexing_lister.py b/swh/lister/core/indexing_lister.py
index 48be968c..2e7f3005 100644
--- a/swh/lister/core/indexing_lister.py
+++ b/swh/lister/core/indexing_lister.py
@@ -213,6 +213,7 @@ class IndexingLister(ListerBase):
         Returns:
             nothing
         """
+        status = 'uneventful'
         self.min_index = min_bound
         self.max_index = max_bound
 
@@ -243,9 +244,11 @@ class IndexingLister(ListerBase):
                 logger.debug('Flushing updates at index %s', i)
                 self.db_session.commit()
                 self.db_session = self.mk_session()
+                status = 'eventful'
 
         self.db_session.commit()
         self.db_session = self.mk_session()
+        return {'status': status}
 
 
 class IndexingHttpLister(ListerHttpTransport, IndexingLister):
diff --git a/swh/lister/core/page_by_page_lister.py b/swh/lister/core/page_by_page_lister.py
index 3d6d9c74..8bcce45c 100644
--- a/swh/lister/core/page_by_page_lister.py
+++ b/swh/lister/core/page_by_page_lister.py
@@ -110,6 +110,7 @@ class PageByPageLister(ListerBase):
             nothing
 
         """
+        status = 'uneventful'
         page = min_bound or 0
         loop_count = 0
 
@@ -127,6 +128,7 @@ class PageByPageLister(ListerBase):
             elif not injected_repos:
                 logging.info('Repositories already seen, stopping')
                 break
+            status = 'eventful'
 
             next_page = self.get_next_target_from_response(response)
 
@@ -149,6 +151,8 @@ class PageByPageLister(ListerBase):
         self.db_session.commit()
         self.db_session = self.mk_session()
 
+        return {'status': status}
+
 
 class PageByPageHttpLister(ListerHttpTransport, PageByPageLister):
     """Convenience class for ensuring right lookup and init order when
diff --git a/swh/lister/core/simple_lister.py b/swh/lister/core/simple_lister.py
index a355d9df..fa09ed88 100644
--- a/swh/lister/core/simple_lister.py
+++ b/swh/lister/core/simple_lister.py
@@ -89,3 +89,8 @@ class SimpleLister(ListerBase):
         response, injected_repos = self.ingest_data(dump_not_used_identifier)
         if not response and not injected_repos:
             logging.info('No response from api server, stopping')
+            status = 'uneventful'
+        else:
+            status = 'eventful'
+
+        return {'status': status}
diff --git a/swh/lister/cran/tasks.py b/swh/lister/cran/tasks.py
index 6802619f..74eef746 100644
--- a/swh/lister/cran/tasks.py
+++ b/swh/lister/cran/tasks.py
@@ -10,7 +10,7 @@ from swh.lister.cran.lister import CRANLister
 @shared_task(name=__name__ + '.CRANListerTask')
 def list_cran(**lister_args):
     '''Lister task for the CRAN registry'''
-    CRANLister(**lister_args).run()
+    return CRANLister(**lister_args).run()
 
 
 @shared_task(name=__name__ + '.ping')
diff --git a/swh/lister/debian/lister.py b/swh/lister/debian/lister.py
index cc9ecd38..ef9853be 100644
--- a/swh/lister/debian/lister.py
+++ b/swh/lister/debian/lister.py
@@ -216,12 +216,14 @@ class DebianLister(ListerHttpTransport, ListerBase):
                            .one_or_none()
 
         if not distribution:
-            raise ValueError("Distribution %s is not registered" %
-                             self.distribution)
+            logger.error("Distribution %s is not registered" %
+                         self.distribution)
+            return {'status': 'failed'}
 
         if not distribution.type == 'deb':
-            raise ValueError("Distribution %s is not a Debian derivative" %
-                             distribution)
+            logger.error("Distribution %s is not a Debian derivative" %
+                         distribution)
+            return {'status': 'failed'}
 
         date = self.date
 
@@ -250,4 +252,4 @@ class DebianLister(ListerHttpTransport, ListerBase):
 
         self.db_session.commit()
 
-        return True
+        return {'status': 'eventful'}
diff --git a/swh/lister/debian/tasks.py b/swh/lister/debian/tasks.py
index d542d04c..04d12977 100644
--- a/swh/lister/debian/tasks.py
+++ b/swh/lister/debian/tasks.py
@@ -10,7 +10,7 @@ from .lister import DebianLister
 @shared_task(name=__name__ + '.DebianListerTask')
 def list_debian_distribution(distribution, **lister_args):
     '''List a Debian distribution'''
-    DebianLister(distribution=distribution, **lister_args).run()
+    return DebianLister(distribution=distribution, **lister_args).run()
 
 
 @shared_task(name=__name__ + '.ping')
diff --git a/swh/lister/github/tasks.py b/swh/lister/github/tasks.py
index 207ddf9d..1b9f37e7 100644
--- a/swh/lister/github/tasks.py
+++ b/swh/lister/github/tasks.py
@@ -15,13 +15,13 @@ GROUP_SPLIT = 10000
 def list_github_incremental(**lister_args):
     'Incremental update of GitHub'
     lister = GitHubLister(**lister_args)
-    lister.run(min_bound=lister.db_last_index(), max_bound=None)
+    return lister.run(min_bound=lister.db_last_index(), max_bound=None)
 
 
 @shared_task(name=__name__ + '.RangeGitHubLister')
 def _range_github_lister(start, end, **lister_args):
     lister = GitHubLister(**lister_args)
-    lister.run(min_bound=start, max_bound=end)
+    return lister.run(min_bound=start, max_bound=end)
 
 
 @shared_task(name=__name__ + '.FullGitHubRelister', bind=True)
@@ -44,6 +44,7 @@ def list_github_full(self, split=None, **lister_args):
         promise.save()  # so that we can restore the GroupResult in tests
     except (NotImplementedError, AttributeError):
         self.log.info('Unable to call save_group with current result backend.')
+    # FIXME: what to do in terms of return here?
     return promise.id
 
 
diff --git a/swh/lister/gitlab/tasks.py b/swh/lister/gitlab/tasks.py
index bdb23cd9..e6a17552 100644
--- a/swh/lister/gitlab/tasks.py
+++ b/swh/lister/gitlab/tasks.py
@@ -20,13 +20,13 @@ def list_gitlab_incremental(**lister_args):
     lister = GitLabLister(**lister_args)
     total_pages = lister.get_pages_information()[1]
     # stopping as soon as existing origins for that instance are detected
-    lister.run(min_bound=1, max_bound=total_pages, check_existence=True)
+    return lister.run(min_bound=1, max_bound=total_pages, check_existence=True)
 
 
 @shared_task(name=__name__ + '.RangeGitLabLister')
 def _range_gitlab_lister(start, end, **lister_args):
     lister = GitLabLister(**lister_args)
-    lister.run(min_bound=start, max_bound=end)
+    return lister.run(min_bound=start, max_bound=end)
 
 
 @shared_task(name=__name__ + '.FullGitLabRelister', bind=True)
@@ -43,6 +43,7 @@ def list_gitlab_full(self, **lister_args):
         promise.save()
     except (NotImplementedError, AttributeError):
         self.log.info('Unable to call save_group with current result backend.')
+    # FIXME: what to do in terms of return here?
     return promise.id
 
 
diff --git a/swh/lister/gnu/tasks.py b/swh/lister/gnu/tasks.py
index 1eb70612..edcde7e3 100644
--- a/swh/lister/gnu/tasks.py
+++ b/swh/lister/gnu/tasks.py
@@ -9,8 +9,8 @@ from .lister import GNULister
 
 @shared_task(name=__name__ + '.GNUListerTask')
 def list_gnu_full(**lister_args):
-    'List lister for the GNU source code archive'
-    GNULister(**lister_args).run()
+    """List lister for the GNU source code archive"""
+    return GNULister(**lister_args).run()
 
 
 @shared_task(name=__name__ + '.ping')
diff --git a/swh/lister/npm/tasks.py b/swh/lister/npm/tasks.py
index 94b991b1..1e4a51ca 100644
--- a/swh/lister/npm/tasks.py
+++ b/swh/lister/npm/tasks.py
@@ -45,7 +45,7 @@ def list_npm_full(**lister_args):
     'Full lister for the npm (javascript) registry'
     lister = NpmLister(**lister_args)
     with save_registry_state(lister):
-        lister.run()
+        return lister.run()
 
 
 @shared_task(name=__name__ + '.NpmIncrementalListerTask')
@@ -54,7 +54,7 @@ def list_npm_incremental(**lister_args):
     lister = NpmIncrementalLister(**lister_args)
     update_seq_start = get_last_update_seq(lister)
     with save_registry_state(lister):
-        lister.run(min_bound=update_seq_start)
+        return lister.run(min_bound=update_seq_start)
 
 
 @shared_task(name=__name__ + '.ping')
diff --git a/swh/lister/phabricator/tasks.py b/swh/lister/phabricator/tasks.py
index 361feddb..614f4f2a 100644
--- a/swh/lister/phabricator/tasks.py
+++ b/swh/lister/phabricator/tasks.py
@@ -9,8 +9,8 @@ from swh.lister.phabricator.lister import PhabricatorLister
 
 @shared_task(name=__name__ + '.FullPhabricatorLister')
 def list_phabricator_full(**lister_args):
-    'Full update of a Phabricator instance'
-    PhabricatorLister(**lister_args).run()
+    """Full update of a Phabricator instance"""
+    return PhabricatorLister(**lister_args).run()
 
 
 @shared_task(name=__name__ + '.ping')
diff --git a/swh/lister/pypi/tasks.py b/swh/lister/pypi/tasks.py
index 2412f26c..b59e6b0f 100644
--- a/swh/lister/pypi/tasks.py
+++ b/swh/lister/pypi/tasks.py
@@ -10,7 +10,7 @@ from .lister import PyPILister
 @shared_task(name=__name__ + '.PyPIListerTask')
 def list_pypi(**lister_args):
     'Full update of the PyPI (python) registry'
-    PyPILister(**lister_args).run()
+    return PyPILister(**lister_args).run()
 
 
 @shared_task(name=__name__ + '.ping')
-- 
GitLab