From b1f70bb81890eeb7d8502e5273144cecdc92ed79 Mon Sep 17 00:00:00 2001 From: msramalho <19508417+msramalho@users.noreply.github.com> Date: Wed, 15 Jun 2022 17:14:08 +0200 Subject: [PATCH] minor improvements --- archivers/wayback_archiver.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/archivers/wayback_archiver.py b/archivers/wayback_archiver.py index 81c1644..f46d1cb 100644 --- a/archivers/wayback_archiver.py +++ b/archivers/wayback_archiver.py @@ -18,10 +18,12 @@ class WaybackArchiver(Archiver): def __init__(self, storage: Storage, driver, config: WaybackConfig): super(WaybackArchiver, self).__init__(storage, driver) self.config = config - # TODO: this logic should live at the auto-archiver level self.seen_urls = {} def download(self, url, check_if_exists=False): + if self.config is None: + logger.error('Missing Wayback config') + return False if check_if_exists: if url in self.seen_urls: return self.seen_urls[url] @@ -57,7 +59,7 @@ class WaybackArchiver(Archiver): retries += 1 if status_r.status_code != 200: - return ArchiveResult(status="Internet archive failed", screenshot=screenshot) + return ArchiveResult(status=f"Internet archive failed: check https://web.archive.org/save/status/{job_id}", screenshot=screenshot) status_json = status_r.json() if status_json['status'] != 'success':