From dd4e372703105edc202d38b67496435b54a21c7d Mon Sep 17 00:00:00 2001 From: msramalho <19508417+msramalho@users.noreply.github.com> Date: Mon, 2 Jun 2025 19:33:53 +0100 Subject: [PATCH] use ffmpeg -bitexact to reduce duplicate content storing --- .../modules/generic_extractor/generic_extractor.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/auto_archiver/modules/generic_extractor/generic_extractor.py b/src/auto_archiver/modules/generic_extractor/generic_extractor.py index 2941270..9a75352 100644 --- a/src/auto_archiver/modules/generic_extractor/generic_extractor.py +++ b/src/auto_archiver/modules/generic_extractor/generic_extractor.py @@ -394,12 +394,13 @@ class GenericExtractor(Extractor): for entry in entries: try: filename = _helper_get_filename(entry) - logger.warning(f"Using filename {filename} for entry {entry.get('id', 'unknown')}") if not filename or not os.path.exists(filename): # file was not downloaded or could not be retrieved, example: sensitive videos on YT without using cookies. continue + logger.debug(f"Using filename {filename} for entry {entry.get('id', 'unknown')}") + new_media = Media(filename) for x in ["duration", "original_url", "fulltitle", "description", "upload_date"]: if x in entry: @@ -551,6 +552,7 @@ class GenericExtractor(Extractor): "--write-subs" if self.subtitles else "--no-write-subs", "--write-auto-subs" if self.subtitles else "--no-write-auto-subs", "--live-from-start" if self.live_from_start else "--no-live-from-start", + "--postprocessor-args", "ffmpeg:-bitexact" # ensure bitexact output to avoid mismatching hashes for same video ] # proxy handling