From b2ce6023a2c361c373df67a8aebe3f96b7a2bd3a Mon Sep 17 00:00:00 2001 From: Marty Oehme Date: Thu, 11 Sep 2025 21:37:18 +0200 Subject: [PATCH] chore: Log found files for extractors to debug logger --- papis_extract/extractors/pdf.py | 7 ++++++- papis_extract/extractors/pocketbook.py | 12 +++++++----- papis_extract/extractors/readera.py | 2 +- 3 files changed, 14 insertions(+), 7 deletions(-) diff --git a/papis_extract/extractors/pdf.py b/papis_extract/extractors/pdf.py index 5df854e..3ba9873 100644 --- a/papis_extract/extractors/pdf.py +++ b/papis_extract/extractors/pdf.py @@ -25,7 +25,12 @@ class PdfExtractor: if not filename.is_file(): logger.error(f"File {str(filename)} not readable.") return False - return self._is_pdf(filename) + + if not self._is_pdf(filename): + return False + + logger.debug(f"Found processable annotation file: {filename}") + return True def run(self, filename: Path) -> list[Annotation]: """Extract annotations from a file. diff --git a/papis_extract/extractors/pocketbook.py b/papis_extract/extractors/pocketbook.py index 46ba66b..5fc0585 100644 --- a/papis_extract/extractors/pocketbook.py +++ b/papis_extract/extractors/pocketbook.py @@ -20,11 +20,13 @@ class PocketBookExtractor: return False html = BeautifulSoup(content, features="xml") - return bool( - html.find( - "meta", {"name": "generator", "content": "PocketBook Bookmarks Export"} - ) - ) + if not html.find( + "meta", {"name": "generator", "content": "PocketBook Bookmarks Export"} + ): + return False + + logger.debug(f"Found processable annotation file: {filename}") + return True def run(self, filename: Path) -> list[Annotation]: """Extract annotations from pocketbook html file. diff --git a/papis_extract/extractors/readera.py b/papis_extract/extractors/readera.py index b6159ff..d992512 100644 --- a/papis_extract/extractors/readera.py +++ b/papis_extract/extractors/readera.py @@ -37,7 +37,7 @@ class ReadEraExtractor: return False logger.debug( - f"Found annotation file processable with ReadEraExtractor: {filename}" + f"Found processable annotation file: {filename}" ) return True