diff --git a/changedetectionio/processors/text_json_diff/processor.py b/changedetectionio/processors/text_json_diff/processor.py index 7845c897..60ec7753 100644 --- a/changedetectionio/processors/text_json_diff/processor.py +++ b/changedetectionio/processors/text_json_diff/processor.py @@ -227,7 +227,7 @@ class ContentProcessor: """Convert CDATA/comments in RSS to usable text.""" return cdata_in_document_to_text(html_content=content) - def preprocess_pdf(self, content, raw_content): + def preprocess_pdf(self, raw_content): """Convert PDF to HTML using external tool.""" from shutil import which tool = os.getenv("PDF_TO_HTML_TOOL", "pdftohtml") @@ -251,7 +251,7 @@ class ContentProcessor: metadata = ( f"
Added by changedetection.io: Document checksum - " f"{hashlib.md5(raw_content).hexdigest().upper()} " - f"Filesize - {len(html_content)} bytes
" + f"Original file size - {len(raw_content)} bytes" ) return html_content.replace('