From 324c54fe46d6d58a9354a220cd2b4b8fb8bfeec0 Mon Sep 17 00:00:00 2001 From: Leigh Morresi <275001+dgtlmoon@users.noreply.github.com> Date: Fri, 29 Jan 2021 13:05:31 +0100 Subject: [PATCH] Use requests's r.text so we don't have to deal with charsets --- backend/fetch_site_status.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/backend/fetch_site_status.py b/backend/fetch_site_status.py index 8db63a25..a3759a6d 100644 --- a/backend/fetch_site_status.py +++ b/backend/fetch_site_status.py @@ -63,7 +63,7 @@ class perform_site_check(Thread): try: r = requests.get(self.url, headers=headers, timeout=15, verify=False) - stripped_text_from_html = html2text.html2text(r.content.decode('utf-8')) + stripped_text_from_html = html2text.html2text(r.text) # @todo This should be a config option. # Many websites include junk in the links, trackers, etc.. Since we are really a service all about text changes..