0.42.2

UI - Configurable pager size #1599 #1598
Fetcher - Ability to specify headers from a textfile per watch, global or per tag ( https://github.com/dgtlmoon/changedetection.io/wiki/Adding-headers-from-an-external-file )
2025-11-17 15:06:11 +00:00 · 2023-05-25 16:47:30 +02:00 · 2023-05-25 16:38:54 +02:00 · 2023-05-22 17:19:52 +02:00 · 2023-05-21 23:10:39 +02:00 · 2023-05-21 23:10:08 +02:00
13 changed files with 194 additions and 24 deletions
--- a/README.md
+++ b/README.md
@@ -66,6 +66,7 @@ Requires Playwright to be enabled.
 - Proactively search for jobs, get notified when companies update their careers page, search job portals for keywords.
 - Get alerts when new job positions are open on Bamboo HR and other job platforms
 - Website defacement monitoring
 - Pokémon Card Restock Tracker / Pokémon TCG Tracker
 _Need an actual Chrome runner with JavaScript support? We support fetching via WebDriver and Playwright!_
--- a/changedetectionio/init.py
+++ b/changedetectionio/init.py
@@ -38,7 +38,7 @@ from flask_paginate import Pagination, get_page_parameter
 from changedetectionio import html_tools
 from changedetectionio.api import api_v1
-__version__ = '0.42.1'
+__version__ = '0.42.2'
 datastore = None
@@ -124,6 +124,15 @@ def _jinja2_filter_datetimestamp(timestamp, format="%Y-%m-%d %H:%M:%S"):
    return timeago.format(timestamp, time.time())
@app.template_filter('pagination_slice')
 def _jinja2_filter_pagination_slice(arr, skip):
     """Jinja2 filter: return the part of ``arr`` that belongs on the current page.

     ``skip`` is the offset of the first item to show. The page length is read
     from the ``pager_size`` application setting (50 when the key is absent).
     A falsy page length (``0`` or ``None``) disables paging, in which case
     ``arr`` is returned unchanged.
     """
     app_settings = datastore.data['settings']['application']
     page_len = app_settings.get('pager_size', 50)

     # Guard clause: no usable page length means "show everything"
     if not page_len:
         return arr

     return arr[skip:skip + page_len]
@app.template_filter('format_seconds_ago')
 def _jinja2_filter_seconds_precise(timestamp):
    if timestamp == False:
@@ -432,7 +441,11 @@ def changedetection_app(config=None, datastore_o=None):
        form = forms.quickWatchForm(request.form)
        page = request.args.get(get_page_parameter(), type=int, default=1)
        total_count = len(sorted_watches)
-        pagination = Pagination(page=page, total=total_count, per_page=int(os.getenv('pagination_per_page', 50)), css_framework = "semantic")
+
        pagination = Pagination(page=page,
                                total=total_count,
                                per_page=datastore.data['settings']['application'].get('pager_size', 50), css_framework="semantic")
        output = render_template(
            "watch-overview.html",
@@ -700,6 +713,7 @@ def changedetection_app(config=None, datastore_o=None):
                                     form=form,
                                     has_default_notification_urls=True if len(datastore.data['settings']['application']['notification_urls']) else False,
                                     has_empty_checktime=using_default_check_time,
                                     has_extra_headers_file=watch.has_extra_headers_file or datastore.has_extra_headers_file,
                                     is_html_webdriver=is_html_webdriver,
                                     jq_support=jq_support,
                                     playwright_enabled=os.getenv('PLAYWRIGHT_DRIVER_URL', False),
@@ -1444,6 +1458,7 @@ def check_for_new_version():
        # Check daily
        app.config.exit.wait(86400)
 def notification_runner():
    global notification_debug_log
    from datetime import datetime
--- a/changedetectionio/content_fetcher.py
+++ b/changedetectionio/content_fetcher.py
@@ -384,6 +384,7 @@ class base_html_playwright(Fetcher):
                self.headers = x.get('headers')
                self.instock_data = x.get('instock_data')
                self.screenshot = base64.b64decode(x.get('screenshot'))
                self.status_code = x.get('status_code')
                self.xpath_data = x.get('xpath_data')
            else:
--- a/changedetectionio/forms.py
+++ b/changedetectionio/forms.py
@@ -481,6 +481,10 @@ class globalSettingsApplicationForm(commonSettingsForm):
    global_subtractive_selectors = StringListField('Remove elements', [ValidateCSSJSONXPATHInput(allow_xpath=False, allow_json=False)])
    ignore_whitespace = BooleanField('Ignore whitespace')
    password = SaltyPasswordField()
    pager_size = IntegerField('Pager size',
                              render_kw={"style": "width: 5em;"},
                              validators=[validators.NumberRange(min=0,
                                                                 message="Should be atleast zero (disabled)")])
    removepassword_button = SubmitField('Remove password', render_kw={"class": "pure-button pure-button-primary"})
    render_anchor_tag_content = BooleanField('Render anchor tag content', default=False)
    shared_diff_access = BooleanField('Allow access to view diff page when password is enabled', default=False, validators=[validators.Optional()])
--- a/changedetectionio/model/App.py
+++ b/changedetectionio/model/App.py
@@ -23,25 +23,26 @@ class model(dict):
                    'workers': int(getenv("DEFAULT_SETTINGS_REQUESTS_WORKERS", "10")),  # Number of threads, lower is better for slow connections
                },
                'application': {
                    # Custom notification content
                    'api_access_token_enabled': True,
                    'password': False,
                    'base_url' : None,
                    'extract_title_as_title': False,
                    'empty_pages_are_a_change': False,
                    'extract_title_as_title': False,
                    'fetch_backend': getenv("DEFAULT_FETCH_BACKEND", "html_requests"),
                    'filter_failure_notification_threshold_attempts': _FILTER_FAILURE_THRESHOLD_ATTEMPTS_DEFAULT,
                    'global_ignore_text': [], # List of text to ignore when calculating the comparison checksum
                    'global_subtractive_selectors': [],
                    'ignore_whitespace': True,
                    'render_anchor_tag_content': False,
                    'notification_urls': [], # Apprise URL list
                    # Custom notification content
                    'notification_title': default_notification_title,
                    'notification_body': default_notification_body,
                    'notification_format': default_notification_format,
                    'notification_title': default_notification_title,
                    'notification_urls': [], # Apprise URL list
                    'pager_size': 50,
                    'password': False,
                    'render_anchor_tag_content': False,
                    'schema_version' : 0,
                    'shared_diff_access': False,
-                    'webdriver_delay': None  # Extra delay in seconds before extracting text
+                    'webdriver_delay': None , # Extra delay in seconds before extracting text
                }
            }
        }
@@ -49,3 +50,15 @@ class model(dict):
    def __init__(self, *arg, **kw):
        """Initialise the mapping, then overlay the class-level ``base_config``.

        Positional and keyword arguments are forwarded to the parent
        initialiser. ``base_config`` is merged in afterwards with ``update``,
        so its top-level keys replace any same-named keys supplied by the
        caller.
        """
        super().__init__(*arg, **kw)
        self.update(self.base_config)
 def parse_headers_from_text_file(filepath):
     """Parse a plain-text file of ``Name: value`` lines into a headers dict.

     Blank lines, lines starting with ``#`` and lines without a colon are
     skipped. Only the FIRST colon separates the name from the value, so
     values that contain colons themselves (URLs, ``host:port``, timestamps)
     are kept intact instead of raising ``ValueError``. Name and value are
     stripped of surrounding whitespace; when a name appears more than once
     the last occurrence wins.

     :param filepath: Path of the text file to read.
     :return: dict mapping header name to header value.
     :raises OSError: if the file cannot be opened.
     """
     headers = {}
     with open(filepath, 'r') as f:
         # Iterate the file object directly; no need to load every line first
         for raw_line in f:
             line = raw_line.strip()
             if line.startswith('#') or ':' not in line:
                 continue
             # partition() splits on the first colon only
             name, _, value = line.partition(':')
             headers[name.strip()] = value.strip()
     return headers
--- a/changedetectionio/model/Watch.py
+++ b/changedetectionio/model/Watch.py
@@ -473,6 +473,40 @@ class model(dict):
        # None is set
        return False
    @property
    def has_extra_headers_file(self):
        """True when a headers file exists for this watch or for any of its tags.

        Checks ``headers.txt`` in the watch data directory first, then one
        ``headers-<tag>.txt`` per tag in the datastore directory, where the tag
        is lower-cased with non-word characters and underscores removed.
        """
        if os.path.isfile(os.path.join(self.watch_data_dir, 'headers.txt')):
            return True

        # Stops at the first tag file that exists
        return any(
            os.path.isfile(
                os.path.join(
                    self.__datastore_path,
                    "headers-" + re.sub(r'[\W_]', '', tag).lower().strip() + ".txt",
                )
            )
            for tag in self.all_tags
        )
    def get_all_headers(self):
        """Return this watch's request headers merged with any header files on disk.

        Starts from a copy of the watch's own ``headers`` setting, then layers
        on ``headers.txt`` from the watch data directory, followed by one
        ``headers-<tag>.txt`` per tag from the datastore directory (the tag is
        lower-cased with non-word characters and underscores removed). Later
        sources overwrite earlier ones. A file that cannot be read or parsed is
        reported with ``print`` and skipped.
        """
        from .App import parse_headers_from_text_file

        merged = self.get('headers', {}).copy()

        def _absorb(filepath):
            # Best effort: one unreadable file must not stop the other sources
            try:
                if os.path.isfile(filepath):
                    merged.update(parse_headers_from_text_file(filepath))
            except Exception as e:
                print(f"ERROR reading headers.txt at {filepath}", str(e))

        # Watch-specific file lives in the watch's own data directory
        _absorb(os.path.join(self.watch_data_dir, 'headers.txt'))

        # Tag-specific files live in the main datastore directory
        for tag in self.all_tags:
            slug = re.sub(r'[\W_]', '', tag).lower().strip()
            _absorb(os.path.join(self.__datastore_path, "headers-" + slug + ".txt"))

        return merged
    def get_last_fetched_before_filters(self):
        import brotli
--- a/changedetectionio/processors/text_json_diff.py
+++ b/changedetectionio/processors/text_json_diff.py
@@ -70,10 +70,9 @@ class perform_site_check(difference_detection_processor):
        # Unset any existing notification error
        update_obj = {'last_notification_error': False, 'last_error': False}
        extra_headers = watch.get('headers', [])
        # Tweak the base config with the per-watch ones
-        request_headers = deepcopy(self.datastore.data['settings']['headers'])
+        extra_headers = watch.get_all_headers()
        request_headers = self.datastore.get_all_headers()
        request_headers.update(extra_headers)
        # https://github.com/psf/requests/issues/4525
--- a/changedetectionio/store.py
+++ b/changedetectionio/store.py
@@ -3,7 +3,7 @@ from flask import (
 )
 from . model import App, Watch
-from copy import deepcopy
+from copy import deepcopy, copy
 from os import path, unlink
 from threading import Lock
 import json
@@ -474,8 +474,6 @@ class ChangeDetectionStore:
        return proxy_list if len(proxy_list) else None
    def get_preferred_proxy_for_watch(self, uuid):
        """
        Returns the preferred proxy by ID key
@@ -507,6 +505,25 @@ class ChangeDetectionStore:
        return None
    @property
    def has_extra_headers_file(self):
        """True when a ``headers.txt`` file exists directly in the datastore directory."""
        return os.path.isfile(os.path.join(self.datastore_path, 'headers.txt'))
    def get_all_headers(self):
        """Return the global request headers, extended by ``headers.txt`` if present.

        Takes a shallow copy of the ``headers`` entry in the settings (an empty
        dict when absent) and merges in whatever ``headers.txt`` in the
        datastore directory provides. A file that cannot be read or parsed is
        reported with ``print`` and otherwise ignored.
        """
        from .model.App import parse_headers_from_text_file

        merged = copy(self.data['settings'].get('headers', {}))
        filepath = os.path.join(self.datastore_path, 'headers.txt')

        try:
            # Nothing on disk: the configured headers are the final answer
            if not os.path.isfile(filepath):
                return merged
            merged.update(parse_headers_from_text_file(filepath))
        except Exception as e:
            print(f"ERROR reading headers.txt at {filepath}", str(e))

        return merged
    # Run all updates
    # IMPORTANT - Each update could be run even when they have a new install and the schema is correct
    #             So therefore - each `update_n` should be very careful about checking if it needs to actually run
--- a/changedetectionio/templates/edit.html
+++ b/changedetectionio/templates/edit.html
@@ -152,6 +152,15 @@
 {{ render_field(form.headers, rows=5, placeholder="Example
 Cookie: foobar
 User-Agent: wonderbra 1.0") }}
                        <div class="pure-form-message-inline">
                            {% if has_extra_headers_file %}
                                <strong>Alert! Extra headers file found and will be added to this watch!</strong>
                            {% else %}
                                Headers can also be read from a file in your data-directory <a href="https://github.com/dgtlmoon/changedetection.io/wiki/Adding-headers-from-an-external-file">Read more here</a>
                            {% endif %}
                        </div>
                    </div>
                    <div class="pure-control-group" id="request-body">
                                        {{ render_field(form.body, rows=5, placeholder="Example
--- a/changedetectionio/templates/settings.html
+++ b/changedetectionio/templates/settings.html
@@ -70,6 +70,10 @@
                            <a href="https://github.com/dgtlmoon/changedetection.io/wiki/Configurable-BASE_URL-setting">read more here</a>.
                        </span>
                    </div>
                    <div class="pure-control-group">
                        {{ render_field(form.application.form.pager_size) }}
                        <span class="pure-form-message-inline">Number of items per page in the watch overview list, 0 to disable.</span>
                    </div>
                    <div class="pure-control-group">
                        {{ render_checkbox_field(form.application.form.extract_title_as_title) }}
--- a/changedetectionio/templates/watch-overview.html
+++ b/changedetectionio/templates/watch-overview.html
@@ -79,7 +79,7 @@
                <td colspan="6">No website watches configured, please add a URL in the box above, or <a href="{{ url_for('import_page')}}" >import a list</a>.</td>
            </tr>
            {% endif %}
-            {% for watch in (watches|sort(attribute=sort_attribute, reverse=sort_order == 'asc'))[pagination.skip:pagination.skip+pagination.per_page] %}
+            {% for watch in (watches|sort(attribute=sort_attribute, reverse=sort_order == 'asc'))|pagination_slice(skip=pagination.skip) %}
            <tr id="{{ watch.uuid }}"
                class="{{ loop.cycle('pure-table-odd', 'pure-table-even') }} processor-{{ watch['processor'] }}
                {% if watch.last_error is defined and watch.last_error != False %}error{% endif %}
--- a/changedetectionio/tests/conftest.py
+++ b/changedetectionio/tests/conftest.py
@@ -14,13 +14,16 @@ global app
 def cleanup(datastore_path):
    # Unlink test output files
-    files = ['output.txt',
+    files = [
-             'url-watches.json',
+        'count.txt',
-             'secret.txt',
+        'endpoint-content.txt'
-             'notification.txt',
+        'headers.txt',
-             'count.txt',
+        'headers-testtag.txt',
-             'endpoint-content.txt'
+        'notification.txt',
-                 ]
+        'secret.txt',
        'url-watches.json',
        'output.txt',
    ]
    for file in files:
        try:
            os.unlink("{}/{}".format(datastore_path, file))
--- a/changedetectionio/tests/test_request.py
+++ b/changedetectionio/tests/test_request.py
@@ -1,7 +1,8 @@
 import json
 import os
 import time
 from flask import url_for
-from . util import set_original_response, set_modified_response, live_server_setup
+from . util import set_original_response, set_modified_response, live_server_setup, wait_for_all_checks, extract_UUID_from_client
 def test_setup(live_server):
    live_server_setup(live_server)
@@ -234,3 +235,72 @@ def test_method_in_request(client, live_server):
    # Should be only one with method set to PATCH
    assert watches_with_method == 1
    res = client.get(url_for("form_delete", uuid="all"), follow_redirects=True)
    assert b'Deleted' in res.data
 def test_headers_textfile_in_request(client, live_server):
    """Check that headers from text files on disk are sent along with a watch's own headers.

    Imports one watch tagged ``testtag`` with two inline headers, then writes a
    global ``headers.txt``, a tag-level ``headers-testtag.txt`` and a per-watch
    ``headers.txt``. After a recheck, the edit page must show the
    "extra headers file" alert and the preview must contain headers from all
    four sources.
    """
    # Server setup call is disabled here; presumably an earlier test in this module already did it - confirm
    #live_server_setup(live_server)
    # Add our URL to the import page
    test_url = url_for('test_headers', _external=True)
    # Import the test URL once; the assertion below expects exactly one import
    res = client.post(
        url_for("import_page"),
        data={"urls": test_url},
        follow_redirects=True
    )
    assert b"1 Imported" in res.data
    time.sleep(1)
    # Add some headers to a request
    res = client.post(
        url_for("edit_page", uuid="first"),
        data={
              "url": test_url,
              "tag": "testtag",
              "fetch_backend": "html_requests",
              "headers": "xxx:ooo\ncool:yeah\r\n"},
        follow_redirects=True
    )
    assert b"Updated watch." in res.data
    wait_for_all_checks(client)
    # Tag-level headers file; the name uses the tag given to the watch above
    with open('test-datastore/headers-testtag.txt', 'w') as f:
        f.write("tag-header: test")
    # Global headers file, written with a CRLF between its two entries
    with open('test-datastore/headers.txt', 'w') as f:
        f.write("global-header: nice\r\nnext-global-header: nice")
    # Per-watch headers file inside the watch's own directory
    with open('test-datastore/'+extract_UUID_from_client(client)+'/headers.txt', 'w') as f:
        f.write("watch-header: nice")
    client.get(url_for("form_watch_checknow"), follow_redirects=True)
    # Give the thread time to pick it up
    wait_for_all_checks(client)
    res = client.get(url_for("edit_page", uuid="first"))
    assert b"Extra headers file found and will be added to this watch" in res.data
    # The recheck has already completed, so the files are not needed anymore
    os.unlink('test-datastore/headers.txt')
    os.unlink('test-datastore/headers-testtag.txt')
    os.unlink('test-datastore/'+extract_UUID_from_client(client)+'/headers.txt')
    # The preview should contain every header that was sent
    # (presumably the `test_headers` endpoint echoes back the request headers - confirm)
    res = client.get(
        url_for("preview_page", uuid="first"),
        follow_redirects=True
    )
    assert b"Global-Header:nice" in res.data
    assert b"Next-Global-Header:nice" in res.data
    assert b"Xxx:ooo" in res.data
    assert b"Watch-Header:nice" in res.data
    assert b"Tag-Header:test" in res.data
    #unlink headers.txt on start/stop
    res = client.get(url_for("form_delete", uuid="all"), follow_redirects=True)
    assert b'Deleted' in res.data
Author	SHA1	Message	Date
dgtlmoon	e9e1ce893f	0.42.2	2023-05-25 16:47:30 +02:00
dgtlmoon	b5a415c7b6	UI - Configurable pager size #1599 #1598	2023-05-25 16:38:54 +02:00
dgtlmoon	9e954532d6	Fetcher - Ability to specify headers from a textfile per watch, global or per tag ( https://github.com/dgtlmoon/changedetection.io/wiki/Adding-headers-from-an-external-file )	2023-05-22 17:19:52 +02:00
dgtlmoon	955835df72	Restock detection - Better reporting when it fails (#1584 )	2023-05-21 23:10:39 +02:00
dgtlmoon	1aeafef910	Fetcher - Puppeteer experimental fetcher wasn't returning the status-code (#1585 )	2023-05-21 23:10:08 +02:00
dgtlmoon	1367197df7	Update README.md	2023-05-21 21:28:19 +02:00