Implement basic support for failure notifications.

pull/1945/head
Patrick Sean Klein 1 year ago
parent 8a35d62e02
commit 582cc3eff2
No known key found for this signature in database
GPG Key ID: B6D50F39A56F6906

@ -111,6 +111,9 @@ nav
<div class="pure-control-group inline-radio"> <div class="pure-control-group inline-radio">
{{ render_checkbox_field(form.notification_muted) }} {{ render_checkbox_field(form.notification_muted) }}
</div> </div>
<div class="pure-control-group inline-radio">
{{ render_checkbox_field(form.notification_notify_on_failure) }}
</div>
{% if is_html_webdriver %} {% if is_html_webdriver %}
<div class="pure-control-group inline-radio"> <div class="pure-control-group inline-radio">
{{ render_checkbox_field(form.notification_screenshot) }} {{ render_checkbox_field(form.notification_screenshot) }}

@ -500,6 +500,7 @@ class processor_text_json_diff_form(commonSettingsForm):
notification_muted = BooleanField('Notifications Muted / Off', default=False) notification_muted = BooleanField('Notifications Muted / Off', default=False)
notification_screenshot = BooleanField('Attach screenshot to notification (where possible)', default=False) notification_screenshot = BooleanField('Attach screenshot to notification (where possible)', default=False)
notification_notify_on_failure = BooleanField('Send a notification on watch failure', default=False)
def extra_tab_content(self): def extra_tab_content(self):
return None return None

@ -0,0 +1,149 @@
#!/usr/bin/python3
import os
import time
from pathlib import Path
from typing import Optional
from flask import url_for
from .util import live_server_setup, wait_for_all_checks
NOTIFICATION_PATH = Path("test-datastore/notification.txt")
ENDPOINT_CONTENT_PATH = Path("test-datastore/endpoint-content.txt")
def test_setup(live_server):
live_server_setup(live_server)
def test_notification_on_failure(client, live_server):
# Set the response
ENDPOINT_CONTENT_PATH.write_text('test endpoint content\n')
# Successful request does not trigger a notification
preview = run_filter_test(client, test_url=url_for('test_endpoint', _external=True), expected_notification=None)
assert 'test endpoint content' in preview.text
# Failed request triggers a notification
preview = run_filter_test(client, test_url=url_for('test_endpoint', _external=True, status_code=403),
expected_notification="Access denied")
assert 'Error Text' in preview.text
def test_notification_on_failure_does_not_trigger_if_disabled(client, live_server):
# Set the response
ENDPOINT_CONTENT_PATH.write_text('test endpoint content\n')
# Successful request does not trigger a notification
preview = run_filter_test(client, test_url=url_for('test_endpoint', _external=True), expected_notification=None,
enable_notification_on_failure=False)
assert 'test endpoint content' in preview.text
# Failed request does not trigger a notification either
preview = run_filter_test(client, test_url=url_for('test_endpoint', _external=True, status_code=403),
expected_notification=None, enable_notification_on_failure=False)
assert 'Error Text' in preview.text
def expect_notification(expected_text):
if expected_text is None:
assert not NOTIFICATION_PATH.exists(), "Expected no notification, but found one"
else:
assert NOTIFICATION_PATH.exists(), "Expected notification, but found none"
notification = NOTIFICATION_PATH.read_text()
assert expected_text in notification, (f"Expected notification to contain '{expected_text}' but it did not. "
f"Notification: {notification}")
NOTIFICATION_PATH.unlink(missing_ok=True)
def run_filter_test(client, test_url: str, expected_notification: Optional[str], enable_notification_on_failure=True):
# Set up the watch
_setup_watch(client, test_url, enable_notification_on_failure=enable_notification_on_failure)
# Ensure that the watch has been triggered
wait_for_all_checks(client)
# Give the thread time to pick it up
time.sleep(3)
# Check the notification
expect_notification(expected_notification)
res = client.get(
url_for("preview_page", uuid="first"),
follow_redirects=True
)
# TODO Move to pytest?
cleanup(client)
return res
def cleanup(client):
# cleanup for the next test
res = client.get(url_for("form_delete", uuid="all"), follow_redirects=True)
assert b'Deleted' in res.data
NOTIFICATION_PATH.unlink(missing_ok=True)
def _trigger_watch(client):
client.get(url_for("form_watch_checknow"), follow_redirects=True)
wait_for_all_checks(client)
def _setup_watch(client, test_url, enable_notification_on_failure=True):
# Give the endpoint time to spin up
time.sleep(1)
# cleanup for the next
client.get(
url_for("form_delete", uuid="all"),
follow_redirects=True
)
if os.path.isfile("test-datastore/notification.txt"):
os.unlink("test-datastore/notification.txt")
# Add our URL to the import page
res = client.post(
url_for("form_quick_watch_add"),
data={"url": test_url, "tags": ''},
follow_redirects=True
)
assert b"Watch added" in res.data
# Give the thread time to pick up the first version
wait_for_all_checks(client)
# Goto the edit page, add our ignore text
# Add our URL to the import page
url = url_for('test_notification_endpoint', _external=True)
notification_url = url.replace('http', 'json')
print(">>>> Notification URL: " + notification_url)
# Just a regular notification setting, this will be used by the special 'filter not found' notification
notification_form_data = {"notification_urls": notification_url,
"notification_title": "New ChangeDetection.io Notification - {{watch_url}}",
"notification_body": "BASE URL: {{base_url}}\n"
"Watch URL: {{watch_url}}\n"
"Watch UUID: {{watch_uuid}}\n"
"Watch title: {{watch_title}}\n"
"Watch tag: {{watch_tag}}\n"
"Preview: {{preview_url}}\n"
"Diff URL: {{diff_url}}\n"
"Snapshot: {{current_snapshot}}\n"
"Diff: {{diff}}\n"
"Diff Full: {{diff_full}}\n"
"Diff as Patch: {{diff_patch}}\n"
":-)",
"notification_format": "Text"}
notification_form_data.update({
"url": test_url,
"title": "Notification test",
"filter_failure_notification_send": '',
"notification_notify_on_failure": 'y' if enable_notification_on_failure else '',
"time_between_check-minutes": "180",
"fetch_backend": "html_requests"})
res = client.post(
url_for("edit_page", uuid="first"),
data=notification_form_data,
follow_redirects=True
)
assert b"Updated watch." in res.data

@ -9,6 +9,11 @@ import queue
import threading import threading
import time import time
from changedetectionio import content_fetcher, html_tools
from .processors.restock_diff import UnableToExtractRestockData
from .processors.text_json_diff import FilterNotFoundInResponse
# A single update worker # A single update worker
# #
# Requests for checking on a single site(watch) from a queue of watches # Requests for checking on a single site(watch) from a queue of watches
@ -69,11 +74,16 @@ class update_worker(threading.Thread):
n_object.update({ n_object.update({
'current_snapshot': snapshot_contents, 'current_snapshot': snapshot_contents,
'diff': diff.render_diff(prev_snapshot, current_snapshot, line_feed_sep=line_feed_sep), 'diff': diff.render_diff(prev_snapshot, current_snapshot,
'diff_added': diff.render_diff(prev_snapshot, current_snapshot, include_removed=False, line_feed_sep=line_feed_sep), line_feed_sep=line_feed_sep),
'diff_full': diff.render_diff(prev_snapshot, current_snapshot, include_equal=True, line_feed_sep=line_feed_sep), 'diff_added': diff.render_diff(prev_snapshot, current_snapshot,
'diff_patch': diff.render_diff(prev_snapshot, current_snapshot, line_feed_sep=line_feed_sep, patch_format=True), include_removed=False, line_feed_sep=line_feed_sep),
'diff_removed': diff.render_diff(prev_snapshot, current_snapshot, include_added=False, line_feed_sep=line_feed_sep), 'diff_full': diff.render_diff(prev_snapshot, current_snapshot,
include_equal=True, line_feed_sep=line_feed_sep),
'diff_patch': diff.render_diff(prev_snapshot, current_snapshot,
line_feed_sep=line_feed_sep, patch_format=True),
'diff_removed': diff.render_diff(prev_snapshot, current_snapshot, include_added=False,
line_feed_sep=line_feed_sep),
'notification_timestamp': now, 'notification_timestamp': now,
'screenshot': watch.get_screenshot() if watch and watch.get('notification_screenshot') else None, 'screenshot': watch.get_screenshot() if watch and watch.get('notification_screenshot') else None,
'triggered_text': triggered_text, 'triggered_text': triggered_text,
@ -218,6 +228,26 @@ class update_worker(threading.Thread):
self.notification_q.put(n_object) self.notification_q.put(n_object)
logger.error(f"Sent step not found notification for {watch_uuid}") logger.error(f"Sent step not found notification for {watch_uuid}")
def send_failure_notification(self, watch_uuid: str, error_text: str):
watch = self.datastore.data['watching'].get(watch_uuid)
if not watch:
return
n_object = {'notification_title': 'Changedetection.io - Alert - {}'.format(error_text),
'notification_body': "Your watch {{watch_url}} failed!\n\nLink: {{base_url}}/edit/{{watch_uuid}}\n\nThanks - Your omniscient changedetection.io installation :)\n",
'notification_format': 'text'}
n_object['notification_urls'] = self._check_cascading_vars('notification_urls', watch)
# Only prepare to notify if the rules above matched
if n_object and n_object.get('notification_urls'):
n_object.update({
'watch_url': watch['url'],
'uuid': watch_uuid,
'screenshot': None
})
self.notification_q.put(n_object)
print("Sent error notification for {}".format(watch_uuid))
def cleanup_error_artifacts(self, uuid): def cleanup_error_artifacts(self, uuid):
# All went fine, remove error artifacts # All went fine, remove error artifacts
@ -227,9 +257,47 @@ class update_worker(threading.Thread):
if os.path.isfile(full_path): if os.path.isfile(full_path):
os.unlink(full_path) os.unlink(full_path)
def _update_watch(self, uuid, update_obj, exception):
# TODO check if update succeeded or had an error.
# If it had an error, handle notifications
# If it did not have one, clean up any error states
# TODO Future - loop over notification handlers and send them the update_obj, allowing modification
last_error = update_obj.get('last_error', False)
if last_error:
# TODO Future - message notification handlers
if self.datastore.data['watching'][uuid].get('notification_notify_on_failure', False):
self.send_failure_notification(watch_uuid=uuid, error_text=update_obj['last_error'])
pass
else:
# TODO Future - message notification handlers
pass
self.datastore.update_watch(uuid=uuid, update_obj=update_obj)
if isinstance(exception, FilterNotFoundInResponse) or isinstance(exception, content_fetcher.BrowserStepsStepTimout):
# Only when enabled, send the notification
if self.datastore.data['watching'][uuid].get('filter_failure_notification_send', False):
c = self.datastore.data['watching'][uuid].get('consecutive_filter_failures', 5)
c += 1
# Send notification if we reached the threshold?
threshold = self.datastore.data['settings']['application'].get(
'filter_failure_notification_threshold_attempts',
0)
print("Filter for {} not found, consecutive_filter_failures: {}".format(uuid, c))
if threshold > 0 and c >= threshold:
if not self.datastore.data['watching'][uuid].get('notification_muted'):
if isinstance(exception, FilterNotFoundInResponse):
self.send_filter_failure_notification(uuid)
else:
self.send_step_failure_notification(watch_uuid=uuid, step_n=exception.step_n)
c = 0
self.datastore.update_watch(uuid=uuid, update_obj={'consecutive_filter_failures': c})
def run(self): def run(self):
now = time.time() now = time.time()
while not self.app.config.exit.is_set(): while not self.app.config.exit.is_set():
update_handler = None update_handler = None
@ -241,7 +309,8 @@ class update_worker(threading.Thread):
else: else:
uuid = queued_item_data.item.get('uuid') uuid = queued_item_data.item.get('uuid')
self.current_uuid = uuid self.current_uuid = uuid
if uuid in list(self.datastore.data['watching'].keys()) and self.datastore.data['watching'][uuid].get('url'): if uuid in list(self.datastore.data['watching'].keys()) and self.datastore.data['watching'][uuid].get(
'url'):
changed_detected = False changed_detected = False
contents = b'' contents = b''
process_changedetection_results = True process_changedetection_results = True
@ -252,7 +321,8 @@ class update_worker(threading.Thread):
watch = self.datastore.data['watching'].get(uuid) watch = self.datastore.data['watching'].get(uuid)
logger.info(f"Processing watch UUID {uuid} Priority {queued_item_data.priority} URL {watch['url']}") logger.info(f"Processing watch UUID {uuid} Priority {queued_item_data.priority} URL {watch[
'url']}")
now = time.time() now = time.time()
try: try:
@ -261,7 +331,6 @@ class update_worker(threading.Thread):
# Abort processing when the content was the same as the last fetch # Abort processing when the content was the same as the last fetch
skip_when_same_checksum = queued_item_data.item.get('skip_when_checksum_same') skip_when_same_checksum = queued_item_data.item.get('skip_when_checksum_same')
# Init a new 'difference_detection_processor', first look in processors # Init a new 'difference_detection_processor', first look in processors
processor_module_name = f"changedetectionio.processors.{processor}.processor" processor_module_name = f"changedetectionio.processors.{processor}.processor"
try: try:
@ -314,16 +383,16 @@ class update_worker(threading.Thread):
else: else:
extra_help = ", it's possible that the filters were found, but contained no usable text." extra_help = ", it's possible that the filters were found, but contained no usable text."
self.datastore.update_watch(uuid=uuid, update_obj={ self._update_watch(uuid=uuid, update_obj={
'last_error': f"Got HTML content but no text found (With {e.status_code} reply code){extra_help}" 'last_error': f"Got HTML content but no text found (With {e.status_code} reply code){extra_help}"
}) }, exception=e)
if e.screenshot: if e.screenshot:
watch.save_screenshot(screenshot=e.screenshot, as_error=True) watch.save_screenshot(screenshot=e.screenshot, as_error=True)
if e.xpath_data: if e.xpath_data:
watch.save_xpath_data(data=e.xpath_data) watch.save_xpath_data(data=e.xpath_data)
process_changedetection_results = False process_changedetection_results = False
except content_fetchers_exceptions.Non200ErrorCodeReceived as e: except content_fetchers_exceptions.Non200ErrorCodeReceived as e:
@ -345,7 +414,7 @@ class update_worker(threading.Thread):
if e.page_text: if e.page_text:
watch.save_error_text(contents=e.page_text) watch.save_error_text(contents=e.page_text)
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': err_text}) self._update_watch(uuid=uuid, update_obj={'last_error': err_text}, exception=e)
process_changedetection_results = False process_changedetection_results = False
except FilterNotFoundInResponse as e: except FilterNotFoundInResponse as e:
@ -353,7 +422,7 @@ class update_worker(threading.Thread):
continue continue
err_text = "Warning, no filters were found, no change detection ran - Did the page change layout? update your Visual Filter if necessary." err_text = "Warning, no filters were found, no change detection ran - Did the page change layout? update your Visual Filter if necessary."
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': err_text}) self._update_watch(uuid=uuid, update_obj={'last_error': err_text}, exception=None)
# Filter wasnt found, but we should still update the visual selector so that they can have a chance to set it up again # Filter wasnt found, but we should still update the visual selector so that they can have a chance to set it up again
if e.screenshot: if e.screenshot:
@ -375,7 +444,7 @@ class update_worker(threading.Thread):
self.send_filter_failure_notification(uuid) self.send_filter_failure_notification(uuid)
c = 0 c = 0
self.datastore.update_watch(uuid=uuid, update_obj={'consecutive_filter_failures': c}) self._update_watch(uuid=uuid, update_obj={'consecutive_filter_failures': c}, exception=None)
process_changedetection_results = False process_changedetection_results = False
@ -384,16 +453,16 @@ class update_worker(threading.Thread):
process_changedetection_results = False process_changedetection_results = False
changed_detected = False changed_detected = False
except content_fetchers_exceptions.BrowserConnectError as e: except content_fetchers_exceptions.BrowserConnectError as e:
self.datastore.update_watch(uuid=uuid, self._update_watch(uuid=uuid,
update_obj={'last_error': e.msg update_obj={'last_error': e.msg
} }
) , exception=e)
process_changedetection_results = False process_changedetection_results = False
except content_fetchers_exceptions.BrowserFetchTimedOut as e: except content_fetchers_exceptions.BrowserFetchTimedOut as e:
self.datastore.update_watch(uuid=uuid, self._update_watch(uuid=uuid,
update_obj={'last_error': e.msg update_obj={'last_error': e.msg
} }
) , exception=e)
process_changedetection_results = False process_changedetection_results = False
except content_fetchers_exceptions.BrowserStepsStepException as e: except content_fetchers_exceptions.BrowserStepsStepException as e:
@ -415,11 +484,11 @@ class update_worker(threading.Thread):
logger.debug(f"BrowserSteps exception at step {error_step} {str(e.original_e)}") logger.debug(f"BrowserSteps exception at step {error_step} {str(e.original_e)}")
self.datastore.update_watch(uuid=uuid, self._update_watch(uuid=uuid,
update_obj={'last_error': err_text, update_obj={'last_error': err_text,
'browser_steps_last_error_step': error_step 'browser_steps_last_error_step': error_step
} }
) , exception=None)
if watch.get('filter_failure_notification_send', False): if watch.get('filter_failure_notification_send', False):
c = watch.get('consecutive_filter_failures', 5) c = watch.get('consecutive_filter_failures', 5)
@ -433,27 +502,31 @@ class update_worker(threading.Thread):
self.send_step_failure_notification(watch_uuid=uuid, step_n=e.step_n) self.send_step_failure_notification(watch_uuid=uuid, step_n=e.step_n)
c = 0 c = 0
self.datastore.update_watch(uuid=uuid, update_obj={'consecutive_filter_failures': c}) self._update_watch(uuid=uuid, update_obj={'consecutive_filter_failures': c}, exception=None)
process_changedetection_results = False process_changedetection_results = False
except content_fetchers_exceptions.EmptyReply as e: except content_fetchers_exceptions.EmptyReply as e:
# Some kind of custom to-str handler in the exception handler that does this? # Some kind of custom to-str handler in the exception handler that does this?
err_text = "EmptyReply - try increasing 'Wait seconds before extracting text', Status Code {}".format(e.status_code) err_text = "EmptyReply - try increasing 'Wait seconds before extracting text', Status Code {}".format(
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': err_text, e.status_code)
'last_check_status': e.status_code}) self._update_watch(uuid=uuid, update_obj={'last_error': err_text,
'last_check_status': e.status_code},
exception=e)
process_changedetection_results = False process_changedetection_results = False
except content_fetchers_exceptions.ScreenshotUnavailable as e: except content_fetchers_exceptions.ScreenshotUnavailable as e:
err_text = "Screenshot unavailable, page did not render fully in the expected time or page was too long - try increasing 'Wait seconds before extracting text'" err_text = "Screenshot unavailable, page did not render fully in the expected time or page was too long - try increasing 'Wait seconds before extracting text'"
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': err_text, self._update_watch(uuid=uuid, update_obj={'last_error': err_text,
'last_check_status': e.status_code}) 'last_check_status': e.status_code},
exception=e)
process_changedetection_results = False process_changedetection_results = False
except content_fetchers_exceptions.JSActionExceptions as e: except content_fetchers_exceptions.JSActionExceptions as e:
err_text = "Error running JS Actions - Page request - "+e.message err_text = "Error running JS Actions - Page request - " + e.message
if e.screenshot: if e.screenshot:
watch.save_screenshot(screenshot=e.screenshot, as_error=True) watch.save_screenshot(screenshot=e.screenshot, as_error=True)
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': err_text, self._update_watch(uuid=uuid, update_obj={'last_error': err_text,
'last_check_status': e.status_code}) 'last_check_status': e.status_code},
exception=e)
process_changedetection_results = False process_changedetection_results = False
except content_fetchers_exceptions.PageUnloadable as e: except content_fetchers_exceptions.PageUnloadable as e:
err_text = "Page request from server didnt respond correctly" err_text = "Page request from server didnt respond correctly"
@ -463,20 +536,22 @@ class update_worker(threading.Thread):
if e.screenshot: if e.screenshot:
watch.save_screenshot(screenshot=e.screenshot, as_error=True) watch.save_screenshot(screenshot=e.screenshot, as_error=True)
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': err_text, self._update_watch(uuid=uuid, update_obj={'last_error': err_text,
'last_check_status': e.status_code, 'last_check_status': e.status_code,
'has_ldjson_price_data': None}) 'has_ldjson_price_data': None},
exception=e)
process_changedetection_results = False process_changedetection_results = False
except content_fetchers_exceptions.BrowserStepsInUnsupportedFetcher as e: except content_fetchers_exceptions.BrowserStepsInUnsupportedFetcher as e:
err_text = "This watch has Browser Steps configured and so it cannot run with the 'Basic fast Plaintext/HTTP Client', either remove the Browser Steps or select a Chrome fetcher." err_text = "This watch has Browser Steps configured and so it cannot run with the 'Basic fast Plaintext/HTTP Client', either remove the Browser Steps or select a Chrome fetcher."
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': err_text}) self._update_watch(uuid=uuid, update_obj={
'last_error': err_text}, exception=e)
process_changedetection_results = False process_changedetection_results = False
logger.error(f"Exception (BrowserStepsInUnsupportedFetcher) reached processing watch UUID: {uuid}") logger.error(f"Exception (BrowserStepsInUnsupportedFetcher) reached processing watch UUID: {uuid}")
except Exception as e: except Exception as e:
logger.error(f"Exception reached processing watch UUID: {uuid}") logger.error(f"Exception reached processing watch UUID: {uuid}")
logger.error(str(e)) logger.error(str(e))
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': "Exception: " + str(e)}) self._update_watch(uuid=uuid, update_obj={'last_error': "Exception: " + str(e)}, exception=e)
# Other serious error # Other serious error
process_changedetection_results = False process_changedetection_results = False
@ -512,7 +587,7 @@ class update_worker(threading.Thread):
# Now update after running everything # Now update after running everything
timestamp = round(time.time()) timestamp = round(time.time())
try: try:
self.datastore.update_watch(uuid=uuid, update_obj=update_obj) self._update_watch(uuid=uuid, update_obj=update_obj, exception=None)
# Also save the snapshot on the first time checked, "last checked" will always be updated, so we just check history length. # Also save the snapshot on the first time checked, "last checked" will always be updated, so we just check history length.
@ -546,11 +621,12 @@ class update_worker(threading.Thread):
if not watch.get('notification_muted'): if not watch.get('notification_muted'):
self.send_content_changed_notification(watch_uuid=uuid) self.send_content_changed_notification(watch_uuid=uuid)
except Exception as e: except Exception as e:
# Catch everything possible here, so that if a worker crashes, we don't lose it until restart! # Catch everything possible here, so that if a worker crashes, we don't lose it until restart!
logger.critical("!!!! Exception in update_worker while processing process_changedetection_results !!!") logger.critical("!!!! Exception in update_worker while processing process_changedetection_results !!!")
logger.critical(str(e)) logger.critical(str(e))
self.datastore.update_watch(uuid=uuid, update_obj={'last_error': str(e)}) self._update_watch(uuid=uuid, update_obj={'last_error': str(e)}, exception=e)
# Always record that we atleast tried # Always record that we atleast tried
@ -565,10 +641,10 @@ class update_worker(threading.Thread):
except Exception as e: except Exception as e:
pass pass
self.datastore.update_watch(uuid=uuid, update_obj={'fetch_time': round(time.time() - now, 3), self._update_watch(uuid=uuid, update_obj={'fetch_time': round(time.time() - now, 3),
'last_checked': round(time.time()), 'last_checked': round(time.time()),
'check_count': count 'check_count': count
}) }, exception=None if process_changedetection_results else Exception("Unknown"))
self.current_uuid = None # Done self.current_uuid = None # Done

Loading…
Cancel
Save