#!/usr/bin/python3 import time from flask import url_for from . util import live_server_setup from changedetectionio import html_tools def test_setup(live_server): live_server_setup(live_server) # Unit test of the stripper # Always we are dealing in utf-8 def test_strip_text_func(): from ..fetch_processor import json_html_plaintext test_content = """ Some content is listed here but sometimes we want to remove the lines. but not always.""" ignore_lines = ["sometimes"] fetcher = fetch_site_status.perform_site_check(datastore=False) stripped_content = html_tools.strip_ignore_text(test_content, ignore_lines) assert b"sometimes" not in stripped_content assert b"Some content" in stripped_content def set_original_ignore_response(): test_return_data = """
Some initial textWhich is across multiple lines
So let's see what happens. """ with open("test-datastore/endpoint-content.txt", "w") as f: f.write(test_return_data) def set_modified_original_ignore_response(): test_return_data = """ Some NEW nice initial textWhich is across multiple lines
So let's see what happens.new ignore stuff
blah
""" with open("test-datastore/endpoint-content.txt", "w") as f: f.write(test_return_data) # Is the same but includes ZZZZZ, 'ZZZZZ' is the last line in ignore_text def set_modified_ignore_response(): test_return_data = """ Some initial textWhich is across multiple lines
ZZZZz
So let's see what happens. """ with open("test-datastore/endpoint-content.txt", "w") as f: f.write(test_return_data) def test_check_ignore_text_functionality(client, live_server): sleep_time_for_fetch_thread = 3 # Use a mix of case in ZzZ to prove it works case-insensitive. ignore_text = "XXXXX\r\nYYYYY\r\nzZzZZ\r\nnew ignore stuff" set_original_ignore_response() # Give the endpoint time to spin up time.sleep(1) # Add our URL to the import page test_url = url_for('test_endpoint', _external=True) res = client.post( url_for("import_page"), data={"urls": test_url}, follow_redirects=True ) assert b"1 Imported" in res.data # Trigger a check client.get(url_for("form_watch_checknow"), follow_redirects=True) # Give the thread time to pick it up time.sleep(sleep_time_for_fetch_thread) # Goto the edit page, add our ignore text # Add our URL to the import page res = client.post( url_for("edit_page", uuid="first"), data={"ignore_text": ignore_text, "url": test_url, 'fetch_backend': "html_requests"}, follow_redirects=True ) assert b"Updated watch." in res.data # Check it saved res = client.get( url_for("edit_page", uuid="first"), ) assert bytes(ignore_text.encode('utf-8')) in res.data # Trigger a check client.get(url_for("form_watch_checknow"), follow_redirects=True) # Give the thread time to pick it up time.sleep(sleep_time_for_fetch_thread) # It should report nothing found (no new 'unviewed' class) res = client.get(url_for("index")) assert b'unviewed' not in res.data assert b'/test-endpoint' in res.data # Make a change set_modified_ignore_response() # Trigger a check client.get(url_for("form_watch_checknow"), follow_redirects=True) # Give the thread time to pick it up time.sleep(sleep_time_for_fetch_thread) # It should report nothing found (no new 'unviewed' class) res = client.get(url_for("index")) assert b'unviewed' not in res.data assert b'/test-endpoint' in res.data # Just to be sure.. set a regular modified change.. set_modified_original_ignore_response() client.get(url_for("form_watch_checknow"), follow_redirects=True) time.sleep(sleep_time_for_fetch_thread) res = client.get(url_for("index")) assert b'unviewed' in res.data # Check the preview/highlighter, we should be able to see what we ignored, but it should be highlighted # We only introduce the "modified" content that includes what we ignore so we can prove the newest version also displays # at /preview res = client.get(url_for("preview_page", uuid="first")) # We should be able to see what we ignored assert b'