Request timeout debugging

This commit is contained in:
Luciano Gervasoni
2025-09-05 14:00:50 +02:00
parent 2fae0a3a9d
commit e4a325d6b4
2 changed files with 3 additions and 0 deletions

View File

@@ -148,6 +148,7 @@ class DB_Handler():
try:
# Extract URL content
dict_url_data = process_url(obj_url.url, paywall_bypass)
logger.debug("Processing raw URL EXTRACT URL CONTENT OK: {}".format(obj_url.url))
except Exception as e:
if (raise_exception_on_error):
# Simply raise exception, handled in a different way
@@ -242,6 +243,7 @@ class DB_Handler():
status_pattern_match = _get_status_pattern_matching(obj_url.url, list_pattern_status_tuple)
# Process URL
self._process_single_url(obj_url, status_pattern_match, raise_exception_on_error=False)
logger.debug("Processing raw URL OK: {}".format(obj_url.url))
logger.info("Updated #{} raw URLs".format(len(raw_urls)))
except Exception as e:

View File

@@ -40,6 +40,7 @@ def url_host_slowdown(url, url_host_slowdown_seconds):
cache.set("process_{}".format(url_host).encode("utf-8"), time.time(), timeout=60*5) # Expire after 5 minutes
def process_url(url, paywall_bypass=False):
logger.debug("Processing raw URL 1: {}".format(url))
if (paywall_bypass):
# TODO: Implement self-hosted instance