diff --git a/app_urls/fetcher/src/fetch_utils_url_processor.py b/app_urls/fetcher/src/fetch_utils_url_processor.py index 086e817..838c850 100644 --- a/app_urls/fetcher/src/fetch_utils_url_processor.py +++ b/app_urls/fetcher/src/fetch_utils_url_processor.py @@ -71,6 +71,8 @@ def process_url(url, paywall_bypass=False): config.request_timeout = 15 # timeout in seconds # Default mode article = newspaper.article(url_of_interest, config=config) + + logger.debug("Processing raw URL 2: {}".format(url)) except newspaper.ArticleBinaryDataException: logger.warning("ArticleException for input URL {}".format(url)) return {"override_status": "invalid"} @@ -120,6 +122,8 @@ def process_url(url, paywall_bypass=False): logger.warning("Exception for input URL {}\n{}".format(url, str(e))) return None + logger.debug("Processing raw URL 3: {}".format(url)) + # Not a valid URL? if (not article.is_valid_url()): logger.debug("Invalid URL found: {}".format(url))