Refactoring fetcher, working feeds and raw url writer

This commit is contained in:
Luciano Gervasoni
2025-03-12 17:56:40 +01:00
parent e124dbc21a
commit 61c31ee9aa
24 changed files with 2085 additions and 194 deletions

View File

@@ -0,0 +1,33 @@
def remove_http_s(url):
    """Return *url* with a leading ``https://`` or ``http://`` removed.

    Only the scheme at the very start of the string is stripped; any
    later occurrence (for example a URL embedded in a query parameter)
    is left untouched. Strings that start with neither scheme are
    returned unchanged.

    Args:
        url: The URL string to strip.

    Returns:
        The URL without its leading HTTP(S) scheme.
    """
    for scheme in ("https://", "http://"):
        if url.startswith(scheme):
            # Slice rather than str.replace: replace() would also delete
            # every later occurrence of the scheme inside the URL.
            return url[len(scheme):]
    return url
def is_valid_url(url):
    """Return True when *url* starts with ``https://``, otherwise False.

    Only the HTTPS scheme prefix is checked; plain ``http://`` URLs and
    any other strings are reported as not valid.
    """
    return url.startswith("https://")
def get_searxng_instances():
    """Return the enabled SearxNG instance base URLs as a list.

    The URLs are collected in a set before being converted to a list, so
    the order of the returned list is not defined. Public instances are
    catalogued at https://searx.space/.
    """
    enabled_instances = {
        "https://searx.work/",
        "https://search.ononoki.org/",
        "https://searxng.nicfab.eu/",
        "https://searx.be/",
    }
    # Instances currently disabled, kept here for reference:
    #   https://searx.fmac.xyz/
    #   https://northboot.xyz/       (marked FIX)
    #   https://serx.ml/             (marked Offline)
    #   https://searx.ru/
    #   https://searx.sp-codes.de/
    #   https://s.frlt.one/
    #   https://search.sapti.me/
    return list(enabled_instances)