prep bug fix

This commit is contained in:
AliNajafi
2023-10-20 19:06:37 +03:00
parent 6424b0437a
commit a451d548fe

View File

@@ -28,9 +28,10 @@ url_extractor = URLExtract()
def url_handler(text: str):
    """Replace each URL in *text* with a tag that keeps only its domain.

    Every URL reported by the module-level ``url_extractor`` is replaced by
    the string ``" <http> {domain} </http> "``, where ``domain`` is the
    network location (``netloc``) parsed from that same URL.

    Args:
        text: Input text that may contain URLs.

    Returns:
        The text with every extracted URL replaced by its domain tag; the
        input is returned unchanged when no URL is found.
    """
    # Local import keeps this function self-contained regardless of what the
    # rest of the module imports.
    import re

    # De-duplicate while preserving first-seen order. A plain ``set`` would
    # shuffle the URLs and break the URL -> domain pairing.
    urls = list(dict.fromkeys(u for u in url_extractor.gen_urls(text) if u))
    if not urls:
        return text

    # Compute each domain from its own URL so the two can never get out of
    # step (the previous positional pairing of two independently
    # de-duplicated lists could attach the wrong domain to a URL).
    domain_by_url = {}
    for url in urls:
        # urlparse only fills ``netloc`` when a scheme is present, so
        # scheme-less URLs such as "example.com/x" get a default one.
        # NOTE(review): the substring test also matches "http" appearing
        # elsewhere in the URL; kept as-is to preserve existing behavior.
        full_url = url if "http" in url else f"https://{url}"
        domain_by_url[url] = urllib.parse.urlparse(full_url).netloc

    # Substitute in a single pass, longest URL first, so that:
    #   * a URL that is a prefix of another cannot split the longer one, and
    #   * text inserted by a replacement (the domain) is never re-matched.
    pattern = re.compile(
        "|".join(re.escape(url) for url in sorted(urls, key=len, reverse=True))
    )
    return pattern.sub(
        lambda match: f" <http> {domain_by_url[match.group(0)]} </http> ",
        text,
    )