Improve regex

This commit is contained in:
fabiofranco85 2023-03-27 07:38:35 -03:00 committed by GitHub
parent ebfdfe3099
commit 5a80ef2571
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -17,7 +17,7 @@ import numpy as np
from openai.embeddings_utils import distances_from_embeddings, cosine_similarity
# Regex pattern to match an absolute http:// or https:// URL.
# `s?` permits at most one "s", so schemes such as "httpss://" are rejected,
# and `.+` requires at least one character after "://".
HTTP_URL_PATTERN = r'^https?://.+$'
# Define root domain to crawl
domain = "openai.com"