mirror of
https://github.com/james-m-jordan/openai-cookbook.git
synced 2025-05-09 19:32:38 +00:00
Merge pull request #289 from fabiofranco85/fabiofranco85-patch-1
Improve regex in web crawler
This commit is contained in:
commit
e04893c94e
@@ -17,7 +17,7 @@ import numpy as np
|
||||
from openai.embeddings_utils import distances_from_embeddings, cosine_similarity
|
||||
|
||||
# Regex pattern to match a URL
|
||||
-HTTP_URL_PATTERN = r'^http[s]*://.+'
|
||||
+HTTP_URL_PATTERN = r'^http[s]{0,1}://.+$'
|
||||
|
||||
# Define root domain to crawl
|
||||
domain = "openai.com"
|
||||
|
Loading…
x
Reference in New Issue
Block a user