diff --git a/apps/web-crawl-q-and-a/web-qa.py b/apps/web-crawl-q-and-a/web-qa.py
index ccc34fdb..0feb3825 100644
--- a/apps/web-crawl-q-and-a/web-qa.py
+++ b/apps/web-crawl-q-and-a/web-qa.py
@@ -17,7 +17,7 @@ import numpy as np
 from openai.embeddings_utils import distances_from_embeddings, cosine_similarity
 
 # Regex pattern to match a URL
-HTTP_URL_PATTERN = r'^http[s]*://.+'
+HTTP_URL_PATTERN = r'^http[s]{0,1}://.+$'
 
 # Define root domain to crawl
 domain = "openai.com"