Create test_ingestion.py

This commit is contained in:
Alex 2023-03-13 17:37:01 +00:00
parent bac25112b7
commit 20a0800aa7

19
scripts/test_ingestion.py Normal file
View File

@@ -0,0 +1,19 @@
import os
import dotenv
import tiktoken
from langchain import FAISS
from langchain.embeddings import OpenAIEmbeddings
# Smoke test for an ingested vector store: load the saved FAISS index, run one
# similarity query against it, and print the token length of every hit.

# Pull settings from a local .env file into the process environment.
dotenv.load_dotenv()
embeddings_key = os.getenv("API_KEY")

# The index is read from 'outputs/inputs'; the embeddings object is built
# with the key read above.
docsearch = FAISS.load_local(
    'outputs/inputs',
    OpenAIEmbeddings(openai_api_key=embeddings_key),
)

d1 = docsearch.similarity_search("Whats new in 1.5.3?")
print(d1)
print("=====================================")
print("=====================================")

# The tokenizer does not depend on the document, so look it up once instead
# of once per loop iteration.
encoding = tiktoken.get_encoding("cl100k_base")
for doc in d1:
    print("docs length (tokens)")
    doc_len = len(encoding.encode(doc.page_content))
    print(doc_len)