"""Build a FAISS vector store from a text file and pickle it to disk.

Running this script loads ``state_of_the_union.txt``, splits the loaded
documents into smaller ones, embeds them with ``OpenAIEmbeddings`` and
writes the resulting FAISS vector store to ``vectorstore.pkl``.
"""
import pickle

from langchain.document_loaders import UnstructuredFileLoader
from langchain.embeddings import OpenAIEmbeddings
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.vectorstores.faiss import FAISS

# Input document and output artifact; both are resolved relative to the
# current working directory.
SOURCE_PATH = "state_of_the_union.txt"
VECTORSTORE_PATH = "vectorstore.pkl"

# Load the raw document(s) from the source file.
loader = UnstructuredFileLoader(SOURCE_PATH)
raw_documents = loader.load()

# Split the loaded documents using the splitter's default settings.
text_splitter = RecursiveCharacterTextSplitter()
documents = text_splitter.split_documents(raw_documents)

# Embed the split documents and index them in a FAISS vector store.
# NOTE(review): OpenAIEmbeddings presumably needs OpenAI credentials in the
# environment -- confirm before running.
embeddings = OpenAIEmbeddings()
vectorstore = FAISS.from_documents(documents, embeddings)

# Persist the vector store. Unpickling can execute arbitrary code, so the
# resulting file should only ever be loaded from a trusted location.
with open(VECTORSTORE_PATH, "wb") as f:
    pickle.dump(vectorstore, f)