Update vector_store_retriever.py
Browse files
vector_store_retriever.py
CHANGED
|
@@ -12,8 +12,14 @@ hf = HuggingFaceInstructEmbeddings(
|
|
| 12 |
)
|
| 13 |
|
| 14 |
# Load and process the PDF files
|
| 15 |
-
|
| 16 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 17 |
|
| 18 |
#splitting the text into chunks
|
| 19 |
text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
|
|
|
|
| 12 |
)
|
| 13 |
|
| 14 |
# Load and process the PDF files
|
| 15 |
+
from langchain.document_loaders import PyPDFDirectoryLoader
|
| 16 |
+
|
| 17 |
+
loader = PyPDFDirectoryLoader("new_papers/")
|
| 18 |
+
|
| 19 |
+
docs = loader.load()
|
| 20 |
+
|
| 21 |
+
#loader = PyPDFLoader('./new_papers/', glob="./*.pdf")
|
| 22 |
+
#documents = loader.load()
|
| 23 |
|
| 24 |
#splitting the text into chunks
|
| 25 |
text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
|