Spaces:
Paused
Paused
File size: 673 Bytes
2624a11 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 |
from langchain_community.document_loaders import PyMuPDFLoader, TextLoader
from langchain_community.vectorstores import Qdrant
def process_file(file):
    """Load one file into a list of documents.

    Files whose name ends in ``.pdf`` (compared case-insensitively) are read
    with ``PyMuPDFLoader``; every other file is read with ``TextLoader``.

    Args:
        file: Path of the file to load. Only its string form is inspected
            for the extension; the value itself is handed to the loader
            unchanged.

    Returns:
        A new list holding the items returned by the loader's ``load()``.
    """
    # Compare on the lower-cased string form so "REPORT.PDF" and
    # path-like objects are routed to the PDF loader as well.
    is_pdf = str(file).lower().endswith(".pdf")
    loader_cls = PyMuPDFLoader if is_pdf else TextLoader
    # Copy into a fresh list so callers never share the loader's own list.
    return list(loader_cls(file).load())
def add_to_qdrant(documents, embeddings, qdrant_client, collection_name):
    """Hand documents and embeddings to ``Qdrant.from_documents``.

    Args:
        documents: Documents forwarded as the first positional argument.
        embeddings: Embeddings object forwarded as the second positional
            argument.
        qdrant_client: Object whose ``url`` attribute gives the server
            address; no other attribute is read here.
        collection_name: Name of the target collection.

    Returns:
        None. The object returned by ``Qdrant.from_documents`` is discarded.
    """
    server_url = qdrant_client.url
    Qdrant.from_documents(
        documents,
        embeddings,
        url=server_url,
        prefer_grpc=True,
        collection_name=collection_name,
    )