Spaces:

raseel-zymr
/

Document-QandA

Sleeping

App Files Files Community

raseel-zymr committed on Jun 20, 2023

Commit

952eb35

•

1 Parent(s): 5aee298

Upload TXT and PDF files

Browse files

Files changed (1) hide show

app.py +33 -10

app.py CHANGED Viewed

@@ -1,5 +1,6 @@
 import os
 import streamlit as st
 from io import StringIO
 #for textfiles
@@ -18,12 +19,42 @@ from langchain.document_loaders import UnstructuredPDFLoader
 os.environ["HUGGINGFACEHUB_API_TOKEN"] = st.secrets["hf_api_key"]
 st.title('Document Q&A - Ask anything in your Document')
 st.sidebar.subheader('Upload document')
 uploaded_file = st.sidebar.file_uploader("Upload File",type=['txt','pdf'])
 with st.sidebar.expander('File'):
-    if(uploaded_file):
-    	st.info(uploaded_file.name)
@@ -42,12 +73,6 @@ if(uploaded_file):
 	loader = TextLoader(uploaded_file.name)
 	documents = loader.load()
-# Document Loader
-#loader = TextLoader('./KS-all-info_rev1.txt')
-# loader = TextLoader(os.path.join("./", uploaded_file.name))
 	# import textwrap
 	# def wrap_text_preserve_newlines(text, width=110):
     # 	# Split the input text into lines based on newline characters
@@ -78,8 +103,6 @@ if(uploaded_file):
 	docs = db.similarity_search(query)
 	answer = chain.run(input_documents=docs, question=query)
 	st.subheader('Answer')
 	st.write(answer)

 import os
 import streamlit as st
+from pathlib import Path
 from io import StringIO
 #for textfiles
 os.environ["HUGGINGFACEHUB_API_TOKEN"] = st.secrets["hf_api_key"]
+def pdf_file(filename):
+	st.subheader('Uploaded PDF File:')
+	st.write(filename)
+def text_file(filename):
+	st.subheader('Uploaded Text File:')
+	st.write(filename)
+	# loader = TextLoader(filename)
+	# documents = loader.load()
+	# # Text Splitter
+	# text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=10)
+	# docs = text_splitter.split_documents(documents)
+	# db = FAISS.from_documents(docs, embeddings)
+	# chain = load_qa_chain(llm2, chain_type="stuff")
 st.title('Document Q&A - Ask anything in your Document')
+st.subheader('This application can be used to upload text(.txt) and PDF(.pdf) files and ask questions about their contents.')
 st.sidebar.subheader('Upload document')
 uploaded_file = st.sidebar.file_uploader("Upload File",type=['txt','pdf'])
+if Path(uploaded_file.name).suffix == '.txt':
+	text_file(uploaded_file.name)
+if Path(uploaded_file.name).suffix == '.pdf':
+	pdf_file(uploaded_file.name)
 with st.sidebar.expander('File'):
+    if (uploaded_file):
+	    st.info(uploaded_file.name)
+if os.path.exists('/content/'):
+	st.info(os.listdir('/content/'))
 	loader = TextLoader(uploaded_file.name)
 	documents = loader.load()
 	# import textwrap
 	# def wrap_text_preserve_newlines(text, width=110):
     # 	# Split the input text into lines based on newline characters
 	docs = db.similarity_search(query)
 	answer = chain.run(input_documents=docs, question=query)
 	st.subheader('Answer')
 	st.write(answer)