Spaces:

RanaZaeem12
/

ExtractAnswer

Sleeping

RanaZaeem12 committed on May 11

Commit

c8b4723

verified ·

1 Parent(s): 3c64a05

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,16 +3,24 @@ from PyPDF2 import PdfReader
 import docx
 from pptx import Presentation
 from transformers import pipeline
-import os
-st.title("Multi-Document Q&A App 📄💬")
 qa_pipeline = pipeline("question-answering", model="distilbert-base-uncased-distilled-squad")
-uploaded_files = st.file_uploader("Upload PDF, Word, or PPT files", type=["pdf", "docx", "pptx"], accept_multiple_files=True)
 all_text = ""
 def extract_text_from_pdf(file):
     """Return the text of every page of the PDF in *file*, joined by newlines."""
     page_texts = []
     for pdf_page in PdfReader(file).pages:
         # A falsy extract_text() result is replaced by an empty string.
         page_texts.append(pdf_page.extract_text() or "")
     return "\n".join(page_texts)
@@ -30,6 +38,7 @@ def extract_text_from_pptx(file):
                 text.append(shape.text)
     return "\n".join(text)
 for file in uploaded_files:
     file_type = file.name.split('.')[-1].lower()
     if file_type == "pdf":
@@ -39,10 +48,14 @@ for file in uploaded_files:
     elif file_type == "pptx":
         all_text += extract_text_from_pptx(file) + "\n"
 if all_text:
-    st.success("Files processed. You can now ask questions.")
-    question = st.text_input("Ask a question based on your uploaded files:")
     if question:
         result = qa_pipeline(question=question, context=all_text)
-        st.write("**Answer:**", result['answer'])

 import docx
 from pptx import Presentation
 from transformers import pipeline
+# Title of the app
+st.title("📚 Multi-Document Q&A App")
+# Load question-answering pipeline from Hugging Face
 qa_pipeline = pipeline("question-answering", model="distilbert-base-uncased-distilled-squad")
+# File uploader for multiple file types
+uploaded_files = st.file_uploader(
+    "Upload PDF, Word (.docx), or PPT (.pptx) files",
+    type=["pdf", "docx", "pptx"],
+    accept_multiple_files=True
+)
+# Combine text from all files
 all_text = ""
+# File processing functions
 def extract_text_from_pdf(file):
     """Return the text of every page of the PDF in *file*, joined by newlines."""
     page_texts = []
     for pdf_page in PdfReader(file).pages:
         # A falsy extract_text() result is replaced by an empty string.
         page_texts.append(pdf_page.extract_text() or "")
     return "\n".join(page_texts)
                 text.append(shape.text)
     return "\n".join(text)
+# Extract text from uploaded files
 for file in uploaded_files:
     file_type = file.name.split('.')[-1].lower()
     if file_type == "pdf":
     elif file_type == "pptx":
         all_text += extract_text_from_pptx(file) + "\n"
+# Show input for question if files were processed
 if all_text:
+    st.success("✅ Files processed. Ask your question below.")
+    question = st.text_input("❓ Ask a question:")
     if question:
         result = qa_pipeline(question=question, context=all_text)
+        st.write("📌 **Answer:**", result['answer'])
+else:
+    st.info("Upload some files to begin...")