Spaces:

mdasad3617
/

lab-report-analyzer

Running

App Files Files Community

mdasad3617 committed on Nov 30, 2024

Commit

375547d

verified ·

1 Parent(s): 0f90d5a

Update app.py

Browse files

Files changed (1) hide show

app.py +83 -23

app.py CHANGED Viewed

@@ -1,45 +1,105 @@
 import streamlit as st
 from transformers import pipeline
 import logging
 # Setup logging
 def setup_logging():
     # Configure logging through logging.basicConfig: INFO threshold,
     # "time - level - message" record layout, and a single StreamHandler.
     logging.basicConfig(
         level=logging.INFO,
-        format='%(asctime)s - %(levelname)s - %(message)s',
-        handlers=[
-            logging.StreamHandler()
-        ]
     )
 def main():
     # Pre-commit entry point: an English -> Hinglish translator page.
     # Sets up logging, builds the translation pipeline, draws the title,
     # help text and input box, and translates when "Translate" is clicked.
     setup_logging()
-    logging.info("Starting the Streamlit app.")
-    # Initialize the translation pipeline for English to Hinglish
     # NOTE: the pipeline is constructed on every call to main().
-    translator = pipeline("translation", model="surajp/eng_to_hinglish")  # Replace with your desired model
-    # Streamlit UI
-    st.title("English to Hinglish Translator")
-    st.write("Type or paste your English text below, and get the Hinglish translation.")
-    text = st.text_area("Enter your English text here:", placeholder="Type here...")
-    if st.button("Translate"):
         # Any exception raised while translating or rendering is handled below.
         try:
-            if text:
-                logging.info("Translating English text to Hinglish.")
                 # The first result's 'translation_text' is displayed; an empty
                 # result falls back to a fixed "No translation available." message.
-                result = translator(text, max_length=200)
-                translation = result[0]['translation_text'] if result else "No translation available."
-                st.text_area("Hinglish Translation:", translation, height=200)
-                logging.info("Translation completed successfully.")
-            else:
-                st.warning("Please enter text to translate.")
         except Exception as e:
             # The detail goes to the log; the page only shows a generic message.
-            logging.error(f"Error during translation: {e}")
-            st.error("An error occurred during translation. Please check the logs for more details.")
     # Logged at the end of every main() call, whether or not the button was pressed.
-    logging.info("Closing the Streamlit app.")
 # Run the app only when this file is executed as a script, not when imported.
 if __name__ == "__main__":
     main()

 import streamlit as st
 from transformers import pipeline
+from PIL import Image
+import pytesseract
 import logging
+import PyPDF2
 # Setup logging
 def setup_logging():
     """Configure logging for the app via ``logging.basicConfig``.

     Records at INFO and above are formatted as
     ``<time> - <level> - <message>`` and sent to a ``StreamHandler``.
     """
     record_layout = "%(asctime)s - %(levelname)s - %(message)s"
     console_handler = logging.StreamHandler()
     logging.basicConfig(
         level=logging.INFO,
         format=record_layout,
         handlers=[console_handler],
     )
+# Text extraction from image
def extract_text_from_image(image):
    """Run OCR on *image* and return the recognised text.

    The image is passed straight to ``pytesseract.image_to_string``. If that
    call raises, the error is logged and a fixed error message is returned
    in place of the text, so this function itself does not raise.
    """
    try:
        return pytesseract.image_to_string(image)
    except Exception as ocr_error:
        logging.error(f"Error during OCR: {ocr_error}")
    return "Error occurred during text extraction."
+# Text extraction from PDF
def extract_text_from_pdf(file):
    """Return the text of every page of a PDF, concatenated in page order.

    Args:
        file: Whatever ``PyPDF2.PdfReader`` accepts (the app passes the
            uploaded file object).

    Returns:
        The joined page texts. If reading or extraction raises, the error is
        logged with its traceback and the fixed message
        ``"Error occurred during text extraction."`` is returned instead.
    """
    try:
        pdf_reader = PyPDF2.PdfReader(file)
        # ``or ""`` keeps one page without extractable text from aborting the
        # whole document; join avoids repeated string concatenation.
        return "".join(page.extract_text() or "" for page in pdf_reader.pages)
    except Exception as e:
        # logging.exception records the traceback alongside the message.
        logging.exception("Error during PDF text extraction: %s", e)
        return "Error occurred during text extraction."
+# Main function
 # Message returned by extract_text_from_image / extract_text_from_pdf when
 # extraction fails; it must never be summarized as if it were report text.
 _EXTRACTION_FAILED = "Error occurred during text extraction."


 @st.cache_resource
 def _load_pipelines():
     """Build the summarizer and the translators once and reuse them.

     Streamlit re-executes the script on every widget interaction; caching
     the pipelines as a resource avoids reloading three models each time.

     Returns:
         ``(summarizer, translators)`` where ``translators`` maps a language
         name ("Hindi", "Urdu") to its English-to-language pipeline.
     """
     summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
     translators = {
         "Hindi": pipeline("translation", model="Helsinki-NLP/opus-mt-en-hi"),
         "Urdu": pipeline("translation", model="Helsinki-NLP/opus-mt-en-ur"),
     }
     return summarizer, translators


 def main():
     """Render the Lab Report Analyzer page and run one analysis on demand.

     The page offers a file uploader (PNG/JPG/JPEG/PDF) and a text box. When
     "Analyze" is pressed, text is taken from the uploaded file (a file takes
     precedence over pasted text), shown back to the user, summarized in
     English, and the summary is translated to Hindi and Urdu.

     Failures are reported on the page and logged. A failed extraction or a
     failed summarization stops the run, since later steps have nothing valid
     to work on; a failed translation only skips that language.
     """
     setup_logging()
     st.title("Lab Report Analyzer")
     st.write("Analyze lab reports from images, PDFs, or text and get summaries in English, Hindi, and Urdu.")
     summarizer, translators = _load_pipelines()

     uploaded_file = st.file_uploader("Upload a file (Image or PDF):", type=["png", "jpg", "jpeg", "pdf"])
     text_input = st.text_area("Or paste your text here:")
     if not st.button("Analyze"):
         return

     if uploaded_file:
         # Compare case-insensitively so "REPORT.PDF" is not treated as an image.
         if uploaded_file.name.lower().endswith(".pdf"):
             st.info("Extracting text from PDF...")
             extracted_text = extract_text_from_pdf(uploaded_file)
         else:
             st.info("Extracting text from image...")
             try:
                 image = Image.open(uploaded_file)
             except Exception as e:
                 logging.exception("Error opening uploaded image: %s", e)
                 st.error("The uploaded image could not be opened.")
                 return
             extracted_text = extract_text_from_image(image)
         if extracted_text == _EXTRACTION_FAILED:
             st.error("An error occurred during text extraction.")
             return
     elif text_input:
         extracted_text = text_input
     else:
         st.warning("Please upload a file or enter text.")
         return

     # Nothing to summarize (blank input, or a file with no recognisable text).
     if not (extracted_text or "").strip():
         st.warning("No text was found to analyze.")
         return

     st.subheader("Extracted Text")
     st.text_area("Extracted Text:", extracted_text, height=200)

     try:
         st.info("Summarizing text...")
         # truncation=True lets inputs longer than the model's limit be
         # summarized from their leading portion instead of failing outright.
         summary = summarizer(
             extracted_text,
             max_length=150,
             min_length=30,
             do_sample=False,
             truncation=True,
         )[0]["summary_text"]
     except Exception as e:
         logging.exception("Error during summarization: %s", e)
         st.error("An error occurred during summarization.")
         # Without a summary there is nothing to translate.
         return
     st.subheader("Summary (English)")
     st.write(summary)

     for language, translate in translators.items():
         try:
             st.info(f"Translating summary to {language}...")
             translated = translate(summary)[0]["translation_text"]
         except Exception as e:
             logging.exception("Error during %s translation: %s", language, e)
             st.error(f"An error occurred during {language} translation.")
             continue
         st.subheader(f"Summary ({language})")
         st.write(translated)
 # Run the app only when this file is executed as a script, not when imported.
 if __name__ == "__main__":
     main()