Spaces:

CR7CAD
/

ISOM5240FinalProject

Sleeping

App Files Community

CR7CAD committed on Mar 17

Commit

4077883

verified ·

1 Parent(s): 6135a86

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -14

app.py CHANGED Viewed

@@ -1,8 +1,7 @@
 import os
-import tempfile
 import streamlit as st
 import docx
-import textract
 from transformers import pipeline
 import numpy as np
 from scipy.spatial.distance import cosine
@@ -35,7 +34,7 @@ models = load_models()
 #####################################
 def extract_text_from_file(file_obj):
     """
-    Extract text from .doc and .docx files.
     Returns the extracted text or an error message if extraction fails.
     """
     filename = file_obj.name
@@ -48,17 +47,13 @@ def extract_text_from_file(file_obj):
             text = "\n".join(para.text for para in document.paragraphs if para.text.strip())
         except Exception as e:
             text = f"Error processing DOCX file: {e}"
-    elif ext == ".doc":
         try:
-            with tempfile.NamedTemporaryFile(delete=False, suffix=".doc") as tmp:
-                tmp.write(file_obj.read())
-                tmp_filename = tmp.name
-            text = textract.process(tmp_filename).decode("utf-8")
-            os.unlink(tmp_filename)
         except Exception as e:
-            text = f"Error processing DOC file: {e}"
     else:
-        text = "Unsupported file type."
     return text
 #####################################
@@ -127,7 +122,7 @@ def compute_suitability(candidate_summary, company_prompt, models):
 st.title("Resume Analyzer and Company Suitability Checker")
 st.markdown(
     """
-Upload your resume file in **.doc** or **.docx** format. The app performs the following tasks:
 1. Extracts text from the resume.
 2. Uses a transformer-based model to generate a concise candidate summary.
 3. Compares the candidate summary with a company profile to produce a suitability score.
@@ -135,7 +130,7 @@ Upload your resume file in **.doc** or **.docx** format. The app performs the fo
 )
 # File uploader
-uploaded_file = st.file_uploader("Upload your resume (.doc or .docx)", type=["doc", "docx"])
 # Company description text area
 company_prompt = st.text_area(
@@ -175,7 +170,7 @@ if uploaded_file is not None and company_prompt and st.button("Analyze Resume"):
         # Extract text from resume
         resume_text = extract_text_from_file(uploaded_file)
-        if resume_text.startswith("Error") or resume_text == "Unsupported file type.":
             st.error(resume_text)
         else:
             # Display extracted text

 import os
+import io
 import streamlit as st
 import docx
 from transformers import pipeline
 import numpy as np
 from scipy.spatial.distance import cosine
 #####################################
 def extract_text_from_file(file_obj):
     """
+    Extract text from .docx files.
     Returns the extracted text or an error message if extraction fails.
     """
     filename = file_obj.name
             text = "\n".join(para.text for para in document.paragraphs if para.text.strip())
         except Exception as e:
             text = f"Error processing DOCX file: {e}"
+    elif ext == ".txt":
         try:
+            text = file_obj.getvalue().decode("utf-8")
         except Exception as e:
+            text = f"Error processing TXT file: {e}"
     else:
+        text = "Unsupported file type. Please upload a .docx or .txt file."
     return text
 #####################################
 st.title("Resume Analyzer and Company Suitability Checker")
 st.markdown(
     """
+Upload your resume file in **.docx** or **.txt** format. The app performs the following tasks:
 1. Extracts text from the resume.
 2. Uses a transformer-based model to generate a concise candidate summary.
 3. Compares the candidate summary with a company profile to produce a suitability score.
 )
 # File uploader
+uploaded_file = st.file_uploader("Upload your resume (.docx or .txt)", type=["docx", "txt"])
 # Company description text area
 company_prompt = st.text_area(
         # Extract text from resume
         resume_text = extract_text_from_file(uploaded_file)
+        if resume_text.startswith("Error") or resume_text == "Unsupported file type. Please upload a .docx or .txt file.":
             st.error(resume_text)
         else:
             # Display extracted text