Spaces:

billyxx
/

Sprouts_Assignment

Sleeping

App Files Community

billyxx committed 18 days ago

Commit

fc1e181

verified ·

1 Parent(s): 31aa939

Upload app.py

Browse files

Files changed (1) hide show

app.py +22 -23

app.py CHANGED Viewed

@@ -12,48 +12,48 @@ os.makedirs(UPLOAD_FOLDER, exist_ok=True)
 def process_resumes(job_description, uploaded_files):
     if not job_description.strip():
         return "Please provide a job description.", None
-    if not uploaded_files:
-        return "Please upload at least one resume file.", None
     resume_texts = []
     for uploaded_file in uploaded_files:
         filename = getattr(uploaded_file, "name", None)
         if filename is None:
             return "One of the uploaded files is missing a filename. Please upload files, not text.", None
-        # Reset file pointer
-        if hasattr(uploaded_file, "seek"):
-            uploaded_file.seek(0)
-        # Process based on extension
         ext = filename.lower().split(".")[-1]
         if ext == "txt":
-            # Read text directly
-            if hasattr(uploaded_file, "read"):
-                content = uploaded_file.read()
-                # bytes? decode
-                text = content.decode("utf-8") if isinstance(content, bytes) else content
-            else:
-                return f"Unexpected content for {filename}", None
         elif ext == "pdf":
-            # Save temporarily to disk to use pdfplumber (which needs a file path)
             temp_path = os.path.join(UPLOAD_FOLDER, filename)
             with open(temp_path, "wb") as f:
-                f.write(uploaded_file.read())
             import pdfplumber
             with pdfplumber.open(temp_path) as pdf:
                 pages = [page.extract_text() for page in pdf.pages if page.extract_text()]
                 text = "\n".join(pages)
         elif ext == "docx":
-            # Save temporarily to disk for python-docx
             temp_path = os.path.join(UPLOAD_FOLDER, filename)
             with open(temp_path, "wb") as f:
-                f.write(uploaded_file.read())
             from docx import Document
             doc = Document(temp_path)
             text = "\n".join([p.text for p in doc.paragraphs])
@@ -63,9 +63,10 @@ def process_resumes(job_description, uploaded_files):
         resume_texts.append((filename, text))
-    # Rank resumes and generate summaries
     results = rank_resumes(job_description, resume_texts)
     for candidate in results:
         candidate["summary"] = summarize_resume_flan(candidate["text"], job_description)
@@ -80,8 +81,6 @@ def process_resumes(job_description, uploaded_files):
     return "", table_data
 def extract_text_from_docx(filepath):
     doc = Document(filepath)
     full_text = []

 def process_resumes(job_description, uploaded_files):
     if not job_description.strip():
         return "Please provide a job description.", None
     resume_texts = []
     for uploaded_file in uploaded_files:
         filename = getattr(uploaded_file, "name", None)
         if filename is None:
             return "One of the uploaded files is missing a filename. Please upload files, not text.", None
         ext = filename.lower().split(".")[-1]
+        # Read file content or bytes
+        if hasattr(uploaded_file, "read"):
+            content = uploaded_file.read()
+        elif isinstance(uploaded_file, str):
+            content = uploaded_file
+        else:
+            return f"Unsupported upload type for file: {filename}", None
+        # Process by file type
         if ext == "txt":
+            text = content.decode("utf-8") if isinstance(content, bytes) else content
         elif ext == "pdf":
             temp_path = os.path.join(UPLOAD_FOLDER, filename)
             with open(temp_path, "wb") as f:
+                if isinstance(content, bytes):
+                    f.write(content)
+                else:
+                    f.write(content.encode("utf-8"))
             import pdfplumber
             with pdfplumber.open(temp_path) as pdf:
                 pages = [page.extract_text() for page in pdf.pages if page.extract_text()]
                 text = "\n".join(pages)
         elif ext == "docx":
             temp_path = os.path.join(UPLOAD_FOLDER, filename)
             with open(temp_path, "wb") as f:
+                if isinstance(content, bytes):
+                    f.write(content)
+                else:
+                    f.write(content.encode("utf-8"))
             from docx import Document
             doc = Document(temp_path)
             text = "\n".join([p.text for p in doc.paragraphs])
         resume_texts.append((filename, text))
+    # Rank resumes
     results = rank_resumes(job_description, resume_texts)
+    # Generate summaries
     for candidate in results:
         candidate["summary"] = summarize_resume_flan(candidate["text"], job_description)
     return "", table_data
 def extract_text_from_docx(filepath):
     doc = Document(filepath)
     full_text = []