Spaces:

billyxx
/

Sprouts_Assignment

Sleeping

App Files Files Community

billyxx committed 18 days ago

Commit

272e246

verified ·

1 Parent(s): bee3a95

Upload app.py

Browse files

Files changed (1) hide show

app.py +43 -26

app.py CHANGED Viewed

@@ -13,41 +13,57 @@ def process_resumes(job_description, uploaded_files):
     if not job_description.strip():
         return "Please provide a job description.", None
-    if not uploaded_files:
-        return "Please upload at least one resume file.", None
     resume_texts = []
     for uploaded_file in uploaded_files:
-        filepath = uploaded_file.name  # uploaded_file is a NamedTemporaryFile-like object
-        # Read file content depending on extension
-        if filepath.endswith(".txt"):
-            text = uploaded_file.read().decode("utf-8")
-        elif filepath.endswith(".pdf"):
-            import pdfplumber
-            uploaded_file.seek(0)
-            with pdfplumber.open(uploaded_file) as pdf:
-                pages = [page.extract_text() for page in pdf.pages if page.extract_text() is not None]
-                text = "\n".join(pages)
-        elif filepath.endswith(".docx"):
-            from docx import Document
             uploaded_file.seek(0)
-            doc = Document(uploaded_file)
-            full_text = [para.text for para in doc.paragraphs]
-            text = "\n".join(full_text)
         else:
-            return f"Unsupported file format: {filepath}", None
-        resume_texts.append((filepath, text))
-    # Rank resumes
     results = rank_resumes(job_description, resume_texts)
-    # Add filename to candidate info
-    for i, candidate in enumerate(results):
-        candidate["name"] = resume_texts[i][0]
     # Generate summaries
     for candidate in results:
         candidate["summary"] = summarize_resume_flan(candidate["text"], job_description)
@@ -64,6 +80,7 @@ def process_resumes(job_description, uploaded_files):
     return "", table_data
 def extract_text_from_docx(filepath):
     doc = Document(filepath)
     full_text = []

     if not job_description.strip():
         return "Please provide a job description.", None
     resume_texts = []
     for uploaded_file in uploaded_files:
+        # If the uploaded_file is a file-like object (has 'read' method)
+        if hasattr(uploaded_file, "read"):
+            # Reset file pointer just in case
             uploaded_file.seek(0)
+            content = uploaded_file.read()
+            # Get filename attribute, fallback if not available
+            filename = getattr(uploaded_file, "name", "unknown")
+            # Save the file to disk if you want or just process in-memory
+            # For example, save to UPLOAD_FOLDER
+            filepath = os.path.join(UPLOAD_FOLDER, os.path.basename(filename))
+            with open(filepath, "wb") as f:
+                f.write(content)
         else:
+            # uploaded_file is probably a NamedString (str-like)
+            # Gradio provides the filename differently in this case,
+            # so you might have to assign a default or get from UI
+            content = uploaded_file
+            filepath = None
+            filename = "unknown"
+        # Process content depending on extension
+        if filename.endswith(".txt") or (filepath and filepath.endswith(".txt")):
+            text = content.decode("utf-8") if isinstance(content, bytes) else content
+        elif filename.endswith(".pdf") or (filepath and filepath.endswith(".pdf")):
+            # If saved to file, open from file
+            if filepath:
+                import pdfplumber
+                with pdfplumber.open(filepath) as pdf:
+                    pages = [page.extract_text() for page in pdf.pages if page.extract_text()]
+                    text = "\n".join(pages)
+            else:
+                # No file saved, cannot process PDF bytes easily here
+                return "Please upload PDF files via file upload.", None
+        elif filename.endswith(".docx") or (filepath and filepath.endswith(".docx")):
+            if filepath:
+                from docx import Document
+                doc = Document(filepath)
+                text = "\n".join([p.text for p in doc.paragraphs])
+            else:
+                return "Please upload DOCX files via file upload.", None
+        else:
+            return f"Unsupported file format: {filename}", None
+        resume_texts.append((filename, text))
+    # Now call rank_resumes etc.
     results = rank_resumes(job_description, resume_texts)
     # Generate summaries
     for candidate in results:
         candidate["summary"] = summarize_resume_flan(candidate["text"], job_description)
     return "", table_data
 def extract_text_from_docx(filepath):
     doc = Document(filepath)
     full_text = []