resumeMagic

Sleeping

App Files Community

pktpaulie committed on Nov 10, 2024

Commit

fcf1770

verified ·

1 Parent(s): 0fba36c

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -288

app.py CHANGED Viewed

@@ -19,7 +19,7 @@ import pdfplumber
 import docx
 import numpy as np
 import pypandoc
 # Create temporary directories
 temp_dir = tempfile.mkdtemp()
@@ -145,12 +145,14 @@ st.markdown("""
         .stButton>:active, focus {
          box-shadow: none;
          transform: translateY(0);
         }
     </style>
 """, unsafe_allow_html=True)
 # Add ResumeMagic Logo
-# st.image("logo.jpeg", use_container_width=True)
 st.markdown('<div class="logo-container"></div>', unsafe_allow_html=True)
 st.image("logo.jpeg", width=80)
 st.markdown('</div>', unsafe_allow_html=True)
@@ -249,7 +251,7 @@ def display_content_with_page_numbers(content, words_per_page=500):
         end_index = start_index + words_per_page
         page_content = ' '.join(words[start_index:end_index])
-        st.markdown(f"### Page {i + 1}")
         st.write(page_content)
 def save_docx_as_pdf(input_path, output_path='output.pdf'):
@@ -265,44 +267,8 @@ def save_docx_as_pdf(input_path, output_path='output.pdf'):
         shutil.copy(input_path, output_path)
     else:
         raise ValueError("Unsupported file format. Please upload a .docx or .pdf file.")
-# def save_docx_as_pdf(input_path, output_path='output.pdf'):
-#     if input_path.lower().endswith('.docx'):
-#         try:
-#             # Attempt to use unoconv
-#             subprocess.run(['unoconv', '-o', output_path, input_path])
-#             if not os.path.exists(output_path):
-#                 raise FileNotFoundError("unoconv failed to convert DOCX to PDF")
-#         except FileNotFoundError:
-#             # Fallback to text-based display
-#             with open(output_path, 'w') as f:
-#                 f.write(input_path.read())
-#     elif input_path.lower().endswith('.pdf'):
-#         shutil.copy(input_path, output_path)
-#     else:
-#         raise ValueError("Unsupported file format. Please upload a .docx or .pdf file.")
-def save_docx_as_pdf6(input_path, output_path='output.pdf'):
-    if input_path.lower().endswith('.docx'):
-        try:
-            # Convert .docx to .pdf using docx2pdf
-            convert(input_path, output_path)
-            if not os.path.exists(output_path):
-                raise FileNotFoundError("Conversion failed; output PDF not found.")
-        except Exception as e:
-            st.error(f"Failed to convert DOCX to PDF: {str(e)}")
-    elif input_path.lower().endswith('.pdf'):
-        shutil.copy(input_path, output_path)
-    else:
-        raise ValueError("Unsupported file format. Please upload a .docx or .pdf file.")
-# Install docx2pdf if not already installed
-# try:
-#     import docx2pdf
-# except ImportError:
-#     !pip install docx2pdf
 # def save_docx_as_pdf(input_path, output_path='output.pdf'):
 #     if input_path.lower().endswith('.docx'):
@@ -313,21 +279,7 @@ def save_docx_as_pdf6(input_path, output_path='output.pdf'):
 #     else:
 #         raise ValueError("Unsupported file format. Please upload a .docx or .pdf file.")
-def save_docx_as_pdf2(doc_content, output_path='output.pdf'):
-    # Save document content as a .docx file
-    temp_doc_path = 'temp.docx'
-    doc = Document()
-    doc.add_paragraph(doc_content)
-    doc.save(temp_doc_path)
-    # Convert .docx to PDF
-    from docx2pdf import convert
-    convert(temp_doc_path, output_path)
-    os.remove(temp_doc_path)
-    # subprocess.run(['libreoffice', '--headless', '--convert-to', 'pdf', temp_doc_path, '--outdir', os.path.dirname(output_path)])
 def save_docx_as_pdf1(input_path, output_path='output.pdf'):
     if input_path.lower().endswith('.docx'):
         from docx2pdf import convert
@@ -337,9 +289,6 @@ def save_docx_as_pdf1(input_path, output_path='output.pdf'):
     else:
         raise ValueError("Unsupported file format. Please upload a .docx or .pdf file.")
-# if uploaded_resume.type == "application/vnd.openxmlformats-officedocument.wordprocessingml.document":
-#     save_docx_as_pdf(resume_path, 'uploaded_resume.pdf')
-#     display_doc_as_image('uploaded_resume.pdf')
 def display_pdf_page1(pdf_path):
     try:
@@ -368,7 +317,7 @@ def display_pdf_pages_as_images(pdf_path):
     try:
         with pdfplumber.open(pdf_path) as pdf:
             for i, page in enumerate(pdf.pages):
-                st.markdown(f"### Page {i + 1}")
                 # Convert the page to an image
                 image = page.to_image()
                 # Render the image using Streamlit
@@ -394,146 +343,14 @@ def display_pdf_page(pdf_path, page_number=1):
     # Display the image
     display(img)
-def display_doc_as_image2(pdf_path):
-    # try:
-    #     images = convert_from_path(pdf_path, size=800)
-    #     display(Image(filename=images[0].filename))
-    # except Exception as e:
-    #     st.error(f"Failed to display image: {str(e)}")
     iframe_code = f"""
     <iframe src="{pdf_path}" width="100%" height="600px"></iframe>
     """
     st.markdown(iframe_code, unsafe_allow_html=True)
-    # try:
-    #     # Convert PDF to images
-    #     images = []
-    #     for i in range(1):  # Assuming only one page
-    #         command = [
-    #             "pdf2image", "-j", "--png",
-    #             "-f", str(i+1),
-    #             "-l", str(i+1),
-    #             pdf_path
-    #         ]
-    #         output = subprocess.check_output(command)
-    #         # Decode the base64 image data
-    #         img_data = base64.b64decode(output.split()[0])
-    #         img = Image.open(BytesIO(img_data))
-    #         images.append(img)
-    #     # Display the first page
-    #     display(images[0])
-    # except Exception as e:
-    #     st.error(f"Failed to display image: {str(e)}")
-def display_doc_as_image3(pdf_path):
-    try:
-        # Convert PDF to images
-        images = []
-        for i in range(1):  # Assuming only one page
-            img = Image.open(BytesIO(open(pdf_path, 'rb').read()))
-            images.append(img)
-        # Display the first page
-        display(images[0])
-    except Exception as e:
-        st.error(f"Failed to display image: {str(e)}")
-    # try:
-    #     images = convert_from_path(pdf_path, size=800)
-    #     display(Image.fromarray(images[0]))
-    # except Exception as e:
-    #     st.error(f"Failed to display image: {str(e)}")
-def display_doc_as_image1(pdf_url):
-    st.components.v1.iframe(pdf_url, width=800, height=600)
-    # try:
-    #     img = Image.open(pdf_path)
-    #     st.image(img)
-    # except Exception as e:
-    #     st.error(f"Failed to display image: {str(e)}")
-def display_doc_as_image(file_path):
-    """Display document with multiple fallback options"""
-    try:
-        # First attempt: Use pdf2image with explicit poppler path
-        try:
-            from pdf2image import convert_from_path
-            # Try common poppler paths on Linux
-            poppler_paths = [
-                '/usr/bin/pdftoppm',  # Common Linux path
-                '/opt/homebrew/bin/pdftoppm',  # Mac Homebrew path
-                'poppler-utils'  # Package name
-            ]
-            for poppler_path in poppler_paths:
-                try:
-                    images = convert_from_path(
-                        file_path,
-                        size=800,
-                        poppler_path=os.path.dirname(poppler_path) if os.path.isfile(poppler_path) else None
-                    )
-                    st.image(images[0])
-                    return
-                except Exception:
-                    continue
-            # If no poppler path worked, try without specifying path
-            images = convert_from_path(file_path, size=800)
-            st.image(images[0])
-        except Exception as e:
-            # Second attempt: Use Streamlit's native PDF display
-            try:
-                with open(file_path, "rb") as pdf_file:
-                    pdf_bytes = pdf_file.read()
-                    st.pdf(pdf_bytes)
-                return
-            except Exception as pdf_error:
-                st.error(f"Error displaying PDF: {str(pdf_error)}")
-            # Third attempt: If it's a DOCX file, try to extract text
-            if file_path.lower().endswith('.docx'):
-                try:
-                    doc = Document(file_path)
-                    text = '\n'.join([paragraph.text for paragraph in doc.paragraphs])
-                    st.text(text)
-                    return
-                except Exception as docx_error:
-                    st.error(f"Error displaying DOCX: {str(docx_error)}")
-    except Exception as main_error:
-        st.error(f"Error in display function: {str(main_error)}")
-        st.info("Displaying file path for debugging: " + file_path)
-        # Last resort: Try to read and display raw bytes
-        try:
-            with open(file_path, 'rb') as f:
-                bytes_data = f.read()
-                if file_path.lower().endswith('.pdf'):
-                    st.pdf(bytes_data)
-                else:
-                    st.text("File content preview not available")
-        except Exception as final_error:
-            st.error(f"Final fallback failed: {str(final_error)}")
-def display_doc_as_image5(pdf_path):
-    poppler_path = 'usr/bin'
-    images = convert_from_path(pdf_path, poppler_path=poppler_path)
-    for img in images:
-        buf = BytesIO()
-        img.save(buf, format="PNG")
-        st.image(buf)
-    # from IPython.display import display, Image
-    # images = convert_from_bytes(open(pdf_path, 'rb').read(), size=800)
-    # display(images[0])
 # Process if files are uploaded
 if uploaded_resume and uploaded_job_description:
     # Save files
@@ -578,11 +395,13 @@ if uploaded_resume and uploaded_job_description:
             # st.write(generated_resume)
             #Autoscroll
-            st.markdown("""
                 <script>
-                    window.scrollTo(0, document.body.scrollHeight);
                 </script>
-            """, unsafe_allow_html=True)
             # with st.spinner("Computing Match"):
@@ -617,19 +436,17 @@ if uploaded_resume and uploaded_job_description:
                 with col1:
                     st.markdown("### Uploaded Resume:")
                     save_docx_as_pdf(resume_path, '/tmp/uploaded_resume.pdf')
-                    # display_doc_as_image1('/tmp/uploaded_resume.pdf')
                     display_pdf_pages_as_images(resume_path)
                 with col2:
                     st.markdown("### Tailored Resume:")
-                    # display_doc_as_image2(gen_pdf_path)
                     # display_pdf_pages_as_images(gen_pdf_path)
-                    # st.write(generated_resume)
-                    display_content_with_page_numbers(generated_resume, 290)
                     st.success(f"Download tailored resume")
                     st.download_button(
                         label="Generated Resume (PDF)",
                         data=open(gen_pdf_path, 'rb').read(),
-                        file_name="generated_resume.pdf",
                         mime="application/pdf"
                         )
                     st.download_button(
@@ -653,94 +470,7 @@ if uploaded_resume and uploaded_job_description:
                 #         mime="application/vnd.openxmlformats-officedocument.wordprocessingml.document"
                 #     )
-                    # from io import BytesIO
-                    # doc = Document()
-                    # with tempfile.NamedTemporaryFile(delete=False, suffix=".docx") as temp_doc:
-                    #     temp_doc_path = temp_doc.name
-                    #     doc.save(temp_doc_path)
-                    # Convert the DOCX to PDF and display
-                    # pdf_path = '/tmp/generated_resume.pdf'
-                    # save_docx_as_pdf(temp_doc_path, pdf_path)
-                    # # Now pass the path to any function that expects a file path
-                    # pdf_path = '/tmp/generated_resume.pdf'
-                    # save_bytes_as_pdf(temp_doc_path, pdf_path)
-                    # # Display the generated PDF or handle further processing
-                    # display_doc_as_image(pdf_path)
-                    # with tempfile.NamedTemporaryFile(suffix='.docx') as temp_doc:
-                    #     doc = Document()
-                    #     doc.add_paragraph(generated_resume)
-                    #     # doc.save(temp_doc.name)
-                    #     # resume_bytes = BytesIO()
-                    #     # doc.save(resume_bytes)
-                    #     # resume_bytes.seek(0)
-                    #     # Convert DOCX to PDF
-                    #     # pdf_path = f"temp_{os.path.basename(temp_doc.name)}.pdf"
-                    #     # convert(temp_doc.name, pdf_path)
-                    #     # save_docx_as_pdf(temp_doc.name, pdf_path)
-                    #     pdf_path = '/tmp/generated_resume.docx'
-                    #     doc.save(pdf_path)
-                    #     # pdf_path = save_uploaded_file(resume_bytes)
-                    #     save_docx_as_pdf(generated_resume, pdf_path)
-                    #     # Display resumes side by side
-                    #     col1, col2 = st.columns(2)
-                    #     with col1:
-                    #         st.write("Uploaded Resume:")
-                    #         if resume_path:
-                    #             display_doc_as_image(resume_path)
-                    #         else:
-                    #             st.warning("No resume file found")
-                    #     with col2:
-                    #         st.write("Generated Resume:")
-                    #         if pdf_path:
-                    #             display_doc_as_image(pdf_path)
-                    #         else:
-                    #             st.warning("No generated resume file found")
-                    # Allow users to download both PDFs
-                    # st.download_button(
-                    #     label="Download Uploaded Resume",
-                    #     data=resume_bytes,
-                    #     file_name="uploaded_resume.pdf",
-                    #     mime="application/pdf"
-                    # )
-                    # doc = Document()
-                    # doc.add_paragraph(generated_resume)
-                    # resume_bytes = BytesIO()
-                    # doc.save(resume_bytes)
-                    # resume_bytes.seek(0)
-                    # gen_resume_path = save_uploaded_file(resume_bytes)
-                    # # uploaded_resume_path = save_uploaded_file(resume)
-                    # col1, col2 = st.columns(2)
-                    # with col1:
-                    #     save_docx_as_pdf(resume_path, 'uploaded_resume.pdf')
-                    #     display_doc_as_image('uploaded_resume.pdf')
-                    # with col2:
-                    #     st.markdown("### Tailored Resume:")
-                    #     save_docx_as_pdf(gen_resume_path, 'tailored_resume.pdf')
-                    #     display_doc_as_image('tailored_resume.pdf')
-                    # st.download_button(
-                    #     label="Download Resume",
-                    #     data=resume_bytes,
-                    #     file_name="tailored_resume.docx",
-                    #     mime="application/vnd.openxmlformats-officedocument.wordprocessingml.document"
-                    # )
 else:
     st.warning("Please upload both the resume and job description files.")

 import docx
 import numpy as np
 import pypandoc
+import streamlit.components.v1 as components
 # Create temporary directories
 temp_dir = tempfile.mkdtemp()
         .stButton>:active, focus {
          box-shadow: none;
          transform: translateY(0);
+         color: #fff;
+         border: none !important;
+         outline: none;
         }
     </style>
 """, unsafe_allow_html=True)
 # Add ResumeMagic Logo
 st.markdown('<div class="logo-container"></div>', unsafe_allow_html=True)
 st.image("logo.jpeg", width=80)
 st.markdown('</div>', unsafe_allow_html=True)
         end_index = start_index + words_per_page
         page_content = ' '.join(words[start_index:end_index])
+        st.markdown(f"#### Page {i + 1}")
         st.write(page_content)
 def save_docx_as_pdf(input_path, output_path='output.pdf'):
         shutil.copy(input_path, output_path)
     else:
         raise ValueError("Unsupported file format. Please upload a .docx or .pdf file.")
 # def save_docx_as_pdf(input_path, output_path='output.pdf'):
 #     if input_path.lower().endswith('.docx'):
 #     else:
 #         raise ValueError("Unsupported file format. Please upload a .docx or .pdf file.")
 def save_docx_as_pdf1(input_path, output_path='output.pdf'):
     if input_path.lower().endswith('.docx'):
         from docx2pdf import convert
     else:
         raise ValueError("Unsupported file format. Please upload a .docx or .pdf file.")
 def display_pdf_page1(pdf_path):
     try:
     try:
         with pdfplumber.open(pdf_path) as pdf:
             for i, page in enumerate(pdf.pages):
+                st.markdown(f"#### Page {i + 1}")
                 # Convert the page to an image
                 image = page.to_image()
                 # Render the image using Streamlit
     # Display the image
     display(img)
+def display_doc_as_image2(pdf_path):
     iframe_code = f"""
     <iframe src="{pdf_path}" width="100%" height="600px"></iframe>
     """
     st.markdown(iframe_code, unsafe_allow_html=True)
 # Process if files are uploaded
 if uploaded_resume and uploaded_job_description:
     # Save files
             # st.write(generated_resume)
             #Autoscroll
+            components.html("""
                 <script>
+                    window.onload = function() {
+                        window.scrollTo(0, document.body.scrollHeight);
+                    };
                 </script>
+            """)
             # with st.spinner("Computing Match"):
                 with col1:
                     st.markdown("### Uploaded Resume:")
                     save_docx_as_pdf(resume_path, '/tmp/uploaded_resume.pdf')
                     display_pdf_pages_as_images(resume_path)
                 with col2:
                     st.markdown("### Tailored Resume:")
                     # display_pdf_pages_as_images(gen_pdf_path)
+                    st.write(generated_resume)
+                    # display_content_with_page_numbers(generated_resume, 290)
                     st.success(f"Download tailored resume")
                     st.download_button(
                         label="Generated Resume (PDF)",
                         data=open(gen_pdf_path, 'rb').read(),
+                        file_name="tailored_resume.pdf",
                         mime="application/pdf"
                         )
                     st.download_button(
                 #         mime="application/vnd.openxmlformats-officedocument.wordprocessingml.document"
                 #     )
 else:
     st.warning("Please upload both the resume and job description files.")