Spaces:
Sleeping
Sleeping
Jonah Ramponi
committed on
Commit
•
0c94c61
1
Parent(s):
98eaa40
Cleanup
Browse files- .streamlit/config.toml +2 -0
- CVReview.py +113 -0
- Interview.py +75 -0
- app.py +74 -180
- assets/logo.png +0 -0
- backend.py → utils/backend.py +10 -4
- utils/format.py +9 -88
- utils/gpt.py +10 -16
- utils/process_doc.py +5 -7
- utils/prompts.py +0 -17
.streamlit/config.toml
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
[client]
|
2 |
+
showSidebarNavigation = false
|
CVReview.py
ADDED
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
"""
|
2 |
+
CV Review Feature
|
3 |
+
"""
|
4 |
+
|
5 |
+
import json
|
6 |
+
import concurrent.futures
|
7 |
+
from httpx import LocalProtocolError
|
8 |
+
|
9 |
+
import streamlit as st
|
10 |
+
from cohere.core.api_error import ApiError
|
11 |
+
|
12 |
+
from utils.backend import produce_report
|
13 |
+
from utils.format import extract_json
|
14 |
+
|
15 |
+
|
16 |
+
def generate_markdown_report(REPORT_OBJ: dict) -> str:
    """Render the report object dictionary as a human-readable markdown report.

    The report starts with a header (name, job, description), then one table
    section per category that has rows, and ends with a horizontal rule.
    """

    # Shared column header for every category table.
    TABLE_HEADER = (
        "| Job Posting Requirement | CV Details | Explanation | Impact Score |\n"
        "| ----------------------- | ---------- | ----------- | -------------- |\n"
    )

    def render_section(title: str, rows: list) -> str:
        """Return a markdown table section for one category; empty string when there are no rows."""
        if not rows:
            return ""

        body = "".join(
            f"| {row.get('jobPostingDetails', 'N/A')} | {row.get('cvDetails', 'N/A')} | {row.get('explanation', '')} | **{row.get('severityScore', 0)}** |\n"
            for row in rows
        )
        return f"### {title.title()}\n\n" + TABLE_HEADER + body + "\n"

    header = (
        f"# CV Analysis Report\n\n"
        f"**Name:** {REPORT_OBJ.get('personName', 'Unknown')} \n"
        f"**Job:** {REPORT_OBJ.get('jobTitle', 'N/A')} at {REPORT_OBJ.get('companyName', 'N/A')} \n"
        f"**Job Description:** {REPORT_OBJ.get('jobDesc', 'No description available.')}\n\n"
        "---\n\n"
        "## Key Findings\n\n"
    )

    # Fixed category order; categories absent from the report are skipped.
    category_names = ["experience", "education", "responsibilities", "languages", "tools"]
    rendered = [
        render_section(category, REPORT_OBJ.get(category, []))
        for category in category_names
    ]

    return header + "".join(rendered) + "---\n"
51 |
+
|
52 |
+
def CVReviewPage():
    """Source Code for CV Review Page.

    Renders a button that, when pressed, fans out three parallel backend calls
    (one per critique type), merges the JSON fragments they return into one
    report object, then displays the report and offers a JSON download.
    """

    SHARED_STATE = st.session_state.shared_materials
    API_KEY = st.session_state.api_key

    # NOTE: this local must NOT be named `produce_report` — the original code
    # did that and shadowed the imported backend function, so the executor was
    # handed the button's bool instead of a callable (TypeError on .result()).
    report_requested = st.button("Produce Suitability Report")

    if report_requested:
        # Consistent with InterviewPage: both inputs must be uploaded first.
        if not SHARED_STATE.get("valid_flag"):
            st.error("You need to upload a Job Description & CV to use this feature.")
        else:
            try:
                results = {}
                # We will make 3 calls in parallel, to get various bits of information efficiently
                with concurrent.futures.ThreadPoolExecutor() as executor:
                    futures = {
                        critique_type: executor.submit(
                            produce_report,
                            SHARED_STATE["cv"],
                            SHARED_STATE["job_posting"],
                            critique_type,
                            API_KEY,
                        )
                        for critique_type in ["basic", "general", "specific"]
                    }

                    for critique_type, future in futures.items():
                        results[critique_type] = future.result()

                # Merge the outputs from our calls, by extracting the json object
                # from each gpt message. Kept inside the try so a failed call
                # doesn't overwrite an existing report with a partial one.
                resultsDict = {}
                for jsonText in results.values():
                    _, output_report_json = extract_json(jsonText)
                    resultsDict.update(output_report_json)

                # store this as the report object
                SHARED_STATE["report"] = resultsDict
            except LocalProtocolError:
                st.error("You need to enter a Cohere API Key.")
            except ApiError:
                st.error("You need a valid Cohere API Key")

    # if the report object exists, render it and offer a download
    if SHARED_STATE["report"]:
        REPORT = SHARED_STATE["report"]

        # these are used for file naming
        name = REPORT.get("personName", "MissingPersonName")
        job_title = REPORT.get("jobTitle", "MissingTitle")
        company_name = REPORT.get("companyName", "MissingCompany")

        # render markdown report
        st.markdown(generate_markdown_report(REPORT))

        # Downloadable in json form !
        st.download_button(
            label="Download Report JSON",
            data=json.dumps(REPORT, indent=4),
            file_name=f"{name}_{job_title}_{company_name}.json",
            mime="application/json",
            use_container_width=True,
        )
|
Interview.py
ADDED
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
"""
|
2 |
+
Simulates an interview, using uploaded CV and Job Description
|
3 |
+
"""
|
4 |
+
|
5 |
+
import random
|
6 |
+
import streamlit as st
|
7 |
+
from httpx import LocalProtocolError
|
8 |
+
|
9 |
+
from cohere.core.api_error import ApiError
|
10 |
+
|
11 |
+
|
12 |
+
from utils.gpt import stream
|
13 |
+
|
14 |
+
|
15 |
+
def InterviewPage():
    """Source Code for the Interview Simulation Page.

    Chat UI: the assistant opens with a random prompt; each user message is
    answered by streaming a Cohere response grounded in the uploaded CV and
    job posting.
    """

    initial_questions = [
        "Ready for me to grill you?",
        "Please let me know when you're ready to begin the interview",
        "Ready to rumble?",
    ]

    # the initial message will be a random choice, initiating the conversation
    if "messages" not in st.session_state:
        st.session_state["messages"] = [
            {"role": "assistant", "message": random.choice(initial_questions)}
        ]

    MESSAGES = st.session_state.messages
    SHARED_STATE = st.session_state.shared_materials
    API_KEY = st.session_state.api_key

    clear_conversation = st.button("Clear Conversation")

    # Clear conversation resets message state with a new random opener.
    if clear_conversation:
        st.session_state["messages"] = [
            {"role": "assistant", "message": random.choice(initial_questions)}
        ]
        # Rebind the local alias — previously it still pointed at the old
        # list, so the cleared history was rendered for one more run.
        MESSAGES = st.session_state.messages

    if not SHARED_STATE["valid_flag"]:
        st.error("You need to upload a Job Description & CV to use this feature.")
    else:
        try:
            # Populate the chat with historic messages
            for msg in MESSAGES:
                st.chat_message(msg["role"]).write(msg["message"])

            if user_input := st.chat_input():

                # Write the user question to UI
                st.chat_message("user").write(user_input)

                # Record the user turn BEFORE streaming, so the model's
                # chat_history includes the question it is answering.
                # (Previously it was appended after streaming; the pre-refactor
                # app.py appended before streaming, which this restores.)
                MESSAGES.append({"role": "user", "message": user_input})

                assistant_message = st.chat_message("assistant")

                # Stream assistant message, using relevant background information
                response = assistant_message.write_stream(
                    stream(
                        background_info={
                            "cv": SHARED_STATE["cv"],
                            "job_posting": SHARED_STATE["job_posting"],
                        },
                        chat_history=MESSAGES,
                        api_key=API_KEY,
                    )
                )

                # Append the assistant reply to chat history
                MESSAGES.append({"role": "assistant", "message": response})
        except LocalProtocolError:
            st.error("You need to enter a Cohere API Key.")
        except ApiError:
            st.error("You need a valid Cohere API Key")
|
app.py
CHANGED
@@ -2,191 +2,85 @@
|
|
2 |
For HF, the interface should be called app.py
|
3 |
"""
|
4 |
|
5 |
-
import
|
6 |
-
import random
|
7 |
-
import concurrent.futures
|
8 |
-
|
9 |
import streamlit as st
|
10 |
|
11 |
-
from backend import paired_critique
|
12 |
-
|
13 |
from utils.process_doc import parse_docx, parse_pdf
|
14 |
-
from utils.gpt import test_api_key, gpt_stream_response_chat_history
|
15 |
-
from utils.format import extract_json, generate_markdown_report
|
16 |
-
|
17 |
-
st.set_page_config(layout="wide")
|
18 |
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
24 |
)
|
25 |
|
26 |
-
|
27 |
-
st.session_state.state = {"successful_report_flag": True, "paired_report": {}}
|
28 |
-
|
29 |
-
STATE = st.session_state.state
|
30 |
-
|
31 |
-
# Weird Hugging Face display issue, padding fixes it
|
32 |
-
st.markdown("\n")
|
33 |
-
st.markdown("\n")
|
34 |
-
st.markdown("\n")
|
35 |
-
|
36 |
-
cv_upload_box = st.file_uploader(
|
37 |
-
"CV Upload Box",
|
38 |
-
help="Upload your CV in .docx or .pdf form. This CV will be parsed, and used to analyse against the given job post.",
|
39 |
-
type=["docx", "pdf"],
|
40 |
-
accept_multiple_files=False,
|
41 |
-
)
|
42 |
-
job_posting_upload_box = st.text_area(
|
43 |
-
"Job Description Upload Box",
|
44 |
-
value="""Job description
|
45 |
-
As a Data Scientist at Meta, you will shape the future of people-facing and business-facing products we build across our entire family of applications (Facebook, Instagram, Messenger, WhatsApp, Oculus). By applying your technical skills, analytical mindset, and product intuition to one of the richest data sets in the world, you will help define the experiences we build for billions of people and hundreds of millions of businesses around the world. You will collaborate on a wide array of product and business problems with a diverse set of cross-functional partners across Product, Engineering, Research, Data Engineering, Marketing, Sales, Finance and others. You will use data and analysis to identify and solve product development’s biggest challenges. You will influence product strategy and investment decisions with data, be focused on impact, and collaborate with other teams. By joining Meta, you will become part of a world-class analytics community dedicated to skill development and career growth in analytics and beyond.Product leadership: You will use data to shape product development, quantify new opportunities, identify upcoming challenges, and ensure the products we build bring value to people, businesses, and Meta. You will help your partner teams prioritize what to build, set goals, and understand their product’s ecosystem.Analytics: You will guide teams using data and insights. You will focus on developing hypotheses and employ a diverse toolkit of rigorous analytical approaches, different methodologies, frameworks, and technical approaches to test them.Communication and influence: You won’t simply present data, but tell data-driven stories. You will convince and influence your partners using clear insights and recommendations. You will build credibility through structure and clarity, and be a trusted strategic partner.
|
46 |
-
|
47 |
-
Data Scientist, Product Analytics Responsibilities:
|
48 |
-
|
49 |
-
Work with large and complex data sets to solve a wide array of challenging problems using different analytical and statistical approaches.
|
50 |
-
Apply technical expertise with quantitative analysis, experimentation, data mining, and the presentation of data to develop strategies for our products that serve billions of people and hundreds of millions of businesses.
|
51 |
-
Identify and measure success of product efforts through goal setting, forecasting, and monitoring of key product metrics to understand trends.
|
52 |
-
Define, understand, and test opportunities and levers to improve the product, and drive roadmaps through your insights and recommendations.
|
53 |
-
Partner with Product, Engineering, and cross-functional teams to inform, influence, support, and execute product strategy and investment decisions.
|
54 |
-
|
55 |
-
Minimum Qualifications:
|
56 |
-
|
57 |
-
A minimum of 6 years of work experience in analytics (minimum of 4 years with a Ph.D.).
|
58 |
-
Bachelor's degree in Mathematics, Statistics, a relevant technical field, or equivalent practical experience.
|
59 |
-
Experience with data querying languages (e.g. SQL), scripting languages (e.g. Python), and/or statistical/mathematical software (e.g. R).
|
60 |
|
61 |
-
Preferred Qualifications:
|
62 |
-
|
63 |
-
Masters or Ph.D. Degree in a quantitative field.
|
64 |
-
|
65 |
-
About Meta:
|
66 |
-
|
67 |
-
Meta builds technologies that help people connect, find communities, and grow businesses. When Facebook launched in 2004, it changed the way people connect. Apps like Messenger, Instagram and WhatsApp further empowered billions around the world. Now, Meta is moving beyond 2D screens toward immersive experiences like augmented and virtual reality to help build the next evolution in social technology. People who choose to build their careers by building with us at Meta help shape a future that will take us beyond what digital connection makes possible today—beyond the constraints of screens, the limits of distance, and even the rules of physics.
|
68 |
-
|
69 |
-
Individual compensation is determined by skills, qualifications, experience, and location. Compensation details listed in this posting reflect the base hourly rate, monthly rate, or annual salary only, and do not include bonus, equity or sales incentives, if applicable. In addition to base compensation, Meta offers benefits. Learn more about benefits at Meta.""",
|
70 |
-
placeholder="Copy and Paste a job post you are interested in. Make sure to include the full post! More information is better.",
|
71 |
-
help="In this box, please dump text content for a job description you are interested in. This could easily be setup to work directly with a webpage (we'd simply need to scrape said page) however I do not want to do that on HF spaces.",
|
72 |
-
)
|
73 |
-
|
74 |
-
if cv_upload_box and job_posting_upload_box != "":
|
75 |
-
STATE["job_posting"] = job_posting_upload_box
|
76 |
-
|
77 |
-
cv_filetype = cv_upload_box.name.split(".")[-1]
|
78 |
-
cv_file_contents = cv_upload_box.getvalue()
|
79 |
-
|
80 |
-
STATE["cv"] = (
|
81 |
-
parse_docx(cv_file_contents)
|
82 |
-
if cv_filetype == "docx"
|
83 |
-
else parse_pdf(cv_file_contents)
|
84 |
-
)
|
85 |
-
cv_critique, practice_interview, general_cv_critique = st.tabs(
|
86 |
-
["Role Specific CV Critique", "Practice Interview", "General CV Critique"]
|
87 |
-
)
|
88 |
|
89 |
-
|
90 |
-
|
91 |
-
if produce_report:
|
92 |
-
|
93 |
-
# Make 3 calls in parallel
|
94 |
-
with concurrent.futures.ThreadPoolExecutor() as executor:
|
95 |
-
future1 = executor.submit(
|
96 |
-
paired_critique,
|
97 |
-
STATE["cv"],
|
98 |
-
STATE["job_posting"],
|
99 |
-
"basic",
|
100 |
-
COHERE_API_KEY,
|
101 |
-
)
|
102 |
-
|
103 |
-
future2 = executor.submit(
|
104 |
-
paired_critique,
|
105 |
-
STATE["cv"],
|
106 |
-
STATE["job_posting"],
|
107 |
-
"general",
|
108 |
-
COHERE_API_KEY,
|
109 |
-
)
|
110 |
-
|
111 |
-
future3 = executor.submit(
|
112 |
-
paired_critique,
|
113 |
-
STATE["cv"],
|
114 |
-
STATE["job_posting"],
|
115 |
-
"specific",
|
116 |
-
COHERE_API_KEY,
|
117 |
-
)
|
118 |
-
|
119 |
-
basic_details_out = future1.result()
|
120 |
-
general_details_out = future2.result()
|
121 |
-
specific_details_out = future3.result()
|
122 |
-
|
123 |
-
# merge the outputs
|
124 |
-
resultsDict = {}
|
125 |
-
for jsonText in [
|
126 |
-
basic_details_out,
|
127 |
-
general_details_out,
|
128 |
-
specific_details_out,
|
129 |
-
]:
|
130 |
-
valid_json_flag, output_report_json = extract_json(jsonText)
|
131 |
-
|
132 |
-
if not valid_json_flag:
|
133 |
-
STATE["successful_report_flag"] = False
|
134 |
-
|
135 |
-
resultsDict.update(output_report_json)
|
136 |
-
|
137 |
-
STATE["paired_report"] = resultsDict
|
138 |
-
|
139 |
-
if STATE["successful_report_flag"] and STATE["paired_report"]:
|
140 |
-
|
141 |
-
paired_report = STATE["paired_report"]
|
142 |
-
|
143 |
-
name = paired_report.get("personName", "MissingPersonName")
|
144 |
-
job_title = paired_report.get("jobTitle", "MissingTitle")
|
145 |
-
company_name = paired_report.get("companyName", "MissingCompany")
|
146 |
-
|
147 |
-
with cv_critique:
|
148 |
-
st.markdown(generate_markdown_report(STATE["paired_report"]))
|
149 |
-
|
150 |
-
st.download_button(
|
151 |
-
label="Download Report JSON",
|
152 |
-
data=json.dumps(STATE["paired_report"], indent=4),
|
153 |
-
file_name=f"{name}_{job_title}_{company_name}.json",
|
154 |
-
mime="application/json",
|
155 |
-
use_container_width=True,
|
156 |
-
)
|
157 |
-
|
158 |
-
# Streaming Chatbot !!!
|
159 |
-
with practice_interview:
|
160 |
-
initial_questions = [
|
161 |
-
"What do you think is the biggest reason you're unsuitable for the role?",
|
162 |
-
"Why are you interested in this role specifically?",
|
163 |
-
"What do you know about the company?",
|
164 |
-
]
|
165 |
-
|
166 |
-
if "messages" not in st.session_state:
|
167 |
-
st.session_state["messages"] = [
|
168 |
-
{"role": "assistant", "message": random.choice(initial_questions)}
|
169 |
-
]
|
170 |
-
|
171 |
-
# Populate the chat with historic messages
|
172 |
-
for msg in st.session_state.messages:
|
173 |
-
st.chat_message(msg["role"]).write(msg["message"])
|
174 |
-
|
175 |
-
if prompt := st.chat_input():
|
176 |
-
st.session_state.messages.append({"role": "user", "message": prompt})
|
177 |
-
st.chat_message("user").write(prompt)
|
178 |
-
|
179 |
-
assistant_message = st.chat_message("assistant")
|
180 |
-
|
181 |
-
response = assistant_message.write_stream(
|
182 |
-
gpt_stream_response_chat_history(
|
183 |
-
st.session_state.messages,
|
184 |
-
background_info={
|
185 |
-
"cv": STATE["cv"],
|
186 |
-
"job_posting": STATE["job_posting"],
|
187 |
-
},
|
188 |
-
api_key=COHERE_API_KEY,
|
189 |
-
)
|
190 |
-
)
|
191 |
-
|
192 |
-
st.session_state.messages.append({"role": "assistant", "message": response})
|
|
|
2 |
For HF, the interface should be called app.py
|
3 |
"""
|
4 |
|
5 |
+
import pathlib
|
|
|
|
|
|
|
6 |
import streamlit as st
|
7 |
|
|
|
|
|
8 |
from utils.process_doc import parse_docx, parse_pdf
|
|
|
|
|
|
|
|
|
9 |
|
10 |
+
from Interview import InterviewPage
|
11 |
+
from CVReview import CVReviewPage
|
12 |
+
|
13 |
+
CURRENT_DIR = pathlib.Path(__file__).parent.resolve()
|
14 |
+
|
15 |
+
|
16 |
+
def main():
    """App entry point: collects shared inputs in the sidebar, then routes
    between the Practice Interview and CV Review pages via st.navigation."""
    st.set_page_config(layout="wide")

    # --- session-state defaults (survive Streamlit reruns) ---
    if "api_key" not in st.session_state:
        st.session_state.api_key = ""

    if "report" not in st.session_state:
        st.session_state.report = {}

    # shared_materials carries the parsed CV / job posting between pages;
    # valid_flag flips True once both inputs have been provided.
    if "shared_materials" not in st.session_state:
        st.session_state.shared_materials = {"valid_flag": False, "report": None}

    SHARED_MATERIALS = st.session_state.shared_materials

    # All shared inputs live in the sidebar so every page can use them.
    # NOTE(review): the exact sidebar scope is reconstructed from a mangled
    # diff — confirm which widgets sit inside `with st.sidebar:` upstream.
    with st.sidebar:
        st.session_state["api_key"] = st.text_input(
            "Cohere API Key Entry",
            value="",
            placeholder="Enter your Free Tier Cohere API Key",
        )

        job_posting_upload_box = st.text_area(
            "Job Description Upload Box",
            value="",
            placeholder="Copy and Paste the contents of a job post you are interested in.",
            help="In this box, please dump text content for a job description you are interested in. This could easily be setup to work directly with a webpage (we'd simply need to scrape said page) however I do not want to do that on HF spaces.",
        )

        cv_upload_box = st.file_uploader(
            "CV Upload Box",
            help="Upload your CV in .docx or .pdf form. This CV will be parsed, and used to analyse against the given job post.",
            type=["docx", "pdf"],
            accept_multiple_files=False,
        )

        # Only mark the shared state valid once BOTH inputs are present.
        if cv_upload_box and job_posting_upload_box != "":
            SHARED_MATERIALS["job_posting"] = job_posting_upload_box

            # Dispatch on the uploaded file's extension.
            cv_filetype = cv_upload_box.name.split(".")[-1]
            cv_file_contents = cv_upload_box.getvalue()

            SHARED_MATERIALS["cv"] = (
                parse_docx(cv_file_contents)
                if cv_filetype == "docx"
                else parse_pdf(cv_file_contents)
            )

            SHARED_MATERIALS["valid_flag"] = True

    # Multipage routing: sidebar nav entries for the two feature pages.
    pg = st.navigation(
        {
            "Job Search AI Tools": [
                st.Page(
                    InterviewPage,
                    title="Practice Interview",
                    icon=":material/chat:",
                ),
                st.Page(
                    CVReviewPage,
                    title="CV Review",
                    icon=":material/description:",
                ),
            ],
        }
    )

    pg.run()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
83 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
84 |
|
85 |
+
if __name__ == "__main__":
|
86 |
+
main()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
assets/logo.png
ADDED
backend.py → utils/backend.py
RENAMED
@@ -1,3 +1,7 @@
|
|
|
|
|
|
|
|
|
|
1 |
from utils.prompts import (
|
2 |
basic_details_extraction_prompt,
|
3 |
general_skils_extraction_prompt,
|
@@ -13,13 +17,15 @@ prompt_mapping = {
|
|
13 |
}
|
14 |
|
15 |
|
16 |
-
def
|
17 |
-
cv_contents: str, job_post_contents: str,
|
18 |
) -> str:
|
19 |
"""Process CV contents, using Cohere"""
|
20 |
|
|
|
|
|
21 |
# First, get the prompt from the prompt dict
|
22 |
-
prompt = prompt_mapping.get(
|
23 |
|
24 |
# Now, populate with the contents of the CV and job posting
|
25 |
prompt = prompt.replace("<cv>", cv_contents).replace(
|
@@ -43,5 +49,5 @@ if __name__ == "__main__":
|
|
43 |
|
44 |
COHERE_API_KEY = ""
|
45 |
|
46 |
-
output =
|
47 |
print(output)
|
|
|
1 |
+
"""
|
2 |
+
Main Backend Handling Function
|
3 |
+
"""
|
4 |
+
|
5 |
from utils.prompts import (
|
6 |
basic_details_extraction_prompt,
|
7 |
general_skils_extraction_prompt,
|
|
|
17 |
}
|
18 |
|
19 |
|
20 |
+
def produce_report(
|
21 |
+
cv_contents: str, job_post_contents: str, PROMPT_TO_USE: str, API_KEY: str
|
22 |
) -> str:
|
23 |
"""Process CV contents, using Cohere"""
|
24 |
|
25 |
+
# The KEY ARGUMENT here is PROMPT_TO_USE, which controls the prompt to use
|
26 |
+
|
27 |
# First, get the prompt from the prompt dict
|
28 |
+
prompt = prompt_mapping.get(PROMPT_TO_USE)
|
29 |
|
30 |
# Now, populate with the contents of the CV and job posting
|
31 |
prompt = prompt.replace("<cv>", cv_contents).replace(
|
|
|
49 |
|
50 |
COHERE_API_KEY = ""
|
51 |
|
52 |
+
output = produce_report(post_contents, cv_contents, "specific", COHERE_API_KEY)
|
53 |
print(output)
|
utils/format.py
CHANGED
@@ -1,7 +1,8 @@
|
|
1 |
import json
|
|
|
2 |
|
3 |
|
4 |
-
def extract_json(input_string: str) -> dict:
|
5 |
"""String to Json function"""
|
6 |
|
7 |
# First, ensure we remove json wrapper
|
@@ -21,98 +22,14 @@ def extract_json(input_string: str) -> dict:
|
|
21 |
return False, {}
|
22 |
|
23 |
|
24 |
-
def generate_markdown_report(data):
|
25 |
-
# Header
|
26 |
-
report = f"# CV Analysis Report\n\n"
|
27 |
-
report += f"**Name:** {data.get('personName', 'Unknown')} \n"
|
28 |
-
report += f"**Job:** {data.get('jobTitle', 'N/A')} at {data.get('companyName', 'N/A')} \n"
|
29 |
-
report += (
|
30 |
-
f"**Job Description:** {data.get('jobDesc', 'No description available.')}\n\n"
|
31 |
-
)
|
32 |
-
report += "---\n\n"
|
33 |
-
report += "## Key Findings\n\n"
|
34 |
-
|
35 |
-
experiences = data.get("experience", [])
|
36 |
-
if experiences:
|
37 |
-
|
38 |
-
report += "### Experience\n\n"
|
39 |
-
report += (
|
40 |
-
"| Job Posting Requirement | CV Details | Explanation | Impact Score |\n"
|
41 |
-
)
|
42 |
-
report += (
|
43 |
-
"| ----------------------- | ---------- | ----------- | -------------- |\n"
|
44 |
-
)
|
45 |
-
for exp in experiences:
|
46 |
-
report += f"| {exp.get('jobPostingDetails', 'N/A')} | {exp.get('cvDetails', 'N/A')} | {exp.get('explanation', '')} | **{exp.get('severityScore', 0)}** |\n"
|
47 |
-
report += "\n"
|
48 |
-
|
49 |
-
education = data.get("education", [])
|
50 |
-
if education:
|
51 |
-
report += "### Education\n\n"
|
52 |
-
report += (
|
53 |
-
"| Job Posting Requirement | CV Details | Explanation | Impact Score |\n"
|
54 |
-
)
|
55 |
-
report += (
|
56 |
-
"| ----------------------- | ---------- | ----------- | -------------- |\n"
|
57 |
-
)
|
58 |
-
for edu in education:
|
59 |
-
report += f"| {edu.get('jobPostingDetails', 'N/A')} | {edu.get('cvDetails', 'N/A')} | {edu.get('explanation', '')} | **{edu.get('severityScore', 0)}** |\n"
|
60 |
-
report += "\n"
|
61 |
-
|
62 |
-
responsibilities = data.get("responsibilities", [])
|
63 |
-
if responsibilities:
|
64 |
-
report += "### Responsibilities\n\n"
|
65 |
-
report += (
|
66 |
-
"| Job Posting Requirement | CV Details | Explanation | Impact Score |\n"
|
67 |
-
)
|
68 |
-
report += (
|
69 |
-
"| ----------------------- | ---------- | ----------- | -------------- |\n"
|
70 |
-
)
|
71 |
-
for resp in responsibilities:
|
72 |
-
report += f"| {resp.get('jobPostingDetails', 'N/A')} | {resp.get('cvDetails', 'N/A')} | {resp.get('explanation', '')} | **{resp.get('severityScore', 0)}** |\n"
|
73 |
-
report += "\n"
|
74 |
-
|
75 |
-
languages = data.get("languages", [])
|
76 |
-
if languages:
|
77 |
-
report += "### Languages\n\n"
|
78 |
-
report += (
|
79 |
-
"| Job Posting Requirement | CV Details | Explanation | Impact Score |\n"
|
80 |
-
)
|
81 |
-
report += (
|
82 |
-
"| ----------------------- | ---------- | ----------- | -------------- |\n"
|
83 |
-
)
|
84 |
-
for lang in languages:
|
85 |
-
report += f"| {lang.get('jobPostingDetails', 'N/A')} | {lang.get('cvDetails', 'N/A')} | {lang.get('explanation', '')} | **{lang.get('severityScore', 0)}** |\n"
|
86 |
-
report += "\n"
|
87 |
-
|
88 |
-
# Tools
|
89 |
-
tools = data.get("tools", [])
|
90 |
-
if tools:
|
91 |
-
report += "### Tools\n\n"
|
92 |
-
report += (
|
93 |
-
"| Job Posting Requirement | CV Details | Explanation | Impact Score |\n"
|
94 |
-
)
|
95 |
-
report += (
|
96 |
-
"| ----------------------- | ---------- | ----------- | -------------- |\n"
|
97 |
-
)
|
98 |
-
for tool in tools:
|
99 |
-
report += f"| {tool.get('jobPostingDetails', 'N/A')} | {tool.get('cvDetails', 'N/A')} | {tool.get('explanation', '')} | **{tool.get('severityScore', 0)}** |\n"
|
100 |
-
report += "\n"
|
101 |
-
|
102 |
-
# Closing
|
103 |
-
report += "---\n"
|
104 |
-
|
105 |
-
return report
|
106 |
-
|
107 |
-
|
108 |
def format_chat_history_cohere(chat_history: list, background_info: dict) -> list:
|
109 |
"""Takes streamlit chat history, and converts to cohere format"""
|
110 |
|
111 |
-
# Could use cohere to track history, maybe for the future
|
112 |
new_output = [
|
113 |
{
|
114 |
"role": "USER",
|
115 |
-
"message": f"Hi there! Here is my CV! {background_info['cv']}.\n\n I'd like you to act as a senior technical recruiter
|
116 |
},
|
117 |
{
|
118 |
"role": "CHATBOT",
|
@@ -124,6 +41,7 @@ def format_chat_history_cohere(chat_history: list, background_info: dict) -> lis
|
|
124 |
},
|
125 |
]
|
126 |
|
|
|
127 |
for item in chat_history:
|
128 |
new_output.append(
|
129 |
{
|
@@ -137,6 +55,9 @@ def format_chat_history_cohere(chat_history: list, background_info: dict) -> lis
|
|
137 |
|
138 |
if __name__ == "__main__":
|
139 |
example_json = """
|
140 |
-
|
|
|
|
|
|
|
141 |
"""
|
142 |
extract_json(example_json)
|
|
|
1 |
import json
|
2 |
+
from typing import Union
|
3 |
|
4 |
|
5 |
+
def extract_json(input_string: str) -> Union[bool, dict]:
|
6 |
"""String to Json function"""
|
7 |
|
8 |
# First, ensure we remove json wrapper
|
|
|
22 |
return False, {}
|
23 |
|
24 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
def format_chat_history_cohere(chat_history: list, background_info: dict) -> list:
|
26 |
"""Takes streamlit chat history, and converts to cohere format"""
|
27 |
|
28 |
+
# TODO: Could use cohere to track history, maybe for the future
|
29 |
new_output = [
|
30 |
{
|
31 |
"role": "USER",
|
32 |
+
"message": f"Hi there! Here is my CV! {background_info['cv']}.\n\n I'd like you to act as a senior technical recruiter. Critique my CV and its' suitability for the role. You may only ask me one question at a time. Be as critical of the CV as possible, really focus on the CV and its relevance to the role. Ask about inconsistencies, mistakes in grammar, things which are technically not quite right suggesting a misunderstanding, or ask me to justify claims I make in my CV. You could also ask specific technical details about the architectures I have used.",
|
33 |
},
|
34 |
{
|
35 |
"role": "CHATBOT",
|
|
|
41 |
},
|
42 |
]
|
43 |
|
44 |
+
# Lazy approach to format it correctly for cohere input!
|
45 |
for item in chat_history:
|
46 |
new_output.append(
|
47 |
{
|
|
|
55 |
|
56 |
if __name__ == "__main__":
|
57 |
example_json = """
|
58 |
+
```json
|
59 |
+
{
|
60 |
+
"dogs": "are blue?"
|
61 |
+
}
|
62 |
"""
|
63 |
extract_json(example_json)
|
utils/gpt.py
CHANGED
@@ -1,9 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
import cohere
|
2 |
from utils.format import format_chat_history_cohere
|
3 |
|
4 |
|
5 |
def test_api_key(api_key: str):
|
6 |
-
|
7 |
try:
|
8 |
# try to just generate 3 tokens
|
9 |
co = cohere.Client(
|
@@ -15,7 +21,9 @@ def test_api_key(api_key: str):
|
|
15 |
return False
|
16 |
|
17 |
|
18 |
-
def
|
|
|
|
|
19 |
"""Get response from Cohere and stream response"""
|
20 |
co = cohere.Client(
|
21 |
api_key=api_key,
|
@@ -32,20 +40,6 @@ def gpt_stream_response_chat_history(chat_history, background_info, api_key):
|
|
32 |
yield event.text
|
33 |
|
34 |
|
35 |
-
def gpt_stream_response(prompt: str, api_key: str):
|
36 |
-
"""Get response from Cohere and stream response"""
|
37 |
-
|
38 |
-
co = cohere.Client(
|
39 |
-
api_key=api_key,
|
40 |
-
)
|
41 |
-
|
42 |
-
stream = co.chat_stream(message=prompt)
|
43 |
-
|
44 |
-
for event in stream:
|
45 |
-
if event.event_type == "text-generation":
|
46 |
-
yield event.text
|
47 |
-
|
48 |
-
|
49 |
def gpt_response(prompt: str, api_key: str) -> str:
|
50 |
"""Get response from Cohere, with option to get output in json format"""
|
51 |
|
|
|
1 |
+
"""
|
2 |
+
GPT Related Functions
|
3 |
+
"""
|
4 |
+
|
5 |
+
from typing import List, Dict, Generator
|
6 |
+
|
7 |
import cohere
|
8 |
from utils.format import format_chat_history_cohere
|
9 |
|
10 |
|
11 |
def test_api_key(api_key: str):
|
12 |
+
"""Function to test Cohere API is working"""
|
13 |
try:
|
14 |
# try to just generate 3 tokens
|
15 |
co = cohere.Client(
|
|
|
21 |
return False
|
22 |
|
23 |
|
24 |
+
def stream(
|
25 |
+
background_info: str, chat_history: List[Dict[str, str]] = [], api_key: str = ""
|
26 |
+
) -> Generator:
|
27 |
"""Get response from Cohere and stream response"""
|
28 |
co = cohere.Client(
|
29 |
api_key=api_key,
|
|
|
40 |
yield event.text
|
41 |
|
42 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
43 |
def gpt_response(prompt: str, api_key: str) -> str:
|
44 |
"""Get response from Cohere, with option to get output in json format"""
|
45 |
|
utils/process_doc.py
CHANGED
@@ -12,10 +12,11 @@ def parse_pdf(pdf_file) -> str:
|
|
12 |
"""Read PDF from Streamlit's file uploader"""
|
13 |
|
14 |
pdf_document = fitz.open("pdf", pdf_file)
|
|
|
15 |
|
16 |
all_text = []
|
17 |
|
18 |
-
for page_number in range(
|
19 |
|
20 |
page = pdf_document.load_page(page_number)
|
21 |
|
@@ -26,15 +27,12 @@ def parse_pdf(pdf_file) -> str:
|
|
26 |
return "\n\n".join(all_text)
|
27 |
|
28 |
|
29 |
-
def parse_docx(docx_file):
|
30 |
"""Read in docx file"""
|
31 |
docx_file = io.BytesIO(docx_file)
|
32 |
|
33 |
-
|
34 |
|
35 |
-
all_text = []
|
36 |
-
|
37 |
-
for paragraph in document.paragraphs:
|
38 |
-
all_text.append(paragraph.text)
|
39 |
|
40 |
return "\n".join(all_text)
|
|
|
12 |
"""Read PDF from Streamlit's file uploader"""
|
13 |
|
14 |
pdf_document = fitz.open("pdf", pdf_file)
|
15 |
+
n_pages = len(pdf_document)
|
16 |
|
17 |
all_text = []
|
18 |
|
19 |
+
for page_number in range(n_pages):
|
20 |
|
21 |
page = pdf_document.load_page(page_number)
|
22 |
|
|
|
27 |
return "\n\n".join(all_text)
|
28 |
|
29 |
|
30 |
+
def parse_docx(docx_file) -> str:
    """Read in a docx file (raw bytes) and return its paragraphs joined by newlines."""
    # Wrap the raw upload bytes so python-docx can treat them as a file object.
    byte_stream = io.BytesIO(docx_file)
    document = Document(byte_stream)

    paragraph_texts = []
    for paragraph in document.paragraphs:
        paragraph_texts.append(paragraph.text)

    return "\n".join(paragraph_texts)
|
utils/prompts.py
CHANGED
@@ -88,7 +88,6 @@ If you wish to leave a field blank in a given json, use "". You must never use n
|
|
88 |
Now respond with your professional, concise, answer.
|
89 |
"""
|
90 |
|
91 |
-
|
92 |
specific_skills_comparison_prompt = """
|
93 |
You are an expert at understanding how suitable a given CV is for a given job posting.
|
94 |
You will focus on evaluating the candidates experience quality
|
@@ -141,19 +140,3 @@ You must never use null as this will be loaded using json.loads! If there is not
|
|
141 |
|
142 |
Now respond with your professional, concise, answer.
|
143 |
"""
|
144 |
-
|
145 |
-
interviewer_prompt = """
|
146 |
-
**Goal**
|
147 |
-
You are an interviewer, and will carry out a natural interview
|
148 |
-
|
149 |
-
**Background Information**
|
150 |
-
The user has the following CV:
|
151 |
-
<cv>
|
152 |
-
|
153 |
-
The user is interested in the following job:
|
154 |
-
<job-posting>
|
155 |
-
|
156 |
-
You will act like an interviewer for that job, critiquing the user's CV and asking them questions. Follow the conversation naturally.
|
157 |
-
|
158 |
-
Ask either STAR reasoning, or technical questions, based on the job posting, or general job title.
|
159 |
-
"""
|
|
|
88 |
Now respond with your professional, concise, answer.
|
89 |
"""
|
90 |
|
|
|
91 |
specific_skills_comparison_prompt = """
|
92 |
You are an expert at understanding how suitable a given CV is for a given job posting.
|
93 |
You will focus on evaluating the candidates experience quality
|
|
|
140 |
|
141 |
Now respond with your professional, concise, answer.
|
142 |
"""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|