Spaces:

cogcorp
/

assignment1

Sleeping

App Files Files Community

cogcorp committed on May 23, 2023

Commit

ba952d1

1 Parent(s): 75ce576

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -22

app.py CHANGED Viewed

@@ -8,16 +8,16 @@ import gradio as gr
 import os
 from sklearn.neighbors import NearestNeighbors
 def download_pdf(url, output_path):
     """Download the document at *url* and save it to *output_path*.

     Only ``http`` and ``https`` URLs are accepted. ``urlretrieve`` also
     understands other schemes such as ``file://``, which would let a
     caller-supplied URL copy arbitrary local files.

     Args:
         url: Address of the file to fetch.
         output_path: Filesystem path the downloaded bytes are written to.

     Raises:
         ValueError: If *url* does not use the http or https scheme.
     """
     # Imported locally so this function needs no top-of-file import change.
     from urllib.parse import urlparse

     scheme = urlparse(url).scheme
     if scheme not in ('http', 'https'):
         raise ValueError(
             f'Unsupported URL scheme {scheme!r}; expected http or https.'
         )
     urllib.request.urlretrieve(url, output_path)
 def preprocess(text):
     """Collapse every run of whitespace in *text* into a single space.

     Newlines, tabs and repeated spaces are all replaced by one ' '.
     Leading or trailing whitespace is reduced to a single space rather
     than stripped.

     Args:
         text: The string to normalise.

     Returns:
         The normalised string.
     """
     # Raw string: '\s' in a plain literal is an invalid escape sequence.
     # \s already matches '\n', so no separate newline replacement is needed.
     return re.sub(r'\s+', ' ', text)
 def pdf_to_text(path, start_page=1, end_page=None):
     doc = fitz.open(path)
     total_pages = doc.page_count
@@ -35,10 +35,8 @@ def pdf_to_text(path, start_page=1, end_page=None):
     doc.close()
     return text_list
 def text_to_chunks(texts, word_length=150, start_page=1):
     text_toks = [t.split(' ') for t in texts]
-    page_nums = []
     chunks = []
     for idx, words in enumerate(text_toks):
@@ -93,23 +91,21 @@ def load_recommender(path, start_page=1):
     chunks = text_to_chunks(texts, start_page=start_page)
     recommender.fit(chunks)
     return 'Corpus Loaded.'
-def generate_text(openAI_key, prompt, engine="davinci"):
-    openai.api_key = openAI_key
     completions = openai.Completion.create(
         engine=engine,
         prompt=prompt,
         max_tokens=512,
-        n=1,
-        stop=None,
-        temperature=0.7,
     )
     message = completions.choices[0].text
     return message
-def generate_answer(question, openAI_key):
     topn_chunks = recommender(question)
     prompt = ""
     prompt += 'search results:\n\n'
@@ -126,13 +122,10 @@ def generate_answer(question, openAI_key):
               "answer should be short and concise. Answer step-by-step. \n\nQuery: {question}\nAnswer: "
     prompt += f"Query: {question}\nAnswer:"
-    answer = generate_text(openAI_key, prompt, "davinci")
     return answer
-def question_answer(url, file, question, openAI_key):
-    if openAI_key.strip() == '':
-        return '[ERROR]: Please enter your Open AI Key. Get your key here: https://platform.openai.com/account/api-keys'
     if url.strip() == '' and file is None:
         return '[ERROR]: Both URL and PDF are empty. Provide at least one.'
@@ -153,14 +146,22 @@ def question_answer(url, file, question, openAI_key):
     if question.strip() == '':
         return '[ERROR]: Question field is empty'
-    return generate_answer(question, openAI_key)
 title = 'PDF GPT'
 description = """ PDF GPT allows you to chat with your PDF file using Universal Sentence Encoder and Open AI. It gives hallucination free response than other tools as the embeddings are better than OpenAI. The returned response can even cite the page number in square brackets([]) where the information is located, adding credibility to the responses and helping to locate pertinent information quickly."""
-iface = gr.Interface(fn=question_answer, inputs=[gr.inputs.Textbox(label="Enter PDF URL here"), file, question, openAI_key], outputs=[answer], title=title, description=description)
 iface.launch()

 import os
 from sklearn.neighbors import NearestNeighbors
+ openai.api_key = openAI
 def download_pdf(url, output_path):
     """Download the document at *url* and save it to *output_path*.

     Only ``http`` and ``https`` URLs are accepted. ``urlretrieve`` also
     understands other schemes such as ``file://``, which would let a
     caller-supplied URL copy arbitrary local files.

     Args:
         url: Address of the file to fetch.
         output_path: Filesystem path the downloaded bytes are written to.

     Raises:
         ValueError: If *url* does not use the http or https scheme.
     """
     # Imported locally so this function needs no top-of-file import change.
     from urllib.parse import urlparse

     scheme = urlparse(url).scheme
     if scheme not in ('http', 'https'):
         raise ValueError(
             f'Unsupported URL scheme {scheme!r}; expected http or https.'
         )
     urllib.request.urlretrieve(url, output_path)
 def preprocess(text):
     """Collapse every run of whitespace in *text* into a single space.

     Newlines, tabs and repeated spaces are all replaced by one ' '.
     Leading or trailing whitespace is reduced to a single space rather
     than stripped.

     Args:
         text: The string to normalise.

     Returns:
         The normalised string.
     """
     # Raw string: '\s' in a plain literal is an invalid escape sequence.
     # \s already matches '\n', so no separate newline replacement is needed.
     return re.sub(r'\s+', ' ', text)
 def pdf_to_text(path, start_page=1, end_page=None):
     doc = fitz.open(path)
     total_pages = doc.page_count
     doc.close()
     return text_list
 def text_to_chunks(texts, word_length=150, start_page=1):
     text_toks = [t.split(' ') for t in texts]
     chunks = []
     for idx, words in enumerate(text_toks):
     chunks = text_to_chunks(texts, start_page=start_page)
     recommender.fit(chunks)
     return 'Corpus Loaded.'
+def generate_text(prompt, engine="davinci"):
+    openai.api_key = openAI
     completions = openai.Completion.create(
         engine=engine,
         prompt=prompt,
         max_tokens=512,
+    n=1,
+    stop=None,
+    temperature=0.7,
     )
     message = completions.choices[0].text
     return message
+def generate_answer(question):
     topn_chunks = recommender(question)
     prompt = ""
     prompt += 'search results:\n\n'
               "answer should be short and concise. Answer step-by-step. \n\nQuery: {question}\nAnswer: "
     prompt += f"Query: {question}\nAnswer:"
+    answer = generate_text(prompt, "davinci")
     return answer
+def question_answer(url, file, question):
     if url.strip() == '' and file is None:
         return '[ERROR]: Both URL and PDF are empty. Provide at least one.'
     if question.strip() == '':
         return '[ERROR]: Question field is empty'
+    return generate_answer(question)
 title = 'PDF GPT'
 description = """ PDF GPT allows you to chat with your PDF file using Universal Sentence Encoder and Open AI. It gives hallucination free response than other tools as the embeddings are better than OpenAI. The returned response can even cite the page number in square brackets([]) where the information is located, adding credibility to the responses and helping to locate pertinent information quickly."""
+iface = gr.Interface(
+    fn=question_answer,
+    inputs=[
+        gr.inputs.Textbox(label="Enter PDF URL here"),
+        gr.inputs.File(label="Upload PDF file"),
+        gr.inputs.Textbox(label="Enter your question here"),
+    ],
+    outputs=gr.outputs.Textbox(label="Generated Answer"),
+    title=title,
+    description=description
+)
 iface.launch()