Spaces:

NowLoadY
/

ocr-gpt

Runtime error

NowLoadY commited on Apr 5, 2023

Commit

1532c55

1 Parent(s): d804d15

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,24 +1,35 @@
 import easyocr
 import gradio as gr
-from transformers import pipeline
-# Initialize OCR reader and GPT pipeline
 reader = easyocr.Reader(['ch_sim', 'en'])
-gpt = pipeline('text-generation', model='gpt2')
 # Define the OCR function
-def ocr_gpt(image):
     ocr_result = reader.readtext(image)
-    corrected_text = gpt(ocr_result[0][1])[0]['generated_text']
-    gpt_opinion = gpt("What do you think about the information in the image?")[0]['generated_text']
     return corrected_text, gpt_opinion
 # Define Gradio UI components
 image_input = gr.inputs.Image()
-gpt_input = gr.inputs.Textbox(lines=1, label="GPT API Input")
 ocr_output = gr.outputs.Textbox(label="OCR Result (GPT Corrected)")
 gpt_opinion_output = gr.outputs.Textbox(label="GPT Opinion on Image Information")
 # Create Gradio interface
-iface = gr.Interface(fn=ocr_gpt, inputs=[gpt_input, image_input], outputs=[ocr_output, gpt_opinion_output])
 #iface.launch(share=True)

 import easyocr
 import gradio as gr
+import openai
+import requests
+# Set OpenAI API key
+openai.api_key = "your_api_key_here"
+# Initialize OCR reader
 reader = easyocr.Reader(['ch_sim', 'en'])
 # Define the OCR function
+# Update the ocr_gpt function to accept the API key as an input
+def ocr_gpt(image, gpt_opinion_prompt, api_key):
+    openai.api_key = api_key
     ocr_result = reader.readtext(image)
+    prompt = "Correct the following OCR result: " + ocr_result[0][1]
+    response = openai.Completion.create(engine="davinci-codex", prompt=prompt, max_tokens=50, n=1, stop=None, temperature=0.5)
+    corrected_text = response.choices[0].text.strip()
+    gpt_opinion_response = openai.Completion.create(engine="davinci-codex", prompt=gpt_opinion_prompt, max_tokens=50, n=1, stop=None, temperature=0.5)
+    gpt_opinion = gpt_opinion_response.choices[0].text.strip()
     return corrected_text, gpt_opinion
 # Define Gradio UI components
 image_input = gr.inputs.Image()
+gpt_input = gr.inputs.Textbox(lines=1, label="GPT Opinion Prompt")
+api_key_input = gr.inputs.Textbox(lines=1, label="API Key")
 ocr_output = gr.outputs.Textbox(label="OCR Result (GPT Corrected)")
 gpt_opinion_output = gr.outputs.Textbox(label="GPT Opinion on Image Information")
 # Create Gradio interface
+iface = gr.Interface(fn=ocr_gpt, inputs=[image_input, gpt_input, api_key_input], outputs=[ocr_output, gpt_opinion_output])
 #iface.launch(share=True)