rajsinghparihar
default groq api key set in repo secrets
28f535f
raw
history blame
5.01 kB
import gradio as gr
from rag import RAG, ServiceContextModule
from llama_index.core import set_global_service_context
import json
from prompts import general_prompt
from gradio_pdf import PDF
import requests
import os
service_context_module = None
current_model = None
def initialize(api_key, model_name):
global service_context_module, current_model
gr.Info("Initializing app")
url = "https://api.groq.com/openai/v1/models"
headers = {
"Authorization": f"Bearer {api_key}",
"Content-Type": "application/json",
}
try:
response = requests.get(url, headers=headers)
data = response.json()
models = [model["id"] for model in data["data"]]
except Exception:
gr.Error("Invalid API KEY")
return gr.update(choices=[])
if not service_context_module or current_model != model_name:
service_context_module = ServiceContextModule(api_key, model_name)
current_model = model_name
gr.Info("App started")
set_global_service_context(
service_context=service_context_module.service_context
)
else:
gr.Info("App is already running")
return gr.update(choices=models)
def process_document(file, query):
if file.endswith(".pdf"):
return process_pdf(file, query=query)
else:
return "Unsupported file format"
def postprocess_json_string(json_string: str) -> dict:
json_string = json_string.replace("'", '"')
json_string = json_string[json_string.rfind("{") : json_string.rfind("}") + 1]
try:
json_data = json.loads(json_string)
except Exception as e:
print("Error parsing output, invalid json format", e)
return json_data
def process_pdf(file, query):
rag_module = RAG(filepaths=[file])
fields = [field for field in query.split(",")]
formatted_prompt = general_prompt(fields=fields)
response = rag_module.run_query_engine(prompt=formatted_prompt)
extracted_json = postprocess_json_string(json_string=response)
return extracted_json
with gr.Blocks(title="Document Information Extractor.") as app:
gr.Markdown(
value="""
# Welcome to Document Information Extractor.
Created by [@rajsinghparihar](https://huggingface.co/rajsinghparihar) for extracting useful information from pdf documents like invoices, salary slips, etc.
## Usage:
- In the Init Section, Enter your `GROQ_API_KEY` in the corresponding labeled textbox.
- choose the model from the list of available models.
- click `Initialize` to start the app.
- In the app section, you can upload a document (pdf files: currently works for readable pdfs only, will add ocr functionality later)
- Enter the entities you wanna extract as a comma seperated string. (check the examples for more info)
- Click Submit to see the extracted entities as a JSON object.
"""
)
with gr.Tab(label="Init Section") as init_tab:
with gr.Row():
api_key = gr.Text(
label="Enter your Groq API KEY",
type="password",
)
if api_key == "" or not api_key:
api_key = os.getenv("GROQ_API_KEY")
available_models = gr.Dropdown(
value="llama3-70b-8192",
label="Choose your LLM",
choices=[
"gemma-7b-it",
"llama3-70b-8192",
"llama3-8b-8192",
"mixtral-8x7b-32768",
"whisper-large-v3",
],
)
init_btn = gr.Button(value="Initialize")
init_btn.click(
fn=initialize,
inputs=[api_key, available_models],
outputs=available_models,
)
with gr.Tab(label="App Section") as app_tab:
iface = gr.Interface(
fn=process_document,
inputs=[
PDF(label="Document"),
gr.Text(
label="Entities you wanna extract in comma separated string format"
),
],
outputs=gr.JSON(label="Extracted Entities"),
description="Upload a PDF document and extract specified entities from it.",
examples=[
[
"examples/Commerce Bank Statement Sample.pdf",
"Customer Name, Account Number, Statement Date, Ending Balance, Total Deposits, Checks Paid",
],
[
"examples/Salary-Slip-pdf.pdf",
"Employee Name, Bank Name, Location, Total Salary, Total Deductions",
],
],
)
gr.Markdown("""
## Pros of LLMs as information extractors over current extraction solutions:
- LLMs are able to understand the scope of the problem from the context and are more robust to typos or extraction failure
## Cons
- Higher Inference Cost
- Can't use free APIs for Sensitive documents.
""")
app.launch(server_name="0.0.0.0", server_port=7860)