File size: 658 Bytes
e62cb42
 
 
 
 
 
1695fdf
 
 
e62cb42
 
 
 
 
 
 
 
 
 
 
1695fdf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
from fastapi import FastAPI, HTTPException
from fastapi.concurrency import run_in_threadpool
from pydantic import BaseModel
from transformers import AutoModelForCausalLM, AutoTokenizer

# Identifier handed to ``from_pretrained`` for both the model and its tokenizer,
# kept in one place so the two loads cannot drift apart.
_MODEL_ID = "Hadeel11/fine-tuned-model"

# Application object on which the routes below are registered.
app = FastAPI()

# The model and tokenizer are loaded once, at import time, and shared by every
# request handled by this module.
model = AutoModelForCausalLM.from_pretrained(_MODEL_ID)
tokenizer = AutoTokenizer.from_pretrained(_MODEL_ID)

class Query(BaseModel):
    """Request body accepted by the ``/predict/`` endpoint."""

    # Text that the endpoint tokenizes and passes to the model.
    question: str
    # List sent alongside the question; the element type is not constrained.
    # NOTE(review): the handler visible in this file never reads this field --
    # confirm whether the contexts are meant to be part of the prompt.
    contexts: list

def _generate_answer(question: str) -> str:
    """Tokenize *question*, run generation, and decode the first sequence.

    This is synchronous, compute-bound work, so it is meant to be executed on
    a worker thread rather than directly on the event loop.

    Args:
        question: Prompt text to feed to the model.

    Returns:
        The first generated sequence decoded with special tokens removed.
    """
    inputs = tokenizer(question, return_tensors="pt")
    outputs = model.generate(**inputs)
    # NOTE(review): with a causal LM the generated sequence usually starts
    # with the prompt tokens, so the decoded text likely echoes the question
    # -- confirm whether callers rely on that before stripping it.
    return tokenizer.decode(outputs[0], skip_special_tokens=True)


@app.post("/predict/")
async def predict(query: Query):
    """Generate an answer for the submitted question.

    Args:
        query: Parsed request body; only ``query.question`` is used.

    Returns:
        A dict of the form ``{"answer": <decoded text>}``.

    Raises:
        HTTPException: 400 when the question is empty or whitespace-only.
    """
    # Reject blank prompts up front instead of sending them to the model.
    if not query.question.strip():
        raise HTTPException(status_code=400, detail="question must not be empty")

    # Inference blocks for its whole duration; running it in the thread pool
    # keeps the event loop free to serve other requests in the meantime.
    answer = await run_in_threadpool(_generate_answer, query.question)
    return {"answer": answer}