File size: 709 Bytes
1462422
344585f
 
1462422
 
 
344585f
 
 
 
 
 
 
1462422
 
344585f
 
 
 
 
 
 
 
 
1462422
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
from fastapi import FastAPI
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# Identifier handed to `from_pretrained` when the tokenizer and model are loaded.
MODEL_NAME = "arnir0/Tiny-LLM"

# Application object; route handlers attach to it through its decorators.
app = FastAPI()

# Module-level slots for the loaded model and tokenizer. Both start out empty
# (None) and are filled in by the route handler the first time it runs.
model = None
tokenizer = None

@app.get("/")
def greet_json():
    """Handle GET "/" and make sure the model and tokenizer are loaded.

    If either module-level global (`model` or `tokenizer`) is still None,
    both are (re)loaded from `MODEL_NAME` and the model is switched to
    evaluation mode. Later calls reuse the cached objects.

    Returns:
        A dict with a fixed greeting and a fixed model-status message.
    """
    global tokenizer, model

    # Both objects must be present to skip loading; a missing one of the
    # pair triggers a fresh load of both.
    ready = model is not None and tokenizer is not None
    if not ready:
        tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
        model = AutoModelForCausalLM.from_pretrained(MODEL_NAME)
        # Put the model in evaluation mode since it is only kept for inference.
        model.eval()

    payload = {
        "Hello": "World!",
        "model_status": "Loaded and hibernated!",
    }
    return payload