Upload app.py
Browse files
app.py
CHANGED
@@ -2,6 +2,8 @@ import torch
|
|
2 |
from transformers import AutoTokenizer
|
3 |
from model import SmolLM2, SmolLM2Config
|
4 |
import gradio as gr
|
|
|
|
|
5 |
|
6 |
# Initialize model and tokenizer
|
7 |
device = 'cuda' if torch.cuda.is_available() else 'cpu'
|
@@ -9,7 +11,8 @@ tokenizer = AutoTokenizer.from_pretrained("HuggingFaceTB/cosmo2-tokenizer")
|
|
9 |
model = SmolLM2(SmolLM2Config())
|
10 |
|
11 |
# Load trained weights
|
12 |
-
|
|
|
13 |
model.load_state_dict(checkpoint['model_state_dict'])
|
14 |
model.to(device)
|
15 |
model.eval()
|
|
|
2 |
from transformers import AutoTokenizer
|
3 |
from model import SmolLM2, SmolLM2Config
|
4 |
import gradio as gr
|
5 |
+
import zipfile
|
6 |
+
import io
|
7 |
|
8 |
# Initialize model and tokenizer
|
9 |
device = 'cuda' if torch.cuda.is_available() else 'cpu'
|
|
|
11 |
model = SmolLM2(SmolLM2Config())
|
12 |
|
13 |
# Load trained weights
|
14 |
+
|
15 |
+
checkpoint = torch.load('checkpoint_step_5000.pt', map_location=device) # Adjust path as needed
|
16 |
model.load_state_dict(checkpoint['model_state_dict'])
|
17 |
model.to(device)
|
18 |
model.eval()
|