Petro
committed on
Commit
•
b932f3e
1
Parent(s):
66bb7d2
test
Browse files
main.py
CHANGED
@@ -2,12 +2,11 @@ from ctransformers import AutoModelForCausalLM
|
|
2 |
from fastapi import FastAPI
|
3 |
from pydantic import BaseModel
|
4 |
|
5 |
-
file_name = "
|
6 |
llm = AutoModelForCausalLM.from_pretrained(file_name,
|
7 |
model_type='mistral',
|
8 |
-
max_new_tokens=
|
9 |
-
|
10 |
-
threads=3,
|
11 |
)
|
12 |
|
13 |
#Pydantic object
|
|
|
2 |
from fastapi import FastAPI
|
3 |
from pydantic import BaseModel
|
4 |
|
5 |
+
file_name = "zephyr-7b-beta.Q4_K_S.gguf"
|
6 |
llm = AutoModelForCausalLM.from_pretrained(file_name,
|
7 |
model_type='mistral',
|
8 |
+
max_new_tokens=2096,
|
9 |
+
threads=8000,
|
|
|
10 |
)
|
11 |
|
12 |
#Pydantic object
|