Petro committed on
Commit
b932f3e
1 Parent(s): 66bb7d2
Files changed (1) hide show
  1. main.py +3 -4
main.py CHANGED
@@ -2,12 +2,11 @@ from ctransformers import AutoModelForCausalLM
2
  from fastapi import FastAPI
3
  from pydantic import BaseModel
4
 
5
- file_name = "gemma-2b.Q2_K.gguf"
6
  llm = AutoModelForCausalLM.from_pretrained(file_name,
7
  model_type='mistral',
8
- max_new_tokens=2_096,
9
- context_length=8_000,
10
- threads=3,
11
  )
12
 
13
  #Pydantic object
 
2
  from fastapi import FastAPI
3
  from pydantic import BaseModel
4
 
5
+ file_name = "zephyr-7b-beta.Q4_K_S.gguf"
6
  llm = AutoModelForCausalLM.from_pretrained(file_name,
7
  model_type='mistral',
8
+ max_new_tokens=2096,
9
+ threads=8000,
 
10
  )
11
 
12
  #Pydantic object