Petro committed on
Commit
7fa9dc9
1 Parent(s): b0a8dfd

First model version

Browse files
Files changed (1) hide show
  1. main.py +3 -3
main.py CHANGED
@@ -6,13 +6,13 @@ from pydantic import BaseModel
6
 
7
  file_name = "zephyr-7b-beta.Q4_K_S.gguf"
8
  config = {
9
- "max_new_token": 1024,
10
  "repetition_penalty": 1.1,
11
  "temperature": 0.5,
12
  "top_k": 50,
13
  "top_p": 0.9,
14
- "stream": True,
15
- "threads": int(os.cpu_count() / 2),
16
  }
17
  llm = CTransformers(
18
  model=file_name,
 
6
 
7
  file_name = "zephyr-7b-beta.Q4_K_S.gguf"
8
  config = {
9
+ "max_new_token": 10,
10
  "repetition_penalty": 1.1,
11
  "temperature": 0.5,
12
  "top_k": 50,
13
  "top_p": 0.9,
14
+ "stream": False,
15
+ "threads": 3,
16
  }
17
  llm = CTransformers(
18
  model=file_name,