AndreasThinks committed on
Commit
1180e45
·
verified ·
1 Parent(s): 0fb26a5

Changed to q4 model to make it quicker.

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -11,8 +11,8 @@ logger = logging.getLogger(__name__)
11
  logger.info("Loading the model...")
12
  llm = Llama.from_pretrained(
13
  repo_id="AndreasThinks/mistral-7b-english-welsh-translate-GGUF",
14
- filename="*q8_0.gguf",
15
- verbose=False
16
  )
17
  logger.info("Model loaded successfully")
18
 
 
11
  logger.info("Loading the model...")
12
  llm = Llama.from_pretrained(
13
  repo_id="AndreasThinks/mistral-7b-english-welsh-translate-GGUF",
14
+ filename="*q4_k_m.gguf",
15
+ verbose=True
16
  )
17
  logger.info("Model loaded successfully")
18