cortexso
/

gemma

jan-hq committed on Jun 25, 2024

Commit

f503cbc

verified ·

1 Parent(s): 9cae646

Create model.yml

Files changed (1) hide show

model.yml ADDED Viewed

+name: gemma
+model: gemma:7B
+version: 1
+files:
+  - llama_model_path: model.gguf
+# Results Preferences
+top_p: 0.95
+temperature: 0.7
+frequency_penalty: 0
+presence_penalty: 0
+max_tokens: 4096 # Infer from base config.json -> max_position_embeddings
+stream: true # true | false
+# Engine / Model Settings
+ngl: 33 # NOTE(review): presumably the GPU-offloaded layer count, i.e. from base config.json -> num_hidden_layers, not num_attention_heads; confirm
+ctx_len: 4096 # Infer from base config.json -> max_position_embeddings; NOTE(review): equals max_tokens, confirm the prompt still fits
+engine: cortex.llamacpp
+prompt_template: "<start_of_turn>user\n{prompt}<end_of_turn>\n<start_of_turn>model" # NOTE(review): no trailing "\n" after "model"; confirm the engine adds it