{
"version": "0.1.0",
"model_type": "mistral",
"quantization": "q4f16_1",
"model_config": {
"hidden_size": 4096,
"intermediate_size": 14336,
"num_attention_heads": 32,
"num_hidden_layers": 32,
"rms_norm_eps": 1e-05,
"vocab_size": 32768,
"position_embedding_base": 1000000.0,
"num_key_value_heads": 8,
"head_dim": 128,
"context_window_size": 32768,
"sliding_window_size": 2048,
"prefill_chunk_size": 128,
"attention_sink_size": 4,
"tensor_parallel_shards": 1,
"max_batch_size": 128
},
"vocab_size": 32768,
"context_window_size": 32768,
"sliding_window_size": 2048,
"prefill_chunk_size": 128,
"attention_sink_size": 4,
"tensor_parallel_shards": 1,
"pipeline_parallel_stages": 1,
"temperature": 1.0,
"presence_penalty": 0.0,
"frequency_penalty": 0.0,
"repetition_penalty": 1.0,
"top_p": 1.0,
"tokenizer_files": [
"tokenizer.model",
"tokenizer.json",
"tokenizer_config.json"
],
"tokenizer_info": {
"token_postproc_method": "byte_fallback",
"prepend_space_in_encode": false,
"strip_space_in_decode": true
},
"conv_template": {
"name": "mistral_default",
"system_template": "[INST] {system_message}",
"system_message": "The following is a conversation with an AI assistant. She is smart and very honest. She wants to help the human understand whatever it is they want to understand using her insights and wisdom.",
"system_prefix_token_ids": [
1
],
"add_role_after_system_message": false,
"roles": {
"user": "[INST]",
"assistant": "[/INST]",
"tool": "[INST]"
},
"role_templates": {
"user": "{user_message}",
"assistant": "{assistant_message}",
"tool": "{tool_message}"
},
"messages": [],
"seps": [
" "
],
"role_content_sep": " ",
"role_empty_sep": "",
"stop_str": [
"</s>"
],
"stop_token_ids": [
2
],
"function_string": "",
"use_function_calling": false
},
"pad_token_id": 0,
"bos_token_id": 1,
"eos_token_id": 2
}