Spaces:
Paused
Paused
Create mlc-chat-config.json
Browse files- mlc-chat-config.json +58 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "qwen2",
|
3 |
+
"quantization": "q4f16_1",
|
4 |
+
"version": "0.1.0",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008
|
8 |
+
},
|
9 |
+
"vocab_size": 32000,
|
10 |
+
"context_window_size": 4096,
|
11 |
+
"sliding_window_size": -1,
|
12 |
+
"prefill_chunk_size": 4096,
|
13 |
+
"tensor_parallel_shards": 1,
|
14 |
+
|
15 |
+
"architectures": ["Qwen2ForCausalLM"],
|
16 |
+
"attention_dropout": 0.0,
|
17 |
+
"bos_token_id": 151643,
|
18 |
+
"eos_token_id": 151643,
|
19 |
+
"hidden_act": "silu",
|
20 |
+
"hidden_size": 896,
|
21 |
+
"initializer_range": 0.02,
|
22 |
+
"intermediate_size": 4864,
|
23 |
+
"max_position_embeddings": 32768,
|
24 |
+
"max_window_layers": 24,
|
25 |
+
"model_type": "qwen2",
|
26 |
+
"num_attention_heads": 14,
|
27 |
+
"num_hidden_layers": 24,
|
28 |
+
"num_key_value_heads": 2,
|
29 |
+
"rms_norm_eps": 1e-6,
|
30 |
+
"rope_scaling": null,
|
31 |
+
"rope_theta": 1000000.0,
|
32 |
+
"sliding_window": 32768,
|
33 |
+
"tie_word_embeddings": true,
|
34 |
+
"torch_dtype": "bfloat16",
|
35 |
+
"transformers_version": "4.50.3",
|
36 |
+
"use_cache": true,
|
37 |
+
"use_sliding_window": false,
|
38 |
+
"vocab_size": 151936,
|
39 |
+
|
40 |
+
"pad_token_id": 0,
|
41 |
+
"bos_token_id": 1,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"tokenizer_files": [
|
44 |
+
"tokenizer.model",
|
45 |
+
"tokenizer.json",
|
46 |
+
"tokenizer_config.json"
|
47 |
+
],
|
48 |
+
|
49 |
+
"conv_template": {
|
50 |
+
"name": "qwen2",
|
51 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n ",
|
52 |
+
"system_message": "You respond with the JSON structure below by filling in the values as described in its entirety. Find the different billing and shipping address. No explanation, just the JSON string. And do it fast!\n{\n \"billingAddressCity\": \"Fill in the billing address city\",\n \"billingAddressCountryCode\": \"Fill in the billing address country\",\n \"billingAddressPostalCode\": \"Fill in the billing address postal code\",\n \"billingAddressStateCode\": \"Fill in the billing address state\",\n \"billingAddressStreetLine1\": \"Fill in the billing address street and number\",\n \"billingAddressStreetLine2\": \"Fill in the billing address apartment or unit number\",\n \"billingName\": \"Fill in the name associated to the billing address\",\n \"billingPhone\": \"Fill in the billing phone number\",\n \"emailAddress\": \"Fill in the email address\",\n \"ipAddress\": \"Fill in the IP address\",\n \"shippingAddressCity\": Fill in the shipping address city,\n \"shippingAddressCountryCode\": \"Fill in the shipping address country\",\n \"shippingAddressPostalCode\": \"Fill in the shippin address postal code\",\n \"shippingAddressStateCode\": Fill in the shipping address state\",\n \"shippingAddressStreetLine1\": \"Fill in the shipping address line 1\",\n \"shippingAddressStreetLine2\": \"Fill in the shipping address line 2\",\n \"shippingName\": \"Fill in the name assiciated to the shipping address\",\n \"transactionId\": \"Fill in the transaction id or order number\".\n}"
|
53 |
+
},
|
54 |
+
|
55 |
+
"temperature": 0.1,
|
56 |
+
"repetition_penalty": 1.0,
|
57 |
+
"top_p": 0.2
|
58 |
+
}
|