Piotr Zalewski committed on
Commit
533c223
1 Parent(s): 86cac43

#2 retrying 32k context

Browse files
Files changed (1) hide show
  1. config.json +3 -3
config.json CHANGED
@@ -18,7 +18,7 @@
18
  "hidden_size": 2304,
19
  "initializer_range": 0.02,
20
  "intermediate_size": 9216,
21
- "max_position_embeddings": 8192,
22
  "model_type": "gemma2",
23
  "num_attention_heads": 8,
24
  "num_hidden_layers": 26,
@@ -26,8 +26,8 @@
26
  "pad_token_id": 0,
27
  "query_pre_attn_scalar": 256,
28
  "rms_norm_eps": 1e-06,
29
- "rope_theta": 10000.0,
30
- "sliding_window": 4096,
31
  "torch_dtype": "bfloat16",
32
  "transformers_version": "4.42.4",
33
  "use_cache": true,
 
18
  "hidden_size": 2304,
19
  "initializer_range": 0.02,
20
  "intermediate_size": 9216,
21
+ "max_position_embeddings": 32768,
22
  "model_type": "gemma2",
23
  "num_attention_heads": 8,
24
  "num_hidden_layers": 26,
 
26
  "pad_token_id": 0,
27
  "query_pre_attn_scalar": 256,
28
  "rms_norm_eps": 1e-06,
29
+ "rope_theta": 160000.0,
30
+ "sliding_window": 32768,
31
  "torch_dtype": "bfloat16",
32
  "transformers_version": "4.42.4",
33
  "use_cache": true,