File size: 379 Bytes
b3912d8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
# Serialized model-argument object. The YAML tag below names the Python class
# `aether.model.model.TransformerLensModelArguments`; the keys that follow are
# the attributes stored on that instance.
#
# Because of the `!!python/object:` tag, PyYAML's safe loader
# (`yaml.safe_load`) refuses this document; it has to be read with a loader
# that is allowed to construct arbitrary Python objects (e.g.
# `yaml.unsafe_load`). Only load this file from a trusted source.
!!python/object:aether.model.model.TransformerLensModelArguments
# Backend selector and a label for the model. How these strings are
# interpreted is decided by the consuming class, which is not visible here.
implementation: transformer_lens
model_name: default
n_layers: 2
# presumably the RNG seed used for weight initialisation -- TODO confirm
model_seed: 0
# NOTE(review): d_head * n_heads = 32 * 8 = 256, which does not equal
# d_model = 16, and d_model is not a multiple of d_head. If these fields are
# forwarded to a TransformerLens config, confirm this shape is intentional.
d_model: 16
n_ctx: 1024
d_head: 32
n_heads: 8
# NOTE(review): `attn_only: true` is set further down; presumably that means
# no MLP blocks are built and this activation is unused -- confirm.
act_fn: gelu
# presumably matches the vocabulary size of the "5k" tokenizer named below --
# TODO confirm against the tokenizer itself.
d_vocab: 5000
# Local attention is switched off, and the two settings that look related to
# it (`window_size`, `attn_types`) are left null.
use_local_attn: false
# looks like a Hugging Face Hub repository id -- verify against the loader
tokenizer_name: georgeyw/TinyStories-tokenizer-5k
window_size: null
attn_types: null
attn_only: true
positional_embedding_type: shortformer