File size: 379 Bytes
b3912d8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 |
# Serialized model-argument object for a small transformer configuration.
# The `!!python/object:` tag below names the Python class
# `aether.model.model.TransformerLensModelArguments`; a YAML loader must be
# allowed to construct Python objects (and that class must be importable) to
# read this file. A "safe" loader will reject the tag.
# NOTE(review): python/object tags instantiate arbitrary classes on load —
# only load files like this from trusted sources.
!!python/object:aether.model.model.TransformerLensModelArguments
implementation: transformer_lens
model_name: default
n_layers: 2
model_seed: 0
# NOTE(review): n_heads * d_head = 8 * 32 = 256, which is not equal to
# d_model = 16 — confirm this mismatch is intentional.
d_model: 16
n_ctx: 1024
d_head: 32
n_heads: 8
# NOTE(review): attn_only is true further down; presumably act_fn is unused in
# that case — verify against the consuming code.
act_fn: gelu
# d_vocab of 5000 appears to correspond to the "5k" tokenizer named in
# tokenizer_name — TODO confirm the tokenizer's actual vocabulary size.
d_vocab: 5000
# Local attention is disabled; window_size and attn_types are left null,
# presumably because they only apply when use_local_attn is true — confirm.
use_local_attn: false
tokenizer_name: georgeyw/TinyStories-tokenizer-5k
window_size: null
attn_types: null
attn_only: true
positional_embedding_type: shortformer
|