{ "attention_qkv_bias": true, "attention_qkv_bias_fast": false, "codebook_size": 1024, "dim": 1024, "dropout": 0.1, "head_dim": 64, "initializer_range": 0.02, "intermediate_size": 2816, "intermediate_size_fast": 4096, "max_seq_len": 4096, "n_fast_layer": 4, "n_head": 16, "n_layer": 24, "n_local_heads": 16, "n_local_heads_fast": 2, "norm_eps": 1e-06, "num_codebooks": 8, "rope_base": 1000000.0, "tie_word_embeddings": false, "vocab_size": 151936 }