Update layers.14/cfg.json
layers.14/cfg.json    +24 -1
CHANGED
@@ -1 +1,24 @@
-{
+{
+    "model_name": "Qwen/Qwen2.5-1.5B-Instruct",
+    "architecture": "topk",
+    "hook_name": "blocks.14.hook_resid_post",
+    "hook_layer": 14,
+    "layer": 14,
+    "k": 64,
+    "activation_fn_str": "relu",
+    "d_sae": 24576,
+    "d_in": 1536,
+    "multi_topk": false,
+    "device": "cuda",
+    "apply_b_dec_to_input": false,
+    "finetuning_scaling_factor": false,
+    "context_size": 1024,
+    "hook_head_index": null,
+    "prepend_bos": true,
+    "normalize_activations": "none",
+    "dtype": "float32",
+    "sae_lens_training_version": "eleuther",
+    "neuronpedia_id": null,
+    "activation_fn_kwargs": {},
+    "model_from_pretrained_kwargs": {}
+}
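
For reference, a minimal sketch (not part of the commit) of reading this cfg.json with plain Python and printing the quantities it implies: a TopK SAE on the layer-14 residual stream hook of Qwen2.5-1.5B-Instruct, with a 16x expansion factor (24576 / 1536) and k=64 active latents per token. The relative path is an assumption; adjust it to wherever the repo is checked out.

```python
import json

# Assumed path: run from the repository root where layers.14/cfg.json lives.
with open("layers.14/cfg.json") as f:
    cfg = json.load(f)

# Quantities derived directly from the config values above.
expansion_factor = cfg["d_sae"] // cfg["d_in"]   # 24576 // 1536 = 16
active_fraction = cfg["k"] / cfg["d_sae"]        # 64 / 24576 ~= 0.26% of latents per token

print(f"TopK SAE on {cfg['hook_name']} of {cfg['model_name']}")
print(f"expansion factor: {expansion_factor}x, k={cfg['k']} "
      f"({active_fraction:.2%} of {cfg['d_sae']} latents active per token)")
```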