huypn16
/

sae-qwen-2.5-1.5B-OMS-16x

Model card Files and versions Community

huypn16 committed on Oct 15, 2024

Commit

8055dd0

·

verified ·

1 Parent(s): 06cadf5

Update layers.8/cfg.json

Files changed (1) hide show

layers.8/cfg.json +26 -26

layers.8/cfg.json CHANGED Viewed

@@ -1,28 +1,28 @@
 {
-  'normalize_decoder': True,
-  'num_latents': 0,
-  'k': 64,
-  'multi_topk': False,
-  'layer': 8,
-  'device': 'cuda',
-  'activation_fn_str': 'relu',
-  'd_sae': 24576,
-  'd_in': 1536,
-  'architecture': 'topk',
-  'apply_b_dec_to_input': False,
-  'finetuning_scaling_factor': False,
-  'context_size': 1024,
-  'model_name': 'Qwen/Qwen2.5-1.5B-Instruct',
-  'hook_name': 'blocks.8.hook_sae_acts_topk',
-  'hook_layer': 8,
-  'hook_head_index': None,
-  'prepend_bos': True,
-  'dataset_path': '',
-  'dataset_trust_remote_code': False,
-  'normalize_activations': 'none',
-  'dtype': 'float32',
-  'sae_lens_training_version': 'eleuther',
-  'activation_fn_kwargs': {},
-  'neuronpedia_id': None,
-  'model_from_pretrained_kwargs': {}
 }

 {
+  "normalize_decoder": true,
+  "num_latents": 0,
+  "k": 64,
+  "multi_topk": false,
+  "layer": 8,
+  "device": "cuda",
+  "activation_fn_str": "relu",
+  "d_sae": 24576,
+  "d_in": 1536,
+  "architecture": "topk",
+  "apply_b_dec_to_input": false,
+  "finetuning_scaling_factor": false,
+  "context_size": 1024,
+  "model_name": "Qwen/Qwen2.5-1.5B-Instruct",
+  "hook_name": "blocks.8.hook_sae_acts_topk",
+  "hook_layer": 8,
+  "hook_head_index": null,
+  "prepend_bos": true,
+  "dataset_path": "",
+  "dataset_trust_remote_code": false,
+  "normalize_activations": "none",
+  "dtype": "float32",
+  "sae_lens_training_version": "eleuther",
+  "activation_fn_kwargs": {},
+  "neuronpedia_id": null,
+  "model_from_pretrained_kwargs": {}
 }