Neelectric committed on
Commit
5c58629
·
verified ·
1 Parent(s): 85249ae

First attempt at uploading a cross-coder manually

Browse files
Files changed (2) hide show
  1. 4.pt +3 -0
  2. 4_cfg.json +1 -0
4.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38714b63aafc3326753ab81ac3bcc066e635df0b00cffa3ef392f0ce26f32bc9
3
+ size 402732704
4_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 49, "batch_size": 4096, "buffer_mult": 128, "lr": 5e-05, "num_tokens": 191931392, "l1_coeff": 2, "beta1": 0.9, "beta2": 0.999, "d_in": 1536, "dict_size": 16384, "seq_len": 1024, "enc_dtype": "fp32", "model_name": "qwen2.5-math-1.5b", "site": "resid_pre", "device": "cuda", "model_batch_size": 4, "log_every": 20, "save_every": 10000, "dec_init_norm": 0.08, "hook_point": "blocks.14.hook_resid_pre", "wandb_project": "R1-crosscoder", "wandb_entity": "Neelectric", "run_name": "qwen2.5-math-1.5b_crosscoder"}