diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/ae.pt deleted file mode 100644 index 35e5bce4b4f88b19e5c7932711b4c1c8bf0328ce..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:128cb0fe4243dbb2ec45b6e104d765dae7fba4e6ed08cdb5e9136bac1d1d8c22 -size 1208232760 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/config.json deleted file mode 100644 index 4a6a6be2ae0c0faaaa900691d2543751431c2479..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.025, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "0" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_195/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_195/ae.pt deleted file mode 100644 index 896b25cc095736479e8e375aa43bb8f1d9485add..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e2719944aa66b4b8a560631fcad5c75b33841c9d7f912952964f5d9cb99b5fec -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_195/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_195/config.json deleted file mode 100644 index 2c45cc2dc008951a9bc97a9ef03408732449b171..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_195/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.025, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "195" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_1953/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_1953/ae.pt deleted file mode 100644 index 66e9b1ad3bd7fa22cf97142f8932f545a8636b14..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3fc8256b3a3256b6e5418b9d91b5734339cefeaae85e42c82d4b52008a38b27f -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_1953/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_1953/config.json deleted file mode 100644 index c7f2cb053cd762a6531082f29bef43ccacf0b009..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_1953/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.025, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "1953" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_19531/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_19531/ae.pt deleted file mode 100644 index b284ba561188960e13d2f2e35dc847a1582f2982..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:03dee9a5170fbb2615fb26cd612921da7f0418ceb4ba8bdbac70a2ae5d0e9860 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_19531/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_19531/config.json deleted file mode 100644 index 4d2e3cfe0b533b8602cd19746ae08b83911445c5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_19531/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.025, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "19531" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_617/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_617/ae.pt deleted file mode 100644 index 992467c2be358ef51dfb8d14e62ba30b70199ee9..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:43df85ceb189027f81fe27c41aa57fb75d22bc81dbafd20e64147daf97035cdf -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_617/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_617/config.json deleted file mode 100644 index c8ee9e65d660237a68ee9cb615dcb34403e76505..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_617/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.025, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "617" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_6176/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_6176/ae.pt deleted file mode 100644 index 122baf1b48bc71144ab29614c29e0bd080ac1fca..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5c732f580ab880879cdde780baee7d26987f9867b7d7f23bca02e8907769fa58 -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_6176/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_6176/config.json deleted file mode 100644 index 7fc41580e2b0cb4fedab3da66cd797f2b4d66e43..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_6176/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.025, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "6176" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_61763/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_61763/ae.pt deleted file mode 100644 index 04c9df0e54ec1f4242477be49e8c014029417571..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b4ae0849c49f1767bb915700aae9995dc9bcff76ff3c63dd820df7ef966c28a6 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_61763/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_61763/config.json deleted file mode 100644 index de70d0507c3b38b4e87f408edd652de1f56268a5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_61763/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.025, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "61763" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/ae.pt deleted file mode 100644 index 35e5bce4b4f88b19e5c7932711b4c1c8bf0328ce..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:128cb0fe4243dbb2ec45b6e104d765dae7fba4e6ed08cdb5e9136bac1d1d8c22 -size 1208232760 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/config.json deleted file mode 100644 index 9b5d569e29c34d1c28371f091e217b2290ffafde..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.035, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "0" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_195/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_195/ae.pt deleted file mode 100644 index 3ec9d9fde94cc6cfe7f36e797305c3c4a7e726f1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:94b2d3c50422f04a443b32a439c897098fbbc36aa205194d42848cd016a3b8f7 -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_195/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_195/config.json deleted file mode 100644 index d547bb13872f3fff95bbb5c4d9ddad4ace7a8783..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_195/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.035, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "195" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_1953/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_1953/ae.pt deleted file mode 100644 index a8bfb7a3456e537e8526bcfcf2b2f6bc31602304..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:96c629f309743528eae9100f7ad4de436f74372ec3ad4b9df2b8b42766e73928 -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_1953/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_1953/config.json deleted file mode 100644 index 94cc62b4447fdb46495178bd661278aea314ca74..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_1953/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.035, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "1953" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_19531/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_19531/ae.pt deleted file mode 100644 index d03f3c750e3cf6063bec91f54d78c06171e8fa9a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1d80023e2d3c4825e43bdf2863afe3be88422263ffbca3e22cf6f1c861197be1 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_19531/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_19531/config.json deleted file mode 100644 index 9be111f8a88319f13d87ea13c98b63f1dce663bd..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_19531/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.035, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "19531" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_617/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_617/ae.pt deleted file mode 100644 index 850a80a58d33d1c5171a581e552a2c21944c9a30..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c2154ad3037938d4584f8f6b38773f58fe3a28a1d95ca64122baa8b7ca6fe681 -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_617/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_617/config.json deleted file mode 100644 index 9aa9019a7c7e69a6321ead93f4f4bc71a06fcf10..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_617/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.035, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "617" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_6176/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_6176/ae.pt deleted file mode 100644 index c56d42777b02f9fbb92d1e4c636c1c9488ecdb62..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0fc3a384661f113926ac9709e5a0279eb5818f7c95d360459eea20e7783c1929 -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_6176/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_6176/config.json deleted file mode 100644 index e55f8639191b7d10b60faf0f1e4841607af8407e..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_6176/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.035, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "6176" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_61763/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_61763/ae.pt deleted file mode 100644 index d03af8f4d541219f7a4797f02583bd8e34285ee1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f2f5f81d086fdbb0d0c970b1a8592d474224cc8a10771351045fae65e5a11406 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_61763/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_61763/config.json deleted file mode 100644 index 3ee414a34d7223bad090753495bb7b66df22505a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_61763/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.035, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "61763" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/ae.pt deleted file mode 100644 index 35e5bce4b4f88b19e5c7932711b4c1c8bf0328ce..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:128cb0fe4243dbb2ec45b6e104d765dae7fba4e6ed08cdb5e9136bac1d1d8c22 -size 1208232760 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/config.json deleted file mode 100644 index 1ad7b8cdc7336f95179634a513e599b12903fc25..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.04, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "0" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_195/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_195/ae.pt deleted file mode 100644 index 0816331c0b1b29f8825a43c0bc8157150f3072ce..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5c82ad7f17773d76485798e5bbfd41d1854d5d28cdce8015e1b537cf671197d1 -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_195/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_195/config.json deleted file mode 100644 index c1116d63353f9972a88f2bfdd114456e7cb2195d..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_195/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.04, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "195" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_1953/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_1953/ae.pt deleted file mode 100644 index de3f6ea794a70667345a463ba043b8af69a687a7..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6cfe58ba4ea5e4aa094a4d7f41bb1d067965ba57ed9c342c81335f62b8863ba8 -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_1953/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_1953/config.json deleted file mode 100644 index 6e22d5f9ed79283b6b0c8ab2e7706d7c787ad5cd..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_1953/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.04, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "1953" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_19531/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_19531/ae.pt deleted file mode 100644 index 745aaab27469246655c3d07cc157313de4e11027..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:64f7c9c06f1e41050ad18309eaf59b11e5d60b9cad6cf323353f67cbf94c6893 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_19531/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_19531/config.json deleted file mode 100644 index 3390109c86375c1da57713692b6e62951db7c9da..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_19531/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.04, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "19531" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_617/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_617/ae.pt deleted file mode 100644 index d52ce731f08bf2d0a225f3c7230d4b3898c9c317..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:375a73377c3ab24b5a2a3ea113530d00b47d856c236430df5841022e8680e79d -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_617/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_617/config.json deleted file mode 100644 index 7489c9a6a9ebb1bdb87a81cdb9de9ac44cabe6ee..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_617/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.04, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "617" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_6176/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_6176/ae.pt deleted file mode 100644 index 5e531823fa945153211e442da7f1bde150c954e5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:466756eef1a6aff1f13301308339b0e57502a85914d51a874f95531ef442020c -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_6176/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_6176/config.json deleted file mode 100644 index 5fb6eb8b31b605fa5035ad68ee183cd95490293b..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_6176/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.04, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "6176" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_61763/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_61763/ae.pt deleted file mode 100644 index 5979ec5292d2cc632878f3b694b39a9f6257798f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a75d62beba010099b105df801d0277ea97ee73b78aa42606ad714a21f2c8fa08 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_61763/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_61763/config.json deleted file mode 100644 index f236d6c71019ed33408c2f6bf430e6a6e171871a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_61763/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.04, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "61763" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/ae.pt deleted file mode 100644 index 35e5bce4b4f88b19e5c7932711b4c1c8bf0328ce..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:128cb0fe4243dbb2ec45b6e104d765dae7fba4e6ed08cdb5e9136bac1d1d8c22 -size 1208232760 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/config.json deleted file mode 100644 index 1ef2abdfc4760e9ce760978633b9da3e2fde70b4..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.05, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "0" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_195/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_195/ae.pt deleted file mode 100644 index a0eea3be695b9243449ffac6283825fbcada0398..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7fd81969d804d3b87a344c72d08d26dcb8a65c25dc87d818f875d4e2ac09f347 -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_195/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_195/config.json deleted file mode 100644 index 7040f519164590a9e16c19f6fcd72a390d370c14..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_195/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.05, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "195" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_1953/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_1953/ae.pt deleted file mode 100644 index e100945938f1a98af10e2960cfca6c7d15bdff52..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7dd1e2ddd31bf59234b04214e8231f913688d48efb36667e84dc5bcee4e39285 -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_1953/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_1953/config.json deleted file mode 100644 index e4e081d590b89a8ff7493b63928ee6a3a35a61b2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_1953/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.05, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "1953" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_19531/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_19531/ae.pt deleted file mode 100644 index b64c4a05f3e47cfde22bb9c4cf9c3b686a281a00..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:350beb4c71c62ff10017f1024b8888cffb47e03b4a9773357d800de783ae719e -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_19531/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_19531/config.json deleted file mode 100644 index bd808db494c2f17f4d14ea6a9cc81fa393e9cdf4..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_19531/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.05, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "19531" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_617/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_617/ae.pt deleted file mode 100644 index 6b1350298f00ce4f5ba9ffd79d8a9fdf1bba86d0..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9670c6f6089787461394123fcb0e28bcee2adda9d015d39578dabd3013931702 -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_617/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_617/config.json deleted file mode 100644 index 34d4c8bfd404157744a1c0c24f040e99378dd8f3..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_617/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.05, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "617" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_6176/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_6176/ae.pt deleted file mode 100644 index 6f477a50a7c39870b3a63478d68455bfc90bb34c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fe0c190a4648b9bf55ce354934aa1b21dd9a0e8900b4c256c7c164f11719656a -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_6176/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_6176/config.json deleted file mode 100644 index ea536936f2ee2378cf0dc5719e16d751488762cc..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_6176/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.05, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "6176" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_61763/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_61763/ae.pt deleted file mode 100644 index 235fefde7dc202d57dbdcfd5eac3dbe148e4a947..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9a1805452d79ba00cf56f6708d33abbd4113a1a462238fd92bdd3b068bc626fc -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_61763/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_61763/config.json deleted file mode 100644 index 1506cf245231242190f00e43eaa7f6a1a0948f2f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_61763/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.05, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "61763" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/ae.pt deleted file mode 100644 index 35e5bce4b4f88b19e5c7932711b4c1c8bf0328ce..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:128cb0fe4243dbb2ec45b6e104d765dae7fba4e6ed08cdb5e9136bac1d1d8c22 -size 1208232760 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/config.json deleted file mode 100644 index b1639ea66042048389e8ac376e6d9f3262db046f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.06, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "0" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_195/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_195/ae.pt deleted file mode 100644 index 7fa972e865713183fb4723b886dc4019e7ba3a54..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2bf92a9f845ab6e96cf23b872db200ccb62463b32b462eb08e34623d74b1bae8 -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_195/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_195/config.json deleted file mode 100644 index a8446ba7a6e06229857977103b86cc82cd4691bc..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_195/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.06, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "195" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_1953/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_1953/ae.pt deleted file mode 100644 index 5c90bbf07300bea87bb6dcb378a7f0b8376ab070..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:723da694f229e2cc820f256fcc59625311adee59ec8ba407ba9ee5cb07f4cee4 -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_1953/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_1953/config.json deleted file mode 100644 index 956ca468bf99f49040ee703161a3caf7a31adfce..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_1953/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.06, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "1953" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_19531/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_19531/ae.pt deleted file mode 100644 index 1b2a3e06e38ac5e0c9f83e4ab6e65fd6be1f8daf..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3409bfeec4f6af5b84b5e8069f2480961ecfe47c9db1b4d46463cf323a896549 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_19531/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_19531/config.json deleted file mode 100644 index a62ecb9505b03070c0fa18360225d1dcd54ca2ba..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_19531/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.06, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "19531" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_617/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_617/ae.pt deleted file mode 100644 index b86a55cd7f196144c4bf57536f49cd50731bab72..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e2d9d57d103ab9239adc7a5b2ed7eeeee575bbbe180e9410f17e1e35c4079e0e -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_617/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_617/config.json deleted file mode 100644 index d52b827b357feb7ac4797fa855509f812254e538..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_617/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.06, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "617" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_6176/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_6176/ae.pt deleted file mode 100644 index 43583529093f7e59395d12e531b3d231f7993299..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:acba9c1e3c7f02bbe3cc7e07975bafeda0770e29b439b9848991f67bca000620 -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_6176/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_6176/config.json deleted file mode 100644 index ee5441ce81b46613f97556728a06bb9f6b02923f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_6176/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.06, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "6176" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_61763/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_61763/ae.pt deleted file mode 100644 index d06c931fb787eae696a162adcc2b03d729ff1cf5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d168baccfc05737d21ef2caa6c5b9d86e4ad34a94c12fb1d66d8e4583479990a -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_61763/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_61763/config.json deleted file mode 100644 index 230c703b7168f116a22f19b16398e8b113e2c604..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_61763/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.06, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "61763" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/ae.pt deleted file mode 100644 index 35e5bce4b4f88b19e5c7932711b4c1c8bf0328ce..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:128cb0fe4243dbb2ec45b6e104d765dae7fba4e6ed08cdb5e9136bac1d1d8c22 -size 1208232760 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/config.json deleted file mode 100644 index 70712938dce90bbe62ded1b59bd3c4c8690cd2b0..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.07, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "0" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_195/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_195/ae.pt deleted file mode 100644 index 213e466b03f8388c53c2d614cb26fccefefbacf5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:88f0b478c66fffadf534e4f6a7dfbb917e32bddb58f8d9ce4ef74db321115a87 -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_195/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_195/config.json deleted file mode 100644 index 1d02330b0d653cc6219d8a720c9655a1d34b1a65..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_195/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.07, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "195" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_1953/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_1953/ae.pt deleted file mode 100644 index d9f4d3cfba433267dcf9437bd57a5e9bd0f9adaa..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e2fb50e65f2d332e85f0961d41654887db6fd7402406d803c23756f6ec584c9e -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_1953/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_1953/config.json deleted file mode 100644 index 3dd2ceebc2f5276219dfbbcae1ef9a0808a7ab68..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_1953/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.07, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "1953" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_19531/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_19531/ae.pt deleted file mode 100644 index fa8f6870072dd28af60a1ceeb19f4eb43642c5e8..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c8cb71e72be70cd78bc523888cd75e9883650cceb6b3cd19ea44fe53ea419887 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_19531/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_19531/config.json deleted file mode 100644 index edba5e389059c641a76cae4c68fa25c2f21a6d59..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_19531/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.07, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "19531" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_617/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_617/ae.pt deleted file mode 100644 index bbcb92f7574d0b6fb6d8a4c152ea9c5e518b555f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fa2a3c3c4bfa963b1fb66c98d0086384ac5925ec62fae1672fd7d3a2cdbcdc2d -size 1208232776 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_617/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_617/config.json deleted file mode 100644 index 0649fec1ff6703e40bc45da433e0b3d69f6464e5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_617/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.07, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "617" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_6176/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_6176/ae.pt deleted file mode 100644 index ff2ea936f55bce303d04fe9d837077e4de241426..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:86eb270a7595b6b10859a91cde15f979671cf03d9fdd0ce692cc8cc9ea169a61 -size 1208232848 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_6176/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_6176/config.json deleted file mode 100644 index 3692e64b731ff3e6cb614b7c20bbd1689f60ef84..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_6176/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.07, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "6176" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_61763/ae.pt b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_61763/ae.pt deleted file mode 100644 index 5c965e853a10c6aec489fe8b323a81c06abcd8bf..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:289536d9c4d1fd92c8160c6e56f7c8c810d35eafc6f4b88379413fab1ec4cc04 -size 1208233048 diff --git a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_61763/config.json b/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_61763/config.json deleted file mode 100644 index 7c7e833dd7a0c38a2dddd272314d0a94680b7c90..0000000000000000000000000000000000000000 --- a/gemma-2-2b_vanilla_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_61763/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "trainer": { - "dict_class": "AutoEncoder", - "trainer_class": "StandardTrainer", - "activation_dim": 2304, - "dict_size": 65536, - "lr": 0.0003, - "l1_penalty": 0.07, - "warmup_steps": 1000, - "resample_steps": null, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5", - "steps": "61763" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 32, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file