diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/ae.pt deleted file mode 100644 index 9f91c26925465dda4babcff5a3a0161738b8920c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c2fa6020d346a61f1248b174c40ae3a225c988426c118ed376952b74cc14a391 -size 1208232760 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/config.json deleted file mode 100644 index f5f6c17d57c5b99249c4add22b64d208990b20e1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 20, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_308/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_308/ae.pt deleted file mode 100644 index 973a74a62b1046890b43720424525b3df1164a8a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_308/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2936474d9c934443b3d5369b94bdc45053a7f4b2b5ba89cb53fc2651dccce915 -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_308/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_308/config.json deleted file mode 100644 index 760ed4b0fa1f98a7fe539f6e25948362891965a5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_308/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "308", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 20, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_3088/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_3088/ae.pt deleted file mode 100644 index ae90eb4c3a9d051a6ba74f85a7851afa01f0ac66..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_3088/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3e1e3d667af479cce5692ac6aab166258cacf1ed4d480fbd80eeadb32127315d -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_3088/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_3088/config.json deleted file mode 100644 index d3ed18524e1161a09ec9b8451036ab8a1c135fa0..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_3088/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "3088", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 20, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_30881/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_30881/ae.pt deleted file mode 100644 index b88aee2e97c6e24d8a660b3785762ca0f332e1ba..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_30881/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1ae2e3b8be3f90444c4496646fb6aa604f0c2c7809b62a0d8608c47d1e697a2c -size 1208233048 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_30881/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_30881/config.json deleted file mode 100644 index a5bbf33b6c21b80f07861025ab91d44ca45ecfd7..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_30881/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "30881", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 20, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_97/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_97/ae.pt deleted file mode 100644 index ee24e29c6efc45f42561510365053ebf247f7e4c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_97/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:98396469af5a09409acad191e2fb8637e647029ad7fe6764ea11b847b1471e6d -size 1208232768 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_97/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_97/config.json deleted file mode 100644 index 028c98cf8fee133c17aba70e53b113e923c6c1cc..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_97/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "97", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 20, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_976/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_976/ae.pt deleted file mode 100644 index 2ebae94e9be697b6b1a80a0d86e16d39c98c197f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_976/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:72247aad0086f6772c263e029965661f81a79ea11caae94727f16d95c07d313c -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_976/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_976/config.json deleted file mode 100644 index 09063949120a1203154d62c43886b8ce8ebfdd6d..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_976/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "976", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 20, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_9765/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_9765/ae.pt deleted file mode 100644 index 40dd21ac7d496e3636df93a54b447b75bca1c077..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_9765/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8de72270cab9c46aa2cdb3c51a7e986bab6f43b2e5512a1d77f4c43613e20e4e -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_9765/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_9765/config.json deleted file mode 100644 index 80b0d76eaf22b0a203d03b6092bb8719ac4a2e25..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_0_step_9765/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "9765", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 20, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/ae.pt deleted file mode 100644 index 9f91c26925465dda4babcff5a3a0161738b8920c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c2fa6020d346a61f1248b174c40ae3a225c988426c118ed376952b74cc14a391 -size 1208232760 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/config.json deleted file mode 100644 index dc776d2046806eb569f5e55f887eae44a103d188..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 40, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_308/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_308/ae.pt deleted file mode 100644 index c2c5da148cdcd94dff9f61e014f20bdacc9ff08e..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_308/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:610e1d15ff4fcb05fe0db164879b316f1205732e25850e145091c9cb48bfa09c -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_308/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_308/config.json deleted file mode 100644 index 34bcb2f70999246e0fc515625435ee5c2d9187e0..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_308/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "308", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 40, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_3088/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_3088/ae.pt deleted file mode 100644 index ecef60e1823561fbce88eee519f44413987ec7d2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_3088/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9d9d3b8aef0f52860267de45ac12977fe86826f35cdb6b87a3829673a37c36cb -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_3088/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_3088/config.json deleted file mode 100644 index e7869912100c2521663c3266f9d850afb695f818..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_3088/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "3088", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 40, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_30881/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_30881/ae.pt deleted file mode 100644 index a6736b1de0b6a87e46adb4e7b9d35cd8c63dfe39..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_30881/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8190d85699dad6aaeef16cad0731e96b63676f479e8f4fe151062e2eece8e4aa -size 1208233048 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_30881/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_30881/config.json deleted file mode 100644 index 8287051f7f2f5a9631c318026c1529e987b6a662..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_30881/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "30881", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 40, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_97/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_97/ae.pt deleted file mode 100644 index 1a09daf61b17f175b471f27031d2c5a9d5344fc3..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_97/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8e5458365646730ae06d8e514b5c728bd501dab0ba227af64729218b2c76dd9d -size 1208232768 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_97/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_97/config.json deleted file mode 100644 index 87ba0b65e19147eecdda3155f5179689ba82b90b..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_97/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "97", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 40, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_976/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_976/ae.pt deleted file mode 100644 index b9f645e06d583cbdf81d1eb7eae33793966e6031..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_976/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e4a2260a96e754b304bdbfda0175f9dde53527e2c3cc76023e1f21eadc6889fd -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_976/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_976/config.json deleted file mode 100644 index 151644f8d99eb21bd9f63019c0d4f16b8228aeb6..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_976/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "976", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 40, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_9765/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_9765/ae.pt deleted file mode 100644 index 2e29a7327d35c4923a9c2aeb038a4026c8174ce5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_9765/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c4fafb152c01023057a05eb8d0e2f2b50263ce78eb201cb1269ce0dbbc5c7585 -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_9765/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_9765/config.json deleted file mode 100644 index ab700373567238ce23cc2bdd3a6c72bb7cdbc176..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_1_step_9765/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "9765", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 40, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/ae.pt deleted file mode 100644 index 9f91c26925465dda4babcff5a3a0161738b8920c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c2fa6020d346a61f1248b174c40ae3a225c988426c118ed376952b74cc14a391 -size 1208232760 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/config.json deleted file mode 100644 index 3e6415b24fe46d6ea879acccabb8311e690bd47c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 80, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_308/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_308/ae.pt deleted file mode 100644 index 421bd8078bf805e8236ee914b61cbdb1cad2df53..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_308/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:819dec7bf756472ec9ad3ce387cd15ff50e18491d98df4775c70db889f84745e -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_308/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_308/config.json deleted file mode 100644 index b8a8a2aae9387b1dea2d90f5bda4891a9ede947b..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_308/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "308", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 80, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_3088/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_3088/ae.pt deleted file mode 100644 index 70eb52aae3a63ea451f01fb16cf4c18c5c8359db..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_3088/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4956f6f43595e7dc95488bf8f4eac64e76b2b22f50d0a488bcc5088a229747c8 -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_3088/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_3088/config.json deleted file mode 100644 index cca52be82b03456fc1d4161b43a1d63c2440b348..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_3088/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "3088", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 80, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_30881/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_30881/ae.pt deleted file mode 100644 index 2dd4cabccb157563ca0fb6b2837313fd59215719..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_30881/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2b8ca264d34fc9c813271d4740f8354d920adc3a8bb2575e010e191f6d652af8 -size 1208233048 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_30881/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_30881/config.json deleted file mode 100644 index 8593f979a7492addb7aead09b0f72d9b6088ffd7..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_30881/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "30881", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 80, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_97/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_97/ae.pt deleted file mode 100644 index 412d83236bf06a8e8cffd1f5f29fe5508f7f31e6..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_97/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:435d42cfbfe4fb8260ba563ecedb62184ff808afd8f7070a8c23b2b1f503838e -size 1208232768 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_97/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_97/config.json deleted file mode 100644 index 2b8a18cd614d0a945068de20924fc185d109b31e..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_97/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "97", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 80, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_976/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_976/ae.pt deleted file mode 100644 index dd827d235eeec470656a8c216f730b6dad6582f6..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_976/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f8af3df52dba4e0b8ae0f464cf3c7c7c2fc55b12e7e1ebd5e325e49f5d487b69 -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_976/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_976/config.json deleted file mode 100644 index cdf6417992e880fb7b1bd24b58df16b2d2d40eae..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_976/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "976", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 80, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_9765/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_9765/ae.pt deleted file mode 100644 index 42019e57b978ca42f2993bf4c3eac13fd7606455..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_9765/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:025b7d7aa2e0085f3c34e1cff16b900a16cb18bf6e8d8e7984dfead442d22ca2 -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_9765/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_9765/config.json deleted file mode 100644 index 2b94e6d5828bb5e8684c0d685d058b70b7bd6fb9..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_2_step_9765/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "9765", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 80, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/ae.pt deleted file mode 100644 index 9f91c26925465dda4babcff5a3a0161738b8920c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c2fa6020d346a61f1248b174c40ae3a225c988426c118ed376952b74cc14a391 -size 1208232760 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/config.json deleted file mode 100644 index 9045ad04508b7a5b8d9e53399e41894fb19035a7..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 160, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_308/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_308/ae.pt deleted file mode 100644 index 17f10a0cee69a3f0b6cb74495c95cd887b79e970..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_308/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f1172e3e921375af16476b723059354adca19d37dadbd0e5c022ba9cc633bec2 -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_308/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_308/config.json deleted file mode 100644 index 0fd46d917df3414969bde32dbcd712114a7d1ac5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_308/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "308", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 160, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_3088/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_3088/ae.pt deleted file mode 100644 index 8247d769d39658c211484b3ca54d83ab4adb8ff3..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_3088/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:12b637cb1114124801da785a1af70fd65bce57142a6d7bc824308e49caba8a64 -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_3088/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_3088/config.json deleted file mode 100644 index a51bb293523dc5254ae5c7942e06528d4e6ba28b..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_3088/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "3088", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 160, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_30881/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_30881/ae.pt deleted file mode 100644 index 42d5aa81d29b0feef2574461a7739ace879cbb71..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_30881/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:821b99c90698176c46a4ad714484fbe8f816ed7deb4cd1b0fde7b2791d5f0a6e -size 1208233048 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_30881/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_30881/config.json deleted file mode 100644 index 33a381be79328f832a5e282870ea661046fb9c18..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_30881/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "30881", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 160, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_97/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_97/ae.pt deleted file mode 100644 index 4b35a637f57e27d505396ed100f717949a6e47bb..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_97/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9dbeb3944bfa5aed345d091ecb19eae1873bdc00720b533dc196b0e5cee2def9 -size 1208232768 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_97/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_97/config.json deleted file mode 100644 index ea6bfce4be4b380a1003faa9cba83b32be172d7f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_97/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "97", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 160, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_976/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_976/ae.pt deleted file mode 100644 index 692321cf7418bb7e70110c7937bf33dc8f7d54c1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_976/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:27172f07df06c92c65a02235ee3e4a47b5045307c77f5ca1213c2ca93cf695a4 -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_976/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_976/config.json deleted file mode 100644 index 3045e36c7652921768d32125931a6066a44c0692..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_976/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "976", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 160, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_9765/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_9765/ae.pt deleted file mode 100644 index de2631d782146c4354115ce0e723c02d2fabedd8..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_9765/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c238784c8fa39b48277e1b47048027e553add8e2e0d5f1f46c21e18150c8cdfa -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_9765/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_9765/config.json deleted file mode 100644 index 05b8ad7fa8aa6ef048ece7e4be542276a046d97f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_3_step_9765/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "9765", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 160, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/ae.pt deleted file mode 100644 index 9f91c26925465dda4babcff5a3a0161738b8920c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c2fa6020d346a61f1248b174c40ae3a225c988426c118ed376952b74cc14a391 -size 1208232760 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/config.json deleted file mode 100644 index 2d84c7f8eebb88b6a6dbb063bb90f51fd4bad05e..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 320, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_308/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_308/ae.pt deleted file mode 100644 index bd417def2ad8d4f9a9192fbccea5513454e35e2d..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_308/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f6081a5b6e5a30ecd8aca0d29bf0abce3a76c011ca0ed199b081c2d5ca38c61d -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_308/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_308/config.json deleted file mode 100644 index bd7c5f9cdd5474e69062bd40120b83336c1ea013..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_308/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "308", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 320, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_3088/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_3088/ae.pt deleted file mode 100644 index 1109ef1883b684035d5843eef6e0f6f1bffba88c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_3088/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:edc3845bda73209ad791526f730e4caa8fc27fdbedc7e0e9fb881e49ef11445a -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_3088/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_3088/config.json deleted file mode 100644 index e62f5a40085e57ade88bf796bb9d5a238b92f056..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_3088/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "3088", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 320, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_30881/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_30881/ae.pt deleted file mode 100644 index c85afef37672616b4a737e3fd053e6f19a2b652f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_30881/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0923a9e807e7d0a15948d7da2e9afbe095a1764d850e889807b99744816358a7 -size 1208233048 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_30881/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_30881/config.json deleted file mode 100644 index 0aa4414fbe70ee2762cdb6f6620aee0f63dc5b0a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_30881/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "30881", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 320, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_97/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_97/ae.pt deleted file mode 100644 index d941612ab079cb3219480d56b9b9db158c5d6896..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_97/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0edfd6bc01706233b5a034332879fe5ea2c49ca0d42f8c4c1ee249562cdefcf4 -size 1208232768 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_97/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_97/config.json deleted file mode 100644 index cbb542011b51df679b800e440b3ac5c4e86257a2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_97/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "97", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 320, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_976/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_976/ae.pt deleted file mode 100644 index 964de01179fa129dddb51fb7edaf4f70b2a53c68..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_976/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2236f43033c1069cda9177a1233a487b1f23c71a92ab8c6277fa7e0753098f24 -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_976/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_976/config.json deleted file mode 100644 index 35d168e1569ba0e0eced1b7e01be04e4a2e38cd7..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_976/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "976", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 320, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_9765/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_9765/ae.pt deleted file mode 100644 index d63e7208da96d84c3907b8a7d74acdae88d47c56..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_9765/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:85e6bbd8e3bf2d890f516d488d66eaa7d887f3ca1ef90ab28a411f4674747957 -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_9765/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_9765/config.json deleted file mode 100644 index 8b895f0aecf321f31e6c91c2b9659dd416a67bf6..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_4_step_9765/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "9765", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 320, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/ae.pt deleted file mode 100644 index 9f91c26925465dda4babcff5a3a0161738b8920c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c2fa6020d346a61f1248b174c40ae3a225c988426c118ed376952b74cc14a391 -size 1208232760 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/config.json deleted file mode 100644 index ea53b33ad2144d200f8126be541ec3c69c769003..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 640, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_308/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_308/ae.pt deleted file mode 100644 index 13aba694a9f5820a52bcd952907b90e946145827..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_308/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:75a6abf7f8b3922cec39af58fdd26a6430c1a3c8e7a4045ef17aa7e8a565609b -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_308/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_308/config.json deleted file mode 100644 index 744869cde9b08744c5a3eb480c681528173a9028..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_308/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "308", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 640, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_3088/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_3088/ae.pt deleted file mode 100644 index 6cdae55abf7b76eecdae06ea7b3dd4f4416a60da..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_3088/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:344408d5a9da83ab4e40e9a0088c345b0a4027bc2664759fc28122eeabc9c766 -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_3088/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_3088/config.json deleted file mode 100644 index 1c26e9c3c3ca1cda3d213d3ea04a1c98a40aa971..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_3088/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "3088", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 640, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_30881/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_30881/ae.pt deleted file mode 100644 index 665dbc989ad506f13c5022b20e57278c6c7ee41e..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_30881/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:511c2d9cebc5831b10c25f07676123517d73039146d12201f7f9b171fe045541 -size 1208233048 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_30881/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_30881/config.json deleted file mode 100644 index baff67436379a82b3c647e3d5adc87afd997e89d..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_30881/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "30881", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 640, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_97/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_97/ae.pt deleted file mode 100644 index 941c9925e8c3375f68a372b2699d86274cb3bd5a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_97/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bd39ad6897102b5a94bf2ae7b4f54568f348af31ff9f27459f8a15aab9e7a13d -size 1208232768 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_97/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_97/config.json deleted file mode 100644 index 263819313122c4f2081537dd8b8edddff605d39c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_97/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "97", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 640, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_976/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_976/ae.pt deleted file mode 100644 index 5afee02f645e46a5b84dbe6b96f725106ae4a10a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_976/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9cefcd92ddc24cbafe039584f0248a9890bcd164736643da22eb0fc7055da0bc -size 1208232776 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_976/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_976/config.json deleted file mode 100644 index 763c8f27a6e197b0e8a11d7a620253fe239bc366..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_976/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "976", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 640, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_9765/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_9765/ae.pt deleted file mode 100644 index d891c550fb07a82cef7cb7c1ea8c0c59693fb4cc..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_9765/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e76fb79765eda9f2834bb29299a1e279a97d9a2c35e61fa41ce618d906b70ec3 -size 1208232848 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_9765/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_9765/config.json deleted file mode 100644 index 01ff5b9407287f774963024ebbab6fc6cb37a06d..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_5_checkpoints/trainer_5_step_9765/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.0001, - "steps": "9765", - "seed": 0, - "activation_dim": 2304, - "dict_size": 65536, - "k": 640, - "device": "cuda:0", - "layer": 5, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_5", - "submodule_name": "resid_post_layer_5" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2048, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 4096, - "device": "cuda:0" - } -} \ No newline at end of file