diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_0/ae.pt deleted file mode 100644 index c1b20f921383fb62d38c3ae1c0c692f4f27f7fb1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9882317ab593dbcdc4c1289214117307d075cff2fe9c60af6b59cb1009c8b014 -size 1189354296 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_0/config.json deleted file mode 100644 index bcdcf300a8c7c46181df0f36777b9b1110357265..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 20, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_195/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_195/ae.pt deleted file mode 100644 index 2785c62173d33439c0871584da8f9596a5396357..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ae513ee96d00f991d178c3175705385db954be2ace3c14c55d8fe5afe53e1240 -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_195/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_195/config.json deleted file mode 100644 index 8a903ef63d6f557153f5b1dac04284f2291d6ff3..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_195/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "195", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 20, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_1953/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_1953/config.json deleted file mode 100644 index a6f73fa1bbc5a9646babb534e73083fd8766ad73..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_1953/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "1953", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 20, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_19531/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_19531/config.json deleted file mode 100644 index 23119c8ac6e4a0114fcf5fa90318289b0cde4169..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_19531/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "19531", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 20, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_617/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_617/config.json deleted file mode 100644 index 5e04f05fe587b134b79c0f01a1936636d2a1d983..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_617/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "617", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 20, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_6176/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_6176/config.json deleted file mode 100644 index c70307fe72fec2849900bb4fcde41f9fc26ea455..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_6176/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "6176", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 20, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_61763/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_61763/config.json deleted file mode 100644 index aa91edeaf8814f58d6fc1a116258a797b0619768..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_0_step_61763/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "61763", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 20, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_0/ae.pt deleted file mode 100644 index c1b20f921383fb62d38c3ae1c0c692f4f27f7fb1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9882317ab593dbcdc4c1289214117307d075cff2fe9c60af6b59cb1009c8b014 -size 1189354296 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_0/config.json deleted file mode 100644 index 5831a7512a977d3551501796c1c8662569aafcbb..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 40, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_195/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_195/ae.pt deleted file mode 100644 index 9b210aae9aa35aee110377b8b9e434a787d32665..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9e0f5988fd15c6170506894e6309023c272e4c9aabe7cb807b434088799c6c67 -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_195/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_195/config.json deleted file mode 100644 index 897529480126ac429cddd054811bdf02019b1cef..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_195/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "195", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 40, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_1953/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_1953/ae.pt deleted file mode 100644 index 79d744d9442513bfb508b0f79e4967e65bc9a19a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:11ecb94de0079b249ace915f6fb558ef187a11b5fd463fb3a65ebe0dff5850ca -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_1953/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_1953/config.json deleted file mode 100644 index a9013d02cf990d82bed6bb9f8fecd5ccf2c21516..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_1953/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "1953", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 40, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_19531/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_19531/ae.pt deleted file mode 100644 index efe81c55a62bc7a9bda85e0e7a034ed498a2786e..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d12aa6d1d0167c0cfa925610f1ea27c8fe56a5a382635f31c9d5e68211dec97a -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_19531/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_19531/config.json deleted file mode 100644 index 25dc02b3faa0c472774be9aee5978a2d196b3be2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_19531/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "19531", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 40, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_617/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_617/ae.pt deleted file mode 100644 index 816e6dd55c4e9e56e8f8f7f9b031298296aa07f2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ea8ec2b4131dec7f52d2772af0502e3658008b5f0cf35af2529d80256a12a350 -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_617/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_617/config.json deleted file mode 100644 index 5ccc3e855d459b1a9489477ebe9d7c0eed2c58b3..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_617/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "617", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 40, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_6176/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_6176/ae.pt deleted file mode 100644 index b7f856c362da38c3c771d2e4ffecd4c68ebcf627..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5169cb2decddc91af20ec1d2aa1681bb7c9d75f74ce4052c72d7d6c6b2305fad -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_6176/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_6176/config.json deleted file mode 100644 index d53491b8edfa669edfa759bd2109571f2d2e67c9..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_6176/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "6176", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 40, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_61763/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_61763/ae.pt deleted file mode 100644 index fa0b868486fdf16413d4ba0cc7b4aada31d43df2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a1d7aeef9a3f42b21329ff32e0f6b3b3092d71e36d7c455c3c402186b1ddf1d9 -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_61763/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_61763/config.json deleted file mode 100644 index 4958588cb58c481c6d0dddc5bb5bf2b7eddeaa46..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_1_step_61763/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "61763", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 40, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_0/ae.pt deleted file mode 100644 index c1b20f921383fb62d38c3ae1c0c692f4f27f7fb1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9882317ab593dbcdc4c1289214117307d075cff2fe9c60af6b59cb1009c8b014 -size 1189354296 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_0/config.json deleted file mode 100644 index 51c298759ac313dd133a8dc8a5977886826a6109..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 80, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_195/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_195/ae.pt deleted file mode 100644 index c67ef34099dc88020c9c2edcfec06261eb2203d2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0b5f543a8b790108264e9f11a9bc5f39e4246abca94d7ff43339d7245acc2f0e -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_195/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_195/config.json deleted file mode 100644 index faefab690106b5a4ff1f4e1373ff71e360690cdb..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_195/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "195", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 80, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_1953/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_1953/ae.pt deleted file mode 100644 index 62ac020599e785f88a33ac053ae05a1b2825cdfe..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1c98dc746b35b2de998cd9f3c2c1bfd483ef2bdc789f60bcb1b041acdde97917 -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_1953/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_1953/config.json deleted file mode 100644 index 5f9ad7a501398453415e0c0335f1c3b9b9bdde0c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_1953/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "1953", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 80, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_19531/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_19531/ae.pt deleted file mode 100644 index 937d83b6a43a55a59a7aaf1c6088058d787d7209..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6a4ed0c6f1c643f7857f1ed5863f02881d061cb2664272488cbbe6b1a995bd78 -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_19531/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_19531/config.json deleted file mode 100644 index fd9295c5a964e68fa883043cabe98c7556e8f018..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_19531/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "19531", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 80, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_617/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_617/ae.pt deleted file mode 100644 index 080529795a52edaf8f17d5453fb0d651ad2b7f75..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8f5a58bec7b367bed4f09c06fc8f6bcc96f9f78d8fea6812979aaab284ade153 -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_617/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_617/config.json deleted file mode 100644 index e030c82081e27bb2b67663303cd2a7f3685972d3..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_617/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "617", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 80, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_6176/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_6176/ae.pt deleted file mode 100644 index 572c5e994894440783e50ac7879fdb7a8b3e61ab..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:04d8b0de11a5d09081caf84c4b823e891a6c2a6977acf5e1c9a25f845dc05b7a -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_6176/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_6176/config.json deleted file mode 100644 index 1a1e13809963122f8ce29e725c1a12f3c45a8489..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_6176/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "6176", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 80, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_61763/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_61763/ae.pt deleted file mode 100644 index be1d2747f1fbed3c6da19731e1244ea96c3777b0..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c65b8a48410eec893b0937ebb297ab23dabea2eea039ab0b109adacd02c42a06 -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_61763/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_61763/config.json deleted file mode 100644 index d8e022cfa7e263d4c9638c20ada654091e46fd10..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_2_step_61763/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "61763", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 80, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_0/ae.pt deleted file mode 100644 index c1b20f921383fb62d38c3ae1c0c692f4f27f7fb1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9882317ab593dbcdc4c1289214117307d075cff2fe9c60af6b59cb1009c8b014 -size 1189354296 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_0/config.json deleted file mode 100644 index 1dda5d9193b80e28f8790f634dbc725b37d4995c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 160, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_195/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_195/ae.pt deleted file mode 100644 index b0282c9e730c35cac4c20ade5a072d4b32d4e3dc..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:71fb799dd4d8d998590171679863d0d7177a214a78563cb687ef62821bf4a7a8 -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_195/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_195/config.json deleted file mode 100644 index 1fb8962a752150badd59c46dc544299fb9f80bf2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_195/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "195", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 160, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_1953/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_1953/ae.pt deleted file mode 100644 index 55137de38390e2e47f7bbfaa17808648d7099dd3..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:33b132d92e179c7887e837bb409d19ff97240b686b001e2091dac81e5601675b -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_1953/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_1953/config.json deleted file mode 100644 index 04deba4556b98a992f559ffc335b7aa0ca4f1db5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_1953/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "1953", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 160, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_19531/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_19531/ae.pt deleted file mode 100644 index 929195310143619de214f7e2bece4c5a423e42ac..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8cfbbcd14b061661c6351f3e166f8b13698160bde5b250b67b0b0b07795b0a09 -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_19531/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_19531/config.json deleted file mode 100644 index d2d71cc819c6406ee7726fe152eca8a4f7121c95..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_19531/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "19531", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 160, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_617/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_617/ae.pt deleted file mode 100644 index 5b2f1006cd761a2477f6b7fda02e3281a015e279..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6224021693529c16c3807f387250ee50a1cee07255b7bfb129072e45ddaf21db -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_617/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_617/config.json deleted file mode 100644 index cbf55e339b2cb3c6427911d3c61a8c3ea6297ff9..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_617/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "617", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 160, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_6176/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_6176/ae.pt deleted file mode 100644 index 8a3cf254d3540370b8f2de10ba95c244d43faa8c..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7e026a8e2e8a265e55f787540211dc8ff9ca74b534e1e9349ae9f7cba55f05a4 -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_6176/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_6176/config.json deleted file mode 100644 index 9f971bd71b2721f5e1fc67c643bdfa215b2478ad..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_6176/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "6176", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 160, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_61763/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_61763/ae.pt deleted file mode 100644 index 8e9584f08dcceb54b61fdfdf22537b6a43373263..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f8d63b38228f299c9cf43ec402178f21dd6ec564cd91ff3bbd913f96e5b5486b -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_61763/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_61763/config.json deleted file mode 100644 index c3ce1207b26713a03d7036d02669e01f4057238a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_3_step_61763/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "61763", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 160, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_0/ae.pt deleted file mode 100644 index c1b20f921383fb62d38c3ae1c0c692f4f27f7fb1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9882317ab593dbcdc4c1289214117307d075cff2fe9c60af6b59cb1009c8b014 -size 1189354296 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_0/config.json deleted file mode 100644 index 8368acf4a36031819f3b3fe6731b2fc4c2639835..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 320, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_195/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_195/ae.pt deleted file mode 100644 index ee95e6fbc1854201ddb70ba4624b320d7b54ae7f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6265f4118f240523af0d2fa9a9d7e595109d58a45c62671705466b4e16eef4a6 -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_195/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_195/config.json deleted file mode 100644 index 58d5980b15870bcc58a267e23651b24dec15fd1b..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_195/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "195", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 320, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_1953/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_1953/ae.pt deleted file mode 100644 index dc2408d340654255d69c275e9e4db9b65e3cf314..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:547f0cf26b2cbc0e0045eacde8e9bea6f10fdbb53b6602e17adf7dee6e143c6d -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_1953/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_1953/config.json deleted file mode 100644 index a93e839623cf2b453b06a9d2de176ea701c19a2b..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_1953/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "1953", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 320, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_19531/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_19531/ae.pt deleted file mode 100644 index 0d5a928e21c760ff8740eb91845e7d9a316bffa5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:29e854c7888f4ff4d99c26160d280a06d9ef75d7f65e82410772159fb4312ced -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_19531/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_19531/config.json deleted file mode 100644 index 806ab56acc235eb60c3cd1406a02fa6367f3b543..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_19531/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "19531", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 320, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_617/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_617/ae.pt deleted file mode 100644 index 7b864bc32514b71fab3518472b3812e122fc273b..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a0db784a9a2f3d807be507b5fe2fd4f476a36ef24e2b47729e07c1b7de89dbb7 -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_617/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_617/config.json deleted file mode 100644 index bf8a86aac9d852b6f96a18382df0689999da0cd2..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_617/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "617", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 320, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_6176/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_6176/ae.pt deleted file mode 100644 index ef450d2abd333f72e65c9e5133c6e8557b0b870e..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e248d69606a34cdd29551a14bf37b09d2aacdb4e328760ca18f575809a4bed3f -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_6176/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_6176/config.json deleted file mode 100644 index 3d8868d686ad99aa0ce96323fa984ef3eff17cf1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_6176/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "6176", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 320, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_61763/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_61763/ae.pt deleted file mode 100644 index c4a8383f9d7814511ae7f01c490318fbaf10a421..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f4e079da5092a95a27d21ea65a5effa1cd29875878ff8638d1d05657cc9a8c11 -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_61763/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_61763/config.json deleted file mode 100644 index 5ff384a0d5e076479185ab4b75dd1dba46c51b47..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_4_step_61763/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "61763", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 320, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_0/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_0/ae.pt deleted file mode 100644 index c1b20f921383fb62d38c3ae1c0c692f4f27f7fb1..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_0/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9882317ab593dbcdc4c1289214117307d075cff2fe9c60af6b59cb1009c8b014 -size 1189354296 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_0/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_0/config.json deleted file mode 100644 index 2677e8a0369966694e13ce7d7275757c99657230..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_0/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "0", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 640, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_195/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_195/ae.pt deleted file mode 100644 index cd55dacfe3ebe7356de054ed69b337e1a50e55d9..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_195/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a03f5b69235ebc0d53c815000a5057eaceffc7cbfed4b2a934b566225a214c35 -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_195/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_195/config.json deleted file mode 100644 index 7c39d7afee7b831dc4591e6604d2baf5bd6cbeac..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_195/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "195", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 640, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_1953/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_1953/ae.pt deleted file mode 100644 index e68f4849344b21d3b84c803bd3128cc0cb3b72f5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_1953/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:47e53188eb1f14494a6053f0d85dc1e77ec9640ebfe036723df214d65a752189 -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_1953/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_1953/config.json deleted file mode 100644 index 9af9513425336b178f639959ec79546df646b5ab..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_1953/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "1953", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 640, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_19531/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_19531/ae.pt deleted file mode 100644 index 4c00dba8085d5a560dd4da7a0f833b1b73282850..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_19531/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:18e68e756e2890f6a56ca5c2d7f01b7a181e9b0eccbe0bac6ba7883ab73e5bad -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_19531/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_19531/config.json deleted file mode 100644 index a6ef092f5da7117e51af89bcb851c56e81007e97..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_19531/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "19531", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 640, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_617/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_617/ae.pt deleted file mode 100644 index 8457ca7d867241392c6147c3d58a3accddb9dd0a..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_617/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2bfb718b5f994943cbae3bbeddde1867d24514e32b6bcaeb6d4d9dfe9cb06fbd -size 1189354312 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_617/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_617/config.json deleted file mode 100644 index 2c4109a47de6efd7f788a9c4dce4a11ad452b62f..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_617/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "617", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 640, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_6176/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_6176/ae.pt deleted file mode 100644 index fde6cd97bdb4786b7fc410a15576d7d201424dd6..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_6176/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a7a24e6855d3e2d1e5c130e6dab38ba0f0cac6a57dbe5090edd496d03c21d7ad -size 1189354384 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_6176/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_6176/config.json deleted file mode 100644 index 5094c6bace8d5ab73da06dd40903acd6469460f5..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_6176/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "6176", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 640, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_61763/ae.pt b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_61763/ae.pt deleted file mode 100644 index d9f31dd0c763c3391dbacd457e0d6fac54d2dbdd..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_61763/ae.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d09c8c7ed714713fd1a5c8446aab9cfc2f912c26792dd9039f97b4525f908ce8 -size 1189354584 diff --git a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_61763/config.json b/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_61763/config.json deleted file mode 100644 index c6389b8b9fc95ce6b611aaeea7be739f8916ea0d..0000000000000000000000000000000000000000 --- a/gemma-2-2b_topk_width-2pow16_date-1109/resid_post_layer_19_checkpoints/trainer_5_step_61763/config.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "trainer": { - "trainer_class": "TrainerTopK", - "dict_class": "AutoEncoderTopK", - "lr": 0.00010079052613579392, - "steps": "61763", - "seed": 0, - "activation_dim": 2304, - "dict_size": 64512, - "k": 640, - "device": "cuda:0", - "layer": 19, - "lm_name": "google/gemma-2-2b", - "wandb_name": "TopKTrainer-google/gemma-2-2b-resid_post_layer_19", - "submodule_name": "resid_post_layer_19" - }, - "buffer": { - "d_submodule": 2304, - "io": "out", - "n_ctxs": 2000, - "ctx_len": 128, - "refresh_batch_size": 24, - "out_batch_size": 2048, - "device": "cuda:0" - } -} \ No newline at end of file