Upload folder using huggingface_hub
Browse files- checkpoints/torso[0].res_final_0.pt +3 -0
- checkpoints/torso[0].res_final_1024.pt +3 -0
- checkpoints/torso[0].res_final_1536.pt +3 -0
- checkpoints/torso[0].res_final_2048.pt +3 -0
- checkpoints/torso[0].res_final_512.pt +3 -0
- checkpoints/torso[1].attn_0.pt +3 -0
- checkpoints/torso[1].attn_1024.pt +3 -0
- checkpoints/torso[1].attn_1536.pt +3 -0
- checkpoints/torso[1].attn_2048.pt +3 -0
- checkpoints/torso[1].attn_512.pt +3 -0
- checkpoints/torso[1].res_final_0.pt +3 -0
- checkpoints/torso[1].res_final_1024.pt +3 -0
- checkpoints/torso[1].res_final_1536.pt +3 -0
- checkpoints/torso[1].res_final_2048.pt +3 -0
- checkpoints/torso[1].res_final_512.pt +3 -0
- checkpoints/torso[1].res_mlp_0.pt +3 -0
- checkpoints/torso[1].res_mlp_1024.pt +3 -0
- checkpoints/torso[1].res_mlp_1536.pt +3 -0
- checkpoints/torso[1].res_mlp_2048.pt +3 -0
- checkpoints/torso[1].res_mlp_512.pt +3 -0
- trainer_0/config.json +26 -0
- trainer_0/torso[0].res_final.pt +3 -0
- trainer_0/torso[1].attn.pt +3 -0
- trainer_0/torso[1].res_final.pt +3 -0
- trainer_0/torso[1].res_mlp.pt +3 -0
checkpoints/torso[0].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97c6e916cbcd13b1865aa13704d9d6b6bc63ea69b284fd56b0b1eb2c23936be2
|
3 |
+
size 37778616
|
checkpoints/torso[0].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45fc8bccd21a4e338efef28610f6289477f93520fc9ed6dcd23804deca5d0964
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3436d65cd78e9cc4285c56c24f1c15bfd2235d8485045666f521d60f1019834
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae27a59c0f01763c90e6599cccdadae54e73a935aed535b804bfa0a8660f5fcf
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8068d9c05ac2e1ede61ba7b7f19867a8218afd97ae702ad43ba357a3f52b125e
|
3 |
+
size 37778696
|
checkpoints/torso[1].attn_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f917464c3ce5df53bb10f1ccd084edd49f0ed66ebacea0d15a776cf90815e83c
|
3 |
+
size 37778576
|
checkpoints/torso[1].attn_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:701f2ded160ac3398fc5c647563bb875bae8c87200004e4ad3cfb8591d676a84
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4252932b2577c5bfb10b1ff4daa0a91f7d57943bc2716157c5eb9c96630eb9a1
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d1d5dcb1174d0b6b14f6571de90a01be9e4d054661ccf5e274919d5690ccaee
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1389878f872db0d97abc6757c51efa373bd28c5ee9dce0de7b1d6794ff479bd1
|
3 |
+
size 37778592
|
checkpoints/torso[1].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5e834572edda79e57e9136fca9e4569c34517d91dd21ffc17a3158157fa98e
|
3 |
+
size 37778616
|
checkpoints/torso[1].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ef4377b05c3983073a3a0256cabc9ecca03081985936c1f3456f15c22d81234
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea1fff6facffc0db9013abb84dc4212dfd6a8054de6838bf485056ba24d7de82
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1f193475add51ffcfc780b764a99054f301a22103fde397a2e24afa40f6535e
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf2dd6b13c1429ad406e0f3e4b464001b9a7dbba5b715a52f5982191b872d52e
|
3 |
+
size 37778696
|
checkpoints/torso[1].res_mlp_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb903e0f743da72bee32af184e6a99805d72ef53124c0944ea5114a91a9c67a
|
3 |
+
size 37778600
|
checkpoints/torso[1].res_mlp_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e769eadb062b0d2b84fb5cf7155ca6d7877b41f52937071f9db9fb089b3d35ad
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c72bad6820637140db4b6b8a8e10849ee6b524ea28c6334443377c7d7ae22270
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f1042e6a71ae20f133836168769b9753493f7e18fc01ebdd239c08ba3e7a277
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:261bd38a319db2ee772a97f15fa99ba2eb27d26d2554bec031200d16022333a9
|
3 |
+
size 37778616
|
trainer_0/config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"trainer": {
|
3 |
+
"trainer_class": "TrainerTopK",
|
4 |
+
"dict_class": "AutoEncoderTopK",
|
5 |
+
"lr": 0.00032659863237109043,
|
6 |
+
"steps": 30000,
|
7 |
+
"seed": null,
|
8 |
+
"activation_dim": 768,
|
9 |
+
"dict_size": 6144,
|
10 |
+
"k": 30,
|
11 |
+
"device": "cuda",
|
12 |
+
"layer": 1,
|
13 |
+
"lm_name": "TinyModel_2L_3E",
|
14 |
+
"wandb_name": "AutoEncoderTopK",
|
15 |
+
"submodule_name": null
|
16 |
+
},
|
17 |
+
"buffer": {
|
18 |
+
"d_submodule": 768,
|
19 |
+
"io": "out",
|
20 |
+
"n_ctxs": 128,
|
21 |
+
"ctx_len": 256,
|
22 |
+
"refresh_batch_size": 512,
|
23 |
+
"out_batch_size": 1024,
|
24 |
+
"device": "cuda"
|
25 |
+
}
|
26 |
+
}
|
trainer_0/torso[0].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bc74e9b0734fc4f914e28b09f7f1a14b9ed8c3d1d47acaa6e7785c888b2b69c
|
3 |
+
size 37778600
|
trainer_0/torso[1].attn.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d16f762aeba8d1ee1c834df4f68d0a7bc9ae3af3dd31463adb9e6cb98761811d
|
3 |
+
size 37778560
|
trainer_0/torso[1].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c6790910cda9b1b9b2dc804a0c0461cea00ec0cd3dde59e00d7711d9c642c8f
|
3 |
+
size 37778600
|
trainer_0/torso[1].res_mlp.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc6456810e9e10dc80878b50332e932cb953308244b7d63298a3f933cbbd20ee
|
3 |
+
size 37778584
|