Upload folder using huggingface_hub
Browse files
- checkpoints/torso[0].res_final_0.pt +3 -0
- checkpoints/torso[0].res_final_1024.pt +3 -0
- checkpoints/torso[0].res_final_1536.pt +3 -0
- checkpoints/torso[0].res_final_2048.pt +3 -0
- checkpoints/torso[0].res_final_512.pt +3 -0
- checkpoints/torso[1].attn_0.pt +3 -0
- checkpoints/torso[1].attn_1024.pt +3 -0
- checkpoints/torso[1].attn_1536.pt +3 -0
- checkpoints/torso[1].attn_2048.pt +3 -0
- checkpoints/torso[1].attn_512.pt +3 -0
- checkpoints/torso[1].res_final_0.pt +3 -0
- checkpoints/torso[1].res_final_1024.pt +3 -0
- checkpoints/torso[1].res_final_1536.pt +3 -0
- checkpoints/torso[1].res_final_2048.pt +3 -0
- checkpoints/torso[1].res_final_512.pt +3 -0
- checkpoints/torso[1].res_mlp_0.pt +3 -0
- checkpoints/torso[1].res_mlp_1024.pt +3 -0
- checkpoints/torso[1].res_mlp_1536.pt +3 -0
- checkpoints/torso[1].res_mlp_2048.pt +3 -0
- checkpoints/torso[1].res_mlp_512.pt +3 -0
- trainer_0/config.json +26 -0
- trainer_0/torso[0].res_final.pt +3 -0
- trainer_0/torso[1].attn.pt +3 -0
- trainer_0/torso[1].res_final.pt +3 -0
- trainer_0/torso[1].res_mlp.pt +3 -0
checkpoints/torso[0].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97c6e916cbcd13b1865aa13704d9d6b6bc63ea69b284fd56b0b1eb2c23936be2
|
3 |
+
size 37778616
|
checkpoints/torso[0].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec086462f868d296edf189191c8fe118770157821389c943a030507b6f8c7295
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b772774cd1e23ef5b0f62a76263db99cc044e8cf9b326931e75c2ad044e1b987
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:683d329b83ffb27e2c599a54c785bf182bb2bfe74b5535a104a2a3269cb43fc1
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:384c07bd31152a34edf753459a30cefdf1f3573369b887e6e0128517223f4b85
|
3 |
+
size 37778696
|
checkpoints/torso[1].attn_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f917464c3ce5df53bb10f1ccd084edd49f0ed66ebacea0d15a776cf90815e83c
|
3 |
+
size 37778576
|
checkpoints/torso[1].attn_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a1f4ca84f3ee8247f085d47cdc2d4363da0da03d83c604a6e0f6852eed33190
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca000910eceaddfe6ecfd3cedf6aa27901ffb8500a49db3a859a303f13bdfc14
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9b0b77165b46b6341eead7cf61b54bc07cd62183566f6fda8c68c104059d603
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63640dcf06836591e5b0be1c5cee2da051a5bde5d1ff65c8e2565dbcfbad47e1
|
3 |
+
size 37778592
|
checkpoints/torso[1].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5e834572edda79e57e9136fca9e4569c34517d91dd21ffc17a3158157fa98e
|
3 |
+
size 37778616
|
checkpoints/torso[1].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:383834b0d1da65c90a8aead0ecf56666cf7d21bd4f96ee6dcf0bb3ee6f70aa70
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5c131c6d22ed8ddfb7ceb58896a878f6c6947b10494da7644fa8871a4e25e86
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:191b2d42dcf079193dc2161613108c574dc76a460e7b6fa30bca2062df1f6a25
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0c2d734dd3a90b3ea9aa1d78b0bf88836accab8b1785f702ef83c1aee6751d5
|
3 |
+
size 37778696
|
checkpoints/torso[1].res_mlp_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb903e0f743da72bee32af184e6a99805d72ef53124c0944ea5114a91a9c67a
|
3 |
+
size 37778600
|
checkpoints/torso[1].res_mlp_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23a699998dc2ff883164751a3a0ef308c5a526dd16f2e9e78bf3f4ecdad49481
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfd5803564935812b4d5c78541d01b1ab6e1ac110ac93e28fe3abff6296a032b
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5ae00f29283b3b5c7f2f72a95e56a72ff36cb5da17934b28428aed81554dedd
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c720e9945f41176489ecaedda9afd758030a3b0bd5273ebfbc4a8f14a0d3cbd5
|
3 |
+
size 37778616
|
trainer_0/config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"trainer": {
|
3 |
+
"trainer_class": "TrainerTopK",
|
4 |
+
"dict_class": "AutoEncoderTopK",
|
5 |
+
"lr": 0.00032659863237109043,
|
6 |
+
"steps": 30000,
|
7 |
+
"seed": null,
|
8 |
+
"activation_dim": 768,
|
9 |
+
"dict_size": 6144,
|
10 |
+
"k": 30,
|
11 |
+
"device": "cuda",
|
12 |
+
"layer": 1,
|
13 |
+
"lm_name": "TinyModel_2L_3E",
|
14 |
+
"wandb_name": "AutoEncoderTopK",
|
15 |
+
"submodule_name": null
|
16 |
+
},
|
17 |
+
"buffer": {
|
18 |
+
"d_submodule": 768,
|
19 |
+
"io": "out",
|
20 |
+
"n_ctxs": 128,
|
21 |
+
"ctx_len": 256,
|
22 |
+
"refresh_batch_size": 512,
|
23 |
+
"out_batch_size": 1024,
|
24 |
+
"device": "cuda"
|
25 |
+
}
|
26 |
+
}
|
trainer_0/torso[0].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5695fe6c5f3e26621deff15d32179f7bacbb823862d5e62c355af102564db92c
|
3 |
+
size 37778600
|
trainer_0/torso[1].attn.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3b94d352ba0f34153c651c503740503334a479b8a309c31b644e6e404797d46
|
3 |
+
size 37778560
|
trainer_0/torso[1].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e3609c1d3142afa2e27e1abef0832a1f99bd6b5bdf1b502c0c602b18487ade3
|
3 |
+
size 37778600
|
trainer_0/torso[1].res_mlp.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d575f60814a547f07b6944087da6f62a43444e122ec143e3a19f0e9e9fa36fd0
|
3 |
+
size 37778584
|