Upload folder using huggingface_hub
Browse files- checkpoints/torso[0].res_final_0.pt +3 -0
- checkpoints/torso[0].res_final_1024.pt +3 -0
- checkpoints/torso[0].res_final_1536.pt +3 -0
- checkpoints/torso[0].res_final_2048.pt +3 -0
- checkpoints/torso[0].res_final_512.pt +3 -0
- checkpoints/torso[1].attn_0.pt +3 -0
- checkpoints/torso[1].attn_1024.pt +3 -0
- checkpoints/torso[1].attn_1536.pt +3 -0
- checkpoints/torso[1].attn_2048.pt +3 -0
- checkpoints/torso[1].attn_512.pt +3 -0
- checkpoints/torso[1].res_final_0.pt +3 -0
- checkpoints/torso[1].res_final_1024.pt +3 -0
- checkpoints/torso[1].res_final_1536.pt +3 -0
- checkpoints/torso[1].res_final_2048.pt +3 -0
- checkpoints/torso[1].res_final_512.pt +3 -0
- checkpoints/torso[1].res_mlp_0.pt +3 -0
- checkpoints/torso[1].res_mlp_1024.pt +3 -0
- checkpoints/torso[1].res_mlp_1536.pt +3 -0
- checkpoints/torso[1].res_mlp_2048.pt +3 -0
- checkpoints/torso[1].res_mlp_512.pt +3 -0
- trainer_0/config.json +26 -0
- trainer_0/torso[0].res_final.pt +3 -0
- trainer_0/torso[1].attn.pt +3 -0
- trainer_0/torso[1].res_final.pt +3 -0
- trainer_0/torso[1].res_mlp.pt +3 -0
checkpoints/torso[0].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97c6e916cbcd13b1865aa13704d9d6b6bc63ea69b284fd56b0b1eb2c23936be2
|
3 |
+
size 37778616
|
checkpoints/torso[0].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9d0247b7e3ebaf1664ae27b61a8204ebde95fb36a888ccb5535244a53b25066
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4592bcf8afff4836aa3cad9a88e25f3436ed61f1dabed6675d67abbb327d61b7
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a10eb10457b084e292e0e19a2a3501008ed892747106360a038dd7fd03e6a9b5
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec2c83a42520587a7c0412205ac5eff7d485eb8ed1a4a43e8c9a71918ae69805
|
3 |
+
size 37778696
|
checkpoints/torso[1].attn_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f917464c3ce5df53bb10f1ccd084edd49f0ed66ebacea0d15a776cf90815e83c
|
3 |
+
size 37778576
|
checkpoints/torso[1].attn_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ad6a5eed481385f437530b5ff856a8b1748af79bfd338013797f85832f506e8
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f18ab12c4ac461662528167c02a0171c20903dc4537572bc079a6f93f0464da1
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa6caf8dc4853f101ca9d605bee4d24d14973f6a947d94065810e187c275a91a
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a31ca39cd5a6e422b1714f26275934b345b47d6c6596ddd5480c62820a94e8a
|
3 |
+
size 37778592
|
checkpoints/torso[1].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5e834572edda79e57e9136fca9e4569c34517d91dd21ffc17a3158157fa98e
|
3 |
+
size 37778616
|
checkpoints/torso[1].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee39edcf9ad8af00b894eeb035304062a082f97c1ae720b1e42920ce1ef591c0
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2d157181eb6518d466afb27c6488f9c3b6bf464311f814f875a305cb18e6bd7
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db608634b9f1722fdf97bcaa7dd73b16bead13c0131c4a92c3d37ef00354f0f6
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a0bb79de3718a3860aecb4db4fe3fc8286e242c790adc4b688ae83636d8e8df
|
3 |
+
size 37778696
|
checkpoints/torso[1].res_mlp_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb903e0f743da72bee32af184e6a99805d72ef53124c0944ea5114a91a9c67a
|
3 |
+
size 37778600
|
checkpoints/torso[1].res_mlp_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:578cd7caeddbc37bbefcebcebc081d4b3998feeddafd348541924c5f113328e7
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a966da388d9032787a086687a27934b288f7a6685735327e319a4aebe64e7538
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80a77fe41c6d3fd4c82923328335edc552a6a6d4cf9fb1605c561d69efb8e3f3
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9b58ba20988f809d4450bdfde48a90e243117079503b74c2770a265d40f9809
|
3 |
+
size 37778616
|
trainer_0/config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"trainer": {
|
3 |
+
"trainer_class": "TrainerTopK",
|
4 |
+
"dict_class": "AutoEncoderTopK",
|
5 |
+
"lr": 0.00032659863237109043,
|
6 |
+
"steps": 30000,
|
7 |
+
"seed": null,
|
8 |
+
"activation_dim": 768,
|
9 |
+
"dict_size": 6144,
|
10 |
+
"k": 30,
|
11 |
+
"device": "cuda",
|
12 |
+
"layer": 1,
|
13 |
+
"lm_name": "TinyModel_2L_3E",
|
14 |
+
"wandb_name": "AutoEncoderTopK",
|
15 |
+
"submodule_name": null
|
16 |
+
},
|
17 |
+
"buffer": {
|
18 |
+
"d_submodule": 768,
|
19 |
+
"io": "out",
|
20 |
+
"n_ctxs": 128,
|
21 |
+
"ctx_len": 256,
|
22 |
+
"refresh_batch_size": 512,
|
23 |
+
"out_batch_size": 1024,
|
24 |
+
"device": "cuda"
|
25 |
+
}
|
26 |
+
}
|
trainer_0/torso[0].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3dac001e49c3bd477e6bea8ed9a34a225ee8fc032b4689c4ecb9e266d966701
|
3 |
+
size 37778600
|
trainer_0/torso[1].attn.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e69d4a6eac3cd2602818e48f5c200ba9c6745818f7e06570b0b5cca3d7f91cc0
|
3 |
+
size 37778560
|
trainer_0/torso[1].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:146a3fab72a82087ea40b0fb0bd4cd92920e74c2184bbfc858f87f5d508a6d70
|
3 |
+
size 37778600
|
trainer_0/torso[1].res_mlp.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bc2136decd19d447fc2a992be578159b526e36f4ce81d7cdd793937ec4f9038
|
3 |
+
size 37778584
|