Spaces:
Runtime error
Runtime error
Add tinystories model cache files
Browse files- cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/act_count_ft_tkns.pkl +3 -0
- cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/cb_acts.pkl +3 -0
- cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/info.txt +10 -0
- cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/metrics.npy +3 -0
- cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/act_count_ft_tkns.pkl +3 -0
- cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/cb_acts.pkl +3 -0
- cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/info.txt +10 -0
- cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/metrics.npy +3 -0
- cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/act_count_ft_tkns.pkl +3 -0
- cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/cb_acts.pkl +3 -0
- cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/demo_codes.txt +9 -0
- cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/info.txt +10 -0
- cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/metrics.npy +3 -0
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/act_count_ft_tkns.pkl +3 -0
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/cb_acts.pkl +3 -0
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/demo_codes.txt +12 -0
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/info.txt +10 -0
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/metrics.npy +3 -0
cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/act_count_ft_tkns.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a8780a33abdec2f60358bed0fd21a8a5610f35c3e3b0759f517b7bdde11ebe4
|
3 |
+
size 400172
|
cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/cb_acts.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15ab7ae8de8dcd8559b6858a8559c722e1c2887b063e371355dbde1a5d362ad5
|
3 |
+
size 819200181
|
cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/info.txt
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
num_codes: 50000
|
2 |
+
cb_at: mlp
|
3 |
+
ccb: False
|
4 |
+
n_layers: 1
|
5 |
+
n_heads: 16
|
6 |
+
model_name: roneneldan/TinyStories-1Layer-21M
|
7 |
+
pretrained_path: /shared/outputs/2023-08-17/03-53-15/output_main/
|
8 |
+
seed: 42
|
9 |
+
max_samples: 2000
|
10 |
+
dataset_name: roneneldan/TinyStories
|
cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/metrics.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8131533bfd013b6ce186d936cb63e697c598037c97add794ab0933bb89adf690
|
3 |
+
size 619
|
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/act_count_ft_tkns.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3761ef12e28333f43574b945a544fbc0d2e58e9171f8c818a234c1c0cc05503
|
3 |
+
size 400172
|
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/cb_acts.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f980fd5b9410f146d8c96c10d6782b0d2d091b3557ec204cc5deb7666ad29247
|
3 |
+
size 819200181
|
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/info.txt
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
num_codes: 50000
|
2 |
+
cb_at: mlp
|
3 |
+
ccb: False
|
4 |
+
n_layers: 1
|
5 |
+
n_heads: 16
|
6 |
+
model_name: roneneldan/TinyStories-1Layer-21M
|
7 |
+
pretrained_path: /shared/outputs/2023-08-17/03-53-15/output_main/checkpoint-10000/
|
8 |
+
seed: 42
|
9 |
+
max_samples: 2000
|
10 |
+
dataset_name: roneneldan/TinyStories
|
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/metrics.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:950f175d9e284e6efbfe7a23d2d17477a337d04005d61fbf389e683c4537219e
|
3 |
+
size 619
|
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/act_count_ft_tkns.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e758972a97ebdbe4ef6bffb70239519df798fc9c3dea334c0701fb8001463c3
|
3 |
+
size 3201565
|
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/cb_acts.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c6510084cfa3824b07dafed7ab4af4751ba3155fcf53417475a4ce6791e0d40
|
3 |
+
size 1048577327
|
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/demo_codes.txt
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
# Catch/Grab/Pick:
|
3 |
+
layer: 0, head: 0, code: 1, num_acts: 234
|
4 |
+
|
5 |
+
# scared / fear:
|
6 |
+
layer: 0, head: 0, code: 3, num_acts: 428
|
7 |
+
|
8 |
+
# Dialogue that starts with "You are/must/can...":
|
9 |
+
layer: 0, head: 0, code: 6, num_acts: 654
|
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/info.txt
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
num_codes: 25000
|
2 |
+
cb_at: attn_preproj
|
3 |
+
ccb: True
|
4 |
+
n_layers: 1
|
5 |
+
n_heads: 16
|
6 |
+
model_name: roneneldan/TinyStories-1Layer-21M
|
7 |
+
pretrained_path: /shared/outputs/2023-08-17/03-43-18/output_main/
|
8 |
+
seed: 42
|
9 |
+
max_samples: 2000
|
10 |
+
dataset_name: roneneldan/TinyStories
|
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/metrics.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5a804661a5ce3e58e7a52455cff44d412e7a93904ec4bacb2bc6d08c41ad801
|
3 |
+
size 619
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/act_count_ft_tkns.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5454a081fbaf5abca451fc9e913e0a239d20e4fa4ddbe889330b73780a152ee
|
3 |
+
size 3201565
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/cb_acts.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8ce533d002762ea010334c8308cce352cb78aecdd035d5a4be5a20629dd0e0f
|
3 |
+
size 1048577327
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/demo_codes.txt
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
# fear and worry:
|
3 |
+
layer: 0, head: 0, code: 3, num_acts: 238
|
4 |
+
|
5 |
+
# where people / things have been:
|
6 |
+
layer: 0, head: 0, code: 4, num_acts: 13
|
7 |
+
|
8 |
+
# describing newly introduced things:
|
9 |
+
layer: 0, head: 0, code: 5, num_acts: 114
|
10 |
+
|
11 |
+
# dialogue that starts with "You are/must/can…":
|
12 |
+
layer: 0, head: 0, code: 6, num_acts: 556
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/info.txt
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
num_codes: 25000
|
2 |
+
cb_at: attn_preproj
|
3 |
+
ccb: True
|
4 |
+
n_layers: 1
|
5 |
+
n_heads: 16
|
6 |
+
model_name: roneneldan/TinyStories-1Layer-21M
|
7 |
+
pretrained_path: /shared/outputs/2023-08-17/03-43-18/output_main/
|
8 |
+
seed: 42
|
9 |
+
max_samples: 2000
|
10 |
+
dataset_name: roneneldan/TinyStories
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/metrics.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06b515fcc353399ce82bff99ac0a9882480482d40b772cf6b7f7750bca32a7f1
|
3 |
+
size 619
|