Spaces:
Runtime error
Runtime error
Update models cache
Browse files
- cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/act_count_ft_tkns.pkl +0 -3
- cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/cb_acts.pkl +0 -3
- cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/info.txt +0 -10
- cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/metrics.npy +0 -3
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/act_count_ft_tkns.pkl +0 -3
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/cb_acts.pkl +0 -3
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/demo_codes.txt +0 -12
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/info.txt +0 -10
- cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/metrics.npy +0 -3
- cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/act_count_ft_tkns.pkl +0 -0
- cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/cb_acts.pkl +0 -0
- cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/demo_codes.txt +0 -0
- cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/info.txt +0 -0
- cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/metrics.npy +0 -0
- cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/act_count_ft_tkns.pkl +0 -0
- cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/cb_acts.pkl +0 -0
- cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/info.txt +0 -0
- cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/metrics.npy +0 -0
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/act_count_ft_tkns.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:b3761ef12e28333f43574b945a544fbc0d2e58e9171f8c818a234c1c0cc05503
|
3 |
-
size 400172
|
|
|
|
|
|
|
|
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/cb_acts.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:f980fd5b9410f146d8c96c10d6782b0d2d091b3557ec204cc5deb7666ad29247
|
3 |
-
size 819200181
|
|
|
|
|
|
|
|
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/info.txt
DELETED
@@ -1,10 +0,0 @@
|
|
1 |
-
num_codes: 50000
|
2 |
-
cb_at: mlp
|
3 |
-
ccb: False
|
4 |
-
n_layers: 1
|
5 |
-
n_heads: 16
|
6 |
-
model_name: roneneldan/TinyStories-1Layer-21M
|
7 |
-
pretrained_path: /shared/outputs/2023-08-17/03-53-15/output_main/checkpoint-10000/
|
8 |
-
seed: 42
|
9 |
-
max_samples: 2000
|
10 |
-
dataset_name: roneneldan/TinyStories
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/metrics.npy
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:950f175d9e284e6efbfe7a23d2d17477a337d04005d61fbf389e683c4537219e
|
3 |
-
size 619
|
|
|
|
|
|
|
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/act_count_ft_tkns.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:f5454a081fbaf5abca451fc9e913e0a239d20e4fa4ddbe889330b73780a152ee
|
3 |
-
size 3201565
|
|
|
|
|
|
|
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/cb_acts.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:a8ce533d002762ea010334c8308cce352cb78aecdd035d5a4be5a20629dd0e0f
|
3 |
-
size 1048577327
|
|
|
|
|
|
|
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/demo_codes.txt
DELETED
@@ -1,12 +0,0 @@
|
|
1 |
-
|
2 |
-
# fear and worry:
|
3 |
-
layer: 0, head: 0, code: 3, num_acts: 238
|
4 |
-
|
5 |
-
# where people / things have been:
|
6 |
-
layer: 0, head: 0, code: 4, num_acts: 13
|
7 |
-
|
8 |
-
# describing newly introduced things:
|
9 |
-
layer: 0, head: 0, code: 5, num_acts: 114
|
10 |
-
|
11 |
-
# dialogue that starts with "You are/must/can…":
|
12 |
-
layer: 0, head: 0, code: 6, num_acts: 556
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/info.txt
DELETED
@@ -1,10 +0,0 @@
|
|
1 |
-
num_codes: 25000
|
2 |
-
cb_at: attn_preproj
|
3 |
-
ccb: True
|
4 |
-
n_layers: 1
|
5 |
-
n_heads: 16
|
6 |
-
model_name: roneneldan/TinyStories-1Layer-21M
|
7 |
-
pretrained_path: /shared/outputs/2023-08-17/03-43-18/output_main/
|
8 |
-
seed: 42
|
9 |
-
max_samples: 2000
|
10 |
-
dataset_name: roneneldan/TinyStories
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/metrics.npy
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:06b515fcc353399ce82bff99ac0a9882480482d40b772cf6b7f7750bca32a7f1
|
3 |
-
size 619
|
|
|
|
|
|
|
|
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/act_count_ft_tkns.pkl
RENAMED
File without changes
|
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/cb_acts.pkl
RENAMED
File without changes
|
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/demo_codes.txt
RENAMED
File without changes
|
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/info.txt
RENAMED
File without changes
|
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/metrics.npy
RENAMED
File without changes
|
cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/act_count_ft_tkns.pkl
RENAMED
File without changes
|
cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/cb_acts.pkl
RENAMED
File without changes
|
cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/info.txt
RENAMED
File without changes
|
cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/metrics.npy
RENAMED
File without changes
|