Saving weights and logs of step 300
Browse files
.gitignore
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
__pycache__/*
|
2 |
+
*~
|
3 |
+
.idea/*
|
4 |
+
venv/*
|
5 |
+
ckpt*
|
config.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"architectures": [
|
3 |
-
"
|
4 |
],
|
5 |
"d_ff": 3072,
|
6 |
"d_kv": 64,
|
@@ -52,5 +52,5 @@
|
|
52 |
},
|
53 |
"transformers_version": "4.9.0.dev0",
|
54 |
"use_cache": true,
|
55 |
-
"vocab_size":
|
56 |
}
|
|
|
1 |
{
|
2 |
"architectures": [
|
3 |
+
"T5ForConditionalGeneration"
|
4 |
],
|
5 |
"d_ff": 3072,
|
6 |
"d_kv": 64,
|
|
|
52 |
},
|
53 |
"transformers_version": "4.9.0.dev0",
|
54 |
"use_cache": true,
|
55 |
+
"vocab_size": 32103
|
56 |
}
|
flax_model.msgpack
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6554fc39fc36959fc1ed967d23d2bd7bfbb244c2d85f72d70e8b03224adad6fd
|
3 |
+
size 891548548
|
runs/Jul09_21-28-23_t1v-n-0e7426e8-w-0/events.out.tfevents.1625866241.t1v-n-0e7426e8-w-0.417321.3.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efed27a99c31a4b3656e323ded245a663569c2d1609cf015f02374f2897a6022
|
3 |
+
size 31755
|
runs/Jul09_21-43-10_t1v-n-0e7426e8-w-0/events.out.tfevents.1625867209.t1v-n-0e7426e8-w-0.420316.3.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adb128a2e8b82dffce5c7408471ea0b58958ab99dc75b945b01bcbb35ca4b211
|
3 |
+
size 45399
|