rolf-mozilla committed on
Commit
d90b33a
·
unverified ·
1 Parent(s): 56bb4af

upbeat-eon-195 training run, with multiple decoder layers removed to reduce model size (this config: num_layers 8, num_decoder_layers 5). Based on flan-t5-small.

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "pious-butterfly-170",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
@@ -18,9 +18,9 @@
18
  "layer_norm_epsilon": 1e-06,
19
  "model_type": "t5",
20
  "n_positions": 512,
21
- "num_decoder_layers": 3,
22
  "num_heads": 6,
23
- "num_layers": 3,
24
  "output_past": true,
25
  "pad_token_id": 0,
26
  "relative_attention_max_distance": 128,
 
1
  {
2
+ "_name_or_path": "upbeat-eon-195",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
 
18
  "layer_norm_epsilon": 1e-06,
19
  "model_type": "t5",
20
  "n_positions": 512,
21
+ "num_decoder_layers": 5,
22
  "num_heads": 6,
23
+ "num_layers": 8,
24
  "output_past": true,
25
  "pad_token_id": 0,
26
  "relative_attention_max_distance": 128,
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:568444304b19da5c4a8eb3c7282fe53e4c08c57991e5812ea19fbd846e25e9a6
3
- size 169472577
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c42c13f2c807648441e6aaaefb03e1ec7676a3f603344d4262875916c30a0c7a
3
+ size 194707491
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9fba6c06c12046fa4b9c7b680f9fc6093e1210bcaa7c345456f335d791dffb50
3
- size 169578954
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee901d6cd9fe4ca0d3c52bc311e5489234e04c8d176fa2e5fa9240fff0fe50a7
3
+ size 194867022
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe83a419e30af7f28066f20c6178956963dae41cd9da67781d03398e18bad42e
3
- size 42895009
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7d4b53b38b10d59646b9917597238dd4bb265c303294531fc1985ef633df934
3
+ size 49416454
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3aeaa9f321ebd94bf26537f423fe31a817d85d0d48378a1fe0751e18ca4adf6
3
- size 42753828
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd5531a83e650de1ab2e732a6d3050d88dd95c444d40294f451efba7f5711038
3
+ size 49199890
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40a0ee7a12e84d445f2fd76f9aa779130d77391cf257f1df27a85519c4e814f9
3
- size 164738287
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99c47d5c15aa4caff6e1fd11c6ffe0187bc95df5bc1e0259645d8999f63f6261
3
+ size 186815283
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af0ab350e4137be691706d89bb9d5dea92ee871620361481be583afdb2dcd96e
3
- size 41540983
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f766885bcf66a024047c816415b8c80b1ba1d7049f2f46f1f64133382aa75c4
3
+ size 47176839
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61c4716849d3d0fe971611531f33a1cef3e7cad9b839cf9cc90112ef6b62002f
3
- size 94183774
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b80ea5dce243671eee3df40c4fc5c1b33d2f30bf68833da654825ac9060fbc1
3
+ size 141467235
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1dffba65048f543e7598826fe6c5a86f1d10cf41b13e1e03420995e3d03cf81b
3
- size 23688378
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aebcc67f8be6efee38e1df8decb5d8f55f6da3403563f4979b146afdee396d97
3
+ size 35726832