Upload T5ForConditionalGeneration
Browse files
- config.json +2 -2
- generation_config.json +6 -0
- model-00001-of-00003.safetensors +1 -1
- model-00002-of-00003.safetensors +1 -1
- model-00003-of-00003.safetensors +2 -2
- model.safetensors.index.json +2 -1
config.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "./checkpoints/iconic-breeze-483/checkpoint-
|
3 |
"architectures": [
|
4 |
-
"
|
5 |
],
|
6 |
"classifier_dropout": 0.0,
|
7 |
"d_ff": 5120,
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "./checkpoints/iconic-breeze-483/checkpoint-1900",
|
3 |
"architectures": [
|
4 |
+
"T5ForConditionalGeneration"
|
5 |
],
|
6 |
"classifier_dropout": 0.0,
|
7 |
"d_ff": 5120,
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"decoder_start_token_id": 0,
|
3 |
+
"eos_token_id": 1,
|
4 |
+
"pad_token_id": 0,
|
5 |
+
"transformers_version": "4.36.2"
|
6 |
+
}
|
model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4994813208
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b98fd73be92c1dd23e2ed1dfe1f2615d4c84e1022730776093fa5796d5e60cd
|
3 |
size 4994813208
|
model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4974952864
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67804f1f3549e493e1682948682dd7149364eb5d619b95232b02c3841b096328
|
3 |
size 4974952864
|
model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:041a13d31cd0f728a786cdcb1e34c34504de3a6b585c351987759ee71e273141
|
3 |
+
size 1429331352
|
model.safetensors.index.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
-
"total_size":
|
4 |
},
|
5 |
"weight_map": {
|
6 |
"decoder.block.0.layer.0.SelfAttention.k.weight": "model-00001-of-00003.safetensors",
|
@@ -559,6 +559,7 @@
|
|
559 |
"encoder.block.9.layer.1.DenseReluDense.wo.weight": "model-00001-of-00003.safetensors",
|
560 |
"encoder.block.9.layer.1.layer_norm.weight": "model-00001-of-00003.safetensors",
|
561 |
"encoder.final_layer_norm.weight": "model-00001-of-00003.safetensors",
|
|
|
562 |
"shared.weight": "model-00001-of-00003.safetensors"
|
563 |
}
|
564 |
}
|
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
+
"total_size": 11399028736
|
4 |
},
|
5 |
"weight_map": {
|
6 |
"decoder.block.0.layer.0.SelfAttention.k.weight": "model-00001-of-00003.safetensors",
|
|
|
559 |
"encoder.block.9.layer.1.DenseReluDense.wo.weight": "model-00001-of-00003.safetensors",
|
560 |
"encoder.block.9.layer.1.layer_norm.weight": "model-00001-of-00003.safetensors",
|
561 |
"encoder.final_layer_norm.weight": "model-00001-of-00003.safetensors",
|
562 |
+
"lm_head.weight": "model-00003-of-00003.safetensors",
|
563 |
"shared.weight": "model-00001-of-00003.safetensors"
|
564 |
}
|
565 |
}
|