Vlasta committed on
Commit
c1bdd7d
·
verified ·
1 Parent(s): 61305fc

Upload T5ForConditionalGeneration

Browse files
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "_name_or_path": "./checkpoints/iconic-breeze-483/checkpoint-2100",
3
  "architectures": [
4
- "T5Model"
5
  ],
6
  "classifier_dropout": 0.0,
7
  "d_ff": 5120,
 
1
  {
2
+ "_name_or_path": "./checkpoints/iconic-breeze-483/checkpoint-1900",
3
  "architectures": [
4
+ "T5ForConditionalGeneration"
5
  ],
6
  "classifier_dropout": 0.0,
7
  "d_ff": 5120,
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "decoder_start_token_id": 0,
3
+ "eos_token_id": 1,
4
+ "pad_token_id": 0,
5
+ "transformers_version": "4.36.2"
6
+ }
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5052db6de9f91446330aa22ecec910e78d4b31d1700b41c3dd205d9603068c1
3
  size 4994813208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b98fd73be92c1dd23e2ed1dfe1f2615d4c84e1022730776093fa5796d5e60cd
3
  size 4994813208
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73870d1b3fd7a31ecbcaa60859c2f62494b83dc783174080d1f28fb8f61fefe1
3
  size 4974952864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67804f1f3549e493e1682948682dd7149364eb5d619b95232b02c3841b096328
3
  size 4974952864
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:595ed459d91ef50e3fd187350015f398242051eb7a53754e0172a6e0cc754c15
3
- size 1166138680
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:041a13d31cd0f728a786cdcb1e34c34504de3a6b585c351987759ee71e273141
3
+ size 1429331352
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 11135836160
4
  },
5
  "weight_map": {
6
  "decoder.block.0.layer.0.SelfAttention.k.weight": "model-00001-of-00003.safetensors",
@@ -559,6 +559,7 @@
559
  "encoder.block.9.layer.1.DenseReluDense.wo.weight": "model-00001-of-00003.safetensors",
560
  "encoder.block.9.layer.1.layer_norm.weight": "model-00001-of-00003.safetensors",
561
  "encoder.final_layer_norm.weight": "model-00001-of-00003.safetensors",
 
562
  "shared.weight": "model-00001-of-00003.safetensors"
563
  }
564
  }
 
1
  {
2
  "metadata": {
3
+ "total_size": 11399028736
4
  },
5
  "weight_map": {
6
  "decoder.block.0.layer.0.SelfAttention.k.weight": "model-00001-of-00003.safetensors",
 
559
  "encoder.block.9.layer.1.DenseReluDense.wo.weight": "model-00001-of-00003.safetensors",
560
  "encoder.block.9.layer.1.layer_norm.weight": "model-00001-of-00003.safetensors",
561
  "encoder.final_layer_norm.weight": "model-00001-of-00003.safetensors",
562
+ "lm_head.weight": "model-00003-of-00003.safetensors",
563
  "shared.weight": "model-00001-of-00003.safetensors"
564
  }
565
  }