ElDestructo committed on
Commit
ed9f3d8
·
verified ·
1 Parent(s): 4668de1

End of training

Browse files
README.md CHANGED
@@ -32,13 +32,13 @@ More information needed
32
  ### Training hyperparameters
33
 
34
  The following hyperparameters were used during training:
35
- - learning_rate: 0.0005
36
  - train_batch_size: 8
37
  - eval_batch_size: 8
38
  - seed: 42
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
- - num_epochs: 10
42
 
43
  ### Training results
44
 
@@ -46,7 +46,7 @@ The following hyperparameters were used during training:
46
 
47
  ### Framework versions
48
 
49
- - Transformers 4.35.2
50
  - Pytorch 2.1.0+cu121
51
- - Datasets 2.17.0
52
- - Tokenizers 0.15.1
 
32
  ### Training hyperparameters
33
 
34
  The following hyperparameters were used during training:
35
+ - learning_rate: 0.001
36
  - train_batch_size: 8
37
  - eval_batch_size: 8
38
  - seed: 42
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
+ - num_epochs: 5
42
 
43
  ### Training results
44
 
 
46
 
47
  ### Framework versions
48
 
49
+ - Transformers 4.37.2
50
  - Pytorch 2.1.0+cu121
51
+ - Datasets 2.17.1
52
+ - Tokenizers 0.15.2
config.json CHANGED
@@ -56,7 +56,7 @@
56
  },
57
  "tie_word_embeddings": false,
58
  "torch_dtype": "float32",
59
- "transformers_version": "4.35.2",
60
  "use_cache": true,
61
  "vocab_size": 32128
62
  }
 
56
  },
57
  "tie_word_embeddings": false,
58
  "torch_dtype": "float32",
59
+ "transformers_version": "4.37.2",
60
  "use_cache": true,
61
  "vocab_size": 32128
62
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "decoder_start_token_id": 0,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.35.2"
7
  }
 
3
  "decoder_start_token_id": 0,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.37.2"
7
  }
logs/events.out.tfevents.1709191609.ff1fe9468526.163.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e156d5748ad274f7361c5b30ff2672b9ca8b7fd26556a9a4d30a82e544ec4ea
3
+ size 6463
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7986a098d3918ddf468a2e09f20d35666582f40c27dbc6090e4cd6c777aa7d2
3
  size 990345064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e385e0f0427487600e7962d5d4c1ddd0739c5c005aa0f2fa997bc64c9c7b62d
3
  size 990345064
special_tokens_map.json CHANGED
@@ -101,7 +101,25 @@
101
  "<extra_id_98>",
102
  "<extra_id_99>"
103
  ],
104
- "eos_token": "</s>",
105
- "pad_token": "<pad>",
106
- "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
107
  }
 
101
  "<extra_id_98>",
102
  "<extra_id_99>"
103
  ],
104
+ "eos_token": {
105
+ "content": "</s>",
106
+ "lstrip": false,
107
+ "normalized": false,
108
+ "rstrip": false,
109
+ "single_word": false
110
+ },
111
+ "pad_token": {
112
+ "content": "<pad>",
113
+ "lstrip": false,
114
+ "normalized": false,
115
+ "rstrip": false,
116
+ "single_word": false
117
+ },
118
+ "unk_token": {
119
+ "content": "<unk>",
120
+ "lstrip": false,
121
+ "normalized": false,
122
+ "rstrip": false,
123
+ "single_word": false
124
+ }
125
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8610b9e67d2f1b12f843b2b355dd712731be3c0e1d3d9b2d2f25d13e6103e4ec
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:902c20a2f7ccd7a7ff4b2420ce563b149346c9413563a318635f94f5e64a85bf
3
+ size 4856