k4black commited on
Commit
992edb1
1 Parent(s): b722e48

Training in progress, step 4800

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7143fe76dbf46bf9442f8a1d204e06a2a81c24eeb986929fd120efb94de838a
3
  size 997351173
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ab00c9ddd34f1cf2964b1096db77b9d715fbc02bdd5c7d43b00066b8085e40d
3
  size 997351173
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9edb507618309c51118ca819a7d1a4dc21aced15d900dc58a9a3c689cecd7b17
3
  size 498665141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d45968dc773842b4524edf097410728d62c61752f13cc8b835d523befb79b605
3
  size 498665141
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43080b83229b77060a1c70537fc3b3d1446585e032227c6e29f72d1a997537c4
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed4ae02de340745a578ad716a6dcb1ee42a03a56073f856062cfc5a83e2e3b94
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5f4434ed1f1c9d80d68b0f8157be0f9ddae46dd2e0f2023b9b90a13272136f7
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02d5d506efbd8a343664b3029e84353da8bd575421aff1c64d55aebab3313dcd
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.984626969048982,
3
- "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/roberta-base-e-snli-classification-nli_explanation-base/checkpoint-2800",
4
- "epoch": 0.3727865796831314,
5
- "global_step": 3200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -134,11 +134,75 @@
134
  "eval_samples_per_second": 2203.364,
135
  "eval_steps_per_second": 34.477,
136
  "step": 3200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
137
  }
138
  ],
139
  "max_steps": 25752,
140
  "num_train_epochs": 3,
141
- "total_flos": 8479257445588608.0,
142
  "trial_name": null,
143
  "trial_params": null
144
  }
 
1
  {
2
+ "best_metric": 0.9870629938253499,
3
+ "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/roberta-base-e-snli-classification-nli_explanation-base/checkpoint-4800",
4
+ "epoch": 0.5591798695246971,
5
+ "global_step": 4800,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
134
  "eval_samples_per_second": 2203.364,
135
  "eval_steps_per_second": 34.477,
136
  "step": 3200
137
+ },
138
+ {
139
+ "epoch": 0.42,
140
+ "learning_rate": 9.054937867887508e-06,
141
+ "loss": 0.0822,
142
+ "step": 3600
143
+ },
144
+ {
145
+ "epoch": 0.42,
146
+ "eval_accuracy": 0.9861816703921967,
147
+ "eval_f1": 0.9861489775586069,
148
+ "eval_loss": 0.05556264892220497,
149
+ "eval_runtime": 4.7392,
150
+ "eval_samples_per_second": 2076.706,
151
+ "eval_steps_per_second": 32.495,
152
+ "step": 3600
153
+ },
154
+ {
155
+ "epoch": 0.47,
156
+ "learning_rate": 8.891432308698496e-06,
157
+ "loss": 0.0764,
158
+ "step": 4000
159
+ },
160
+ {
161
+ "epoch": 0.47,
162
+ "eval_accuracy": 0.9852672221093274,
163
+ "eval_f1": 0.9852285614441253,
164
+ "eval_loss": 0.05288001894950867,
165
+ "eval_runtime": 4.2997,
166
+ "eval_samples_per_second": 2288.976,
167
+ "eval_steps_per_second": 35.816,
168
+ "step": 4000
169
+ },
170
+ {
171
+ "epoch": 0.51,
172
+ "learning_rate": 8.727926749509485e-06,
173
+ "loss": 0.0782,
174
+ "step": 4400
175
+ },
176
+ {
177
+ "epoch": 0.51,
178
+ "eval_accuracy": 0.9860800650274334,
179
+ "eval_f1": 0.9860421413180931,
180
+ "eval_loss": 0.05745375156402588,
181
+ "eval_runtime": 4.289,
182
+ "eval_samples_per_second": 2294.686,
183
+ "eval_steps_per_second": 35.905,
184
+ "step": 4400
185
+ },
186
+ {
187
+ "epoch": 0.56,
188
+ "learning_rate": 8.564421190320473e-06,
189
+ "loss": 0.0722,
190
+ "step": 4800
191
+ },
192
+ {
193
+ "epoch": 0.56,
194
+ "eval_accuracy": 0.9870961186750661,
195
+ "eval_f1": 0.9870629938253499,
196
+ "eval_loss": 0.053428150713443756,
197
+ "eval_runtime": 4.4266,
198
+ "eval_samples_per_second": 2223.361,
199
+ "eval_steps_per_second": 34.789,
200
+ "step": 4800
201
  }
202
  ],
203
  "max_steps": 25752,
204
  "num_train_epochs": 3,
205
+ "total_flos": 1.2774452433289344e+16,
206
  "trial_name": null,
207
  "trial_params": null
208
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9edb507618309c51118ca819a7d1a4dc21aced15d900dc58a9a3c689cecd7b17
3
  size 498665141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d45968dc773842b4524edf097410728d62c61752f13cc8b835d523befb79b605
3
  size 498665141