k4black commited on
Commit
b722e48
·
1 Parent(s): db662cf

Training in progress, step 3200

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c42a5366840794b0c0fb0432bbaa031a842391943e8331fed713b5cd64f82ef1
3
  size 997351173
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7143fe76dbf46bf9442f8a1d204e06a2a81c24eeb986929fd120efb94de838a
3
  size 997351173
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e6bae183954f5d437ff9de22f8b455d34e8c948c4e9f409b7fdf25253e5efed
3
  size 498665141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9edb507618309c51118ca819a7d1a4dc21aced15d900dc58a9a3c689cecd7b17
3
  size 498665141
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55354db435c68678b6f94b24e84f2902d2393e19e425a5be089c34ccf6838fe5
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43080b83229b77060a1c70537fc3b3d1446585e032227c6e29f72d1a997537c4
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9ab84b3e9a31d3636ab888c3f3b4b43181ed71041b39e64d169f508e5b3f134
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5f4434ed1f1c9d80d68b0f8157be0f9ddae46dd2e0f2023b9b90a13272136f7
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.983300542812346,
3
- "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/roberta-base-e-snli-classification-nli_explanation-base/checkpoint-2000",
4
- "epoch": 0.23299161230195714,
5
- "global_step": 2000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -86,11 +86,59 @@
86
  "eval_samples_per_second": 2304.409,
87
  "eval_steps_per_second": 36.058,
88
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
89
  }
90
  ],
91
  "max_steps": 25752,
92
  "num_train_epochs": 3,
93
- "total_flos": 5305451844244608.0,
94
  "trial_name": null,
95
  "trial_params": null
96
  }
 
1
  {
2
+ "best_metric": 0.984626969048982,
3
+ "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/roberta-base-e-snli-classification-nli_explanation-base/checkpoint-2800",
4
+ "epoch": 0.3727865796831314,
5
+ "global_step": 3200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
86
  "eval_samples_per_second": 2304.409,
87
  "eval_steps_per_second": 36.058,
88
  "step": 2000
89
+ },
90
+ {
91
+ "epoch": 0.28,
92
+ "learning_rate": 9.545454545454547e-06,
93
+ "loss": 0.0888,
94
+ "step": 2400
95
+ },
96
+ {
97
+ "epoch": 0.28,
98
+ "eval_accuracy": 0.983539930908352,
99
+ "eval_f1": 0.9834936652245868,
100
+ "eval_loss": 0.06838709861040115,
101
+ "eval_runtime": 4.2889,
102
+ "eval_samples_per_second": 2294.739,
103
+ "eval_steps_per_second": 35.906,
104
+ "step": 2400
105
+ },
106
+ {
107
+ "epoch": 0.33,
108
+ "learning_rate": 9.381948986265533e-06,
109
+ "loss": 0.0833,
110
+ "step": 2800
111
+ },
112
+ {
113
+ "epoch": 0.33,
114
+ "eval_accuracy": 0.9846575899207478,
115
+ "eval_f1": 0.984626969048982,
116
+ "eval_loss": 0.05881618708372116,
117
+ "eval_runtime": 4.3142,
118
+ "eval_samples_per_second": 2281.283,
119
+ "eval_steps_per_second": 35.696,
120
+ "step": 2800
121
+ },
122
+ {
123
+ "epoch": 0.37,
124
+ "learning_rate": 9.218443427076522e-06,
125
+ "loss": 0.0802,
126
+ "step": 3200
127
+ },
128
+ {
129
+ "epoch": 0.37,
130
+ "eval_accuracy": 0.9832351148140622,
131
+ "eval_f1": 0.9831849160413134,
132
+ "eval_loss": 0.06230289116501808,
133
+ "eval_runtime": 4.4668,
134
+ "eval_samples_per_second": 2203.364,
135
+ "eval_steps_per_second": 34.477,
136
+ "step": 3200
137
  }
138
  ],
139
  "max_steps": 25752,
140
  "num_train_epochs": 3,
141
+ "total_flos": 8479257445588608.0,
142
  "trial_name": null,
143
  "trial_params": null
144
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e6bae183954f5d437ff9de22f8b455d34e8c948c4e9f409b7fdf25253e5efed
3
  size 498665141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9edb507618309c51118ca819a7d1a4dc21aced15d900dc58a9a3c689cecd7b17
3
  size 498665141