RodrigoSalazar-U commited on
Commit
18d6e18
·
verified ·
1 Parent(s): 249e072

Training in progress, step 3000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55fb81428939778dab08e7922db21d016e3f504c05107e029c92f5fce46fe882
3
  size 4785762744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee0f7f6efa259946627904facc17872a7c399f185f2fa3c1cfc100a6322fb601
3
  size 4785762744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a229809403e9c000da99928a1a77232623f005939cd31324d820e5637351f23b
3
  size 3497859804
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0539557cdcb1b310091e9a740e6565900f4359018a39a195ddb6d9bc8daf4959
3
  size 3497859804
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eba198d9667b25aa3e1e3ed428937b84fcb61b09b165df40f8a2db486d218cb8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd393a0ba2edec99a3162827022ce552435f0d62f37eef791559e57aae2a12ab
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.3691128148959475,
5
  "eval_steps": 500,
6
- "global_step": 2500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -182,6 +182,41 @@
182
  "learning_rate": 9.107512678178223e-05,
183
  "loss": 1.1572,
184
  "step": 2500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
185
  }
186
  ],
187
  "logging_steps": 100,
@@ -201,7 +236,7 @@
201
  "attributes": {}
202
  }
203
  },
204
- "total_flos": 1.2070042691739648e+18,
205
  "train_batch_size": 16,
206
  "trial_name": null,
207
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.642935377875137,
5
  "eval_steps": 500,
6
+ "global_step": 3000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
182
  "learning_rate": 9.107512678178223e-05,
183
  "loss": 1.1572,
184
  "step": 2500
185
+ },
186
+ {
187
+ "epoch": 1.4238773274917853,
188
+ "grad_norm": 2.1899495124816895,
189
+ "learning_rate": 8.99553475612544e-05,
190
+ "loss": 1.0975,
191
+ "step": 2600
192
+ },
193
+ {
194
+ "epoch": 1.4786418400876231,
195
+ "grad_norm": 2.541968822479248,
196
+ "learning_rate": 8.877717071624055e-05,
197
+ "loss": 1.1102,
198
+ "step": 2700
199
+ },
200
+ {
201
+ "epoch": 1.5334063526834611,
202
+ "grad_norm": 1.9248064756393433,
203
+ "learning_rate": 8.754231823724187e-05,
204
+ "loss": 1.1012,
205
+ "step": 2800
206
+ },
207
+ {
208
+ "epoch": 1.588170865279299,
209
+ "grad_norm": 2.002230644226074,
210
+ "learning_rate": 8.62525949502896e-05,
211
+ "loss": 1.0992,
212
+ "step": 2900
213
+ },
214
+ {
215
+ "epoch": 1.642935377875137,
216
+ "grad_norm": 2.2088050842285156,
217
+ "learning_rate": 8.490988587906137e-05,
218
+ "loss": 1.1102,
219
+ "step": 3000
220
  }
221
  ],
222
  "logging_steps": 100,
 
236
  "attributes": {}
237
  }
238
  },
239
+ "total_flos": 1.4496265837006356e+18,
240
  "train_batch_size": 16,
241
  "trial_name": null,
242
  "trial_params": null