prxy5605 committed on
Commit
b64c9ac
·
verified ·
1 Parent(s): 1ebc9c2

Training in progress, epoch 1, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b2187cfea95a2eca680241463ddf253050b5d1c67d3f6926c4c7461e2017e6b
3
  size 125918320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e275e42a6e1a9d58cee44c2ad4d640cdf4c9a19deda114a48cace1ba0d46c984
3
  size 125918320
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b11230822a821b7c8912e91766e9cf86ee2e3eaed9c397b82b4547c8d6d21bf1
3
  size 64684244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a24831531cd867bb57b3034524a71f4862c189ab56900454001f822fd0baa92c
3
  size 64684244
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39d6ba09f3ca3721d72b9f77c49ba758bdc2025a005905ac6b40e79eb7b4d2ed
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b149951a969917452b67be40996b6fadd1beb1de150bbcc21cd57e242cfb0b5d
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:937b90285b79cb43fd1a74e2715c85320817d948429e0cf325617783fd5b98c7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e89df09ab5e0094d5655fa2536a552489bcab945628e8953beb9fd485709b6b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9971563981042654,
5
  "eval_steps": 66,
6
- "global_step": 263,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -403,6 +403,14 @@
403
  "learning_rate": 7.208147179291192e-08,
404
  "loss": 1.0496,
405
  "step": 260
 
 
 
 
 
 
 
 
406
  }
407
  ],
408
  "logging_steps": 5,
@@ -417,12 +425,12 @@
417
  "should_evaluate": false,
418
  "should_log": false,
419
  "should_save": true,
420
- "should_training_stop": false
421
  },
422
  "attributes": {}
423
  }
424
  },
425
- "total_flos": 1.623917388229509e+17,
426
  "train_batch_size": 2,
427
  "trial_name": null,
428
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0028436018957345,
5
  "eval_steps": 66,
6
+ "global_step": 264,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
403
  "learning_rate": 7.208147179291192e-08,
404
  "loss": 1.0496,
405
  "step": 260
406
+ },
407
+ {
408
+ "epoch": 1.0028436018957345,
409
+ "eval_loss": 1.1479114294052124,
410
+ "eval_runtime": 15.1375,
411
+ "eval_samples_per_second": 7.333,
412
+ "eval_steps_per_second": 3.699,
413
+ "step": 264
414
  }
415
  ],
416
  "logging_steps": 5,
 
425
  "should_evaluate": false,
426
  "should_log": false,
427
  "should_save": true,
428
+ "should_training_stop": true
429
  },
430
  "attributes": {}
431
  }
432
  },
433
+ "total_flos": 1.631756088414044e+17,
434
  "train_batch_size": 2,
435
  "trial_name": null,
436
  "trial_params": null