RodrigoSalazar-U commited on
Commit
3e1ffe4
·
verified ·
1 Parent(s): ec5a72f

Training in progress, step 6500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c69edaf91c86caf6a7a0fd42996899325e932c7927930f0bbb216780ecee6505
3
  size 4785762744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c6623b2d67d7ace83c58db6e667a1f5efaf969454228665bd2f42fa58c63130
3
  size 4785762744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:788a1d6cd203b01bb14f4804f15ed88e7a7c43e26dd6d552eee5a686613ecee8
3
  size 3497859804
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65c7c78a887b874f5d12d4183e0f20f21628e49864c34d49004e15388d95fe55
3
  size 3497859804
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95b37961c6d0193de06c3efbf48a168df2b148e000c09c167a07902751b74f66
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaedc92244071d34424437252c1cb2fe4ebf2e5cbfa092fca056c799d5a64b9c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.285870755750274,
5
  "eval_steps": 500,
6
- "global_step": 6000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -427,6 +427,41 @@
427
  "learning_rate": 3.172786461221279e-05,
428
  "loss": 0.3146,
429
  "step": 6000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
430
  }
431
  ],
432
  "logging_steps": 100,
@@ -446,7 +481,7 @@
446
  "attributes": {}
447
  }
448
  },
449
- "total_flos": 2.8822031507389317e+18,
450
  "train_batch_size": 16,
451
  "trial_name": null,
452
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.5596933187294635,
5
  "eval_steps": 500,
6
+ "global_step": 6500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
427
  "learning_rate": 3.172786461221279e-05,
428
  "loss": 0.3146,
429
  "step": 6000
430
+ },
431
+ {
432
+ "epoch": 3.340635268346112,
433
+ "grad_norm": 1.7206776142120361,
434
+ "learning_rate": 2.996222995345437e-05,
435
+ "loss": 0.3138,
436
+ "step": 6100
437
+ },
438
+ {
439
+ "epoch": 3.3953997809419496,
440
+ "grad_norm": 1.966302514076233,
441
+ "learning_rate": 2.822588194196941e-05,
442
+ "loss": 0.3059,
443
+ "step": 6200
444
+ },
445
+ {
446
+ "epoch": 3.4501642935377874,
447
+ "grad_norm": 1.6685985326766968,
448
+ "learning_rate": 2.6521358375708428e-05,
449
+ "loss": 0.3006,
450
+ "step": 6300
451
+ },
452
+ {
453
+ "epoch": 3.5049288061336252,
454
+ "grad_norm": 1.6338154077529907,
455
+ "learning_rate": 2.4851150538898028e-05,
456
+ "loss": 0.3017,
457
+ "step": 6400
458
+ },
459
+ {
460
+ "epoch": 3.5596933187294635,
461
+ "grad_norm": 1.6607939004898071,
462
+ "learning_rate": 2.321769956084937e-05,
463
+ "loss": 0.2991,
464
+ "step": 6500
465
  }
466
  ],
467
  "logging_steps": 100,
 
481
  "attributes": {}
482
  }
483
  },
484
+ "total_flos": 3.1238589889308426e+18,
485
  "train_batch_size": 16,
486
  "trial_name": null,
487
  "trial_params": null