RodrigoSalazar-U commited on
Commit
3661c69
·
verified ·
1 Parent(s): db09cd5

Training in progress, step 9000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0278328958930d3beaacbe8bed27397e998fbcabe1fca7fa0eae8eafd80ecf51
3
  size 4785762744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fa462ee315f6286d0560d178e1576f9f7bc266cda332e3573e24a9be44be436
3
  size 4785762744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e59834f34401a93fcb0300abb81ffe29f6ae8d1c35b22ab4a0642dde9c40b2e
3
  size 3497859804
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc3a6d3b8afe0402070b9a53be5a23ab45e598fb6abf993ecb0f8d70a9dec5b9
3
  size 3497859804
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4a81dafce04c7537f75efee5aacdd30a9f6039bc0738e6674b85fdce84b597c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c66a678ee8f615fe14ce6e44cecc141a68321a0815a7952fb61c3673d46702bf
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.6549835706462215,
5
  "eval_steps": 500,
6
- "global_step": 8500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -602,6 +602,41 @@
602
  "learning_rate": 1.4434228048932796e-06,
603
  "loss": 0.1657,
604
  "step": 8500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
605
  }
606
  ],
607
  "logging_steps": 100,
@@ -621,7 +656,7 @@
621
  "attributes": {}
622
  }
623
  },
624
- "total_flos": 4.086908592883286e+18,
625
  "train_batch_size": 16,
626
  "trial_name": null,
627
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.928806133625411,
5
  "eval_steps": 500,
6
+ "global_step": 9000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
602
  "learning_rate": 1.4434228048932796e-06,
603
  "loss": 0.1657,
604
  "step": 8500
605
+ },
606
+ {
607
+ "epoch": 4.709748083242059,
608
+ "grad_norm": 1.020652174949646,
609
+ "learning_rate": 1.023006467000115e-06,
610
+ "loss": 0.1708,
611
+ "step": 8600
612
+ },
613
+ {
614
+ "epoch": 4.764512595837897,
615
+ "grad_norm": 1.2859959602355957,
616
+ "learning_rate": 6.741735403739901e-07,
617
+ "loss": 0.1712,
618
+ "step": 8700
619
+ },
620
+ {
621
+ "epoch": 4.8192771084337345,
622
+ "grad_norm": 0.8666063547134399,
623
+ "learning_rate": 3.974338695163393e-07,
624
+ "loss": 0.1657,
625
+ "step": 8800
626
+ },
627
+ {
628
+ "epoch": 4.874041621029573,
629
+ "grad_norm": 0.6807364821434021,
630
+ "learning_rate": 1.9319192943152986e-07,
631
+ "loss": 0.1675,
632
+ "step": 8900
633
+ },
634
+ {
635
+ "epoch": 4.928806133625411,
636
+ "grad_norm": 1.1967036724090576,
637
+ "learning_rate": 6.174623445742155e-08,
638
+ "loss": 0.1721,
639
+ "step": 9000
640
  }
641
  ],
642
  "logging_steps": 100,
 
656
  "attributes": {}
657
  }
658
  },
659
+ "total_flos": 4.325169651624493e+18,
660
  "train_batch_size": 16,
661
  "trial_name": null,
662
  "trial_params": null