RoyJoy committed on
Commit
29cd41b
·
verified ·
1 Parent(s): 69f509a

Training in progress, step 77, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65b19418aef8a7cd6b5e699fc18e768f4d6ade9623bd0d5ce166c2d6d37355fd
3
  size 159967880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f168ff95e21d7e001bd1a3b1c57099edf617adefb0c1f7ec23bbb05717a2cb7d
3
  size 159967880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25f1aacb1fb33c14dfab10c45142209ca75e483b5214e07e7eb72da8bfcc0935
3
  size 320194002
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ef97e873fef8428d5ee45258a46de7b905c21f526cba43111d625f862ecfb7d
3
  size 320194002
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22deae5baca73acdf1bdd6e465712b37190f83ff08b421ce09036b19ad30759d
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0c6ced4bf2df8499dc2d96058780757c73d89a1bccdc6734025259075700e12
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5792623e62c69eb6d06441cf884e7d8e99d996c1745ea35dc4e4377c5a48dc2
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67bd5523eb2f6525efd0012a7616311251148ea6642802ae5209bd53c6895710
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:becbc0b7a9b1e331e23f7a70974c3f85981af0327a464ead257baec11a3461c4
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e896da01a6c9857fb0ecb9a5c5461d55445ae811dff82321390080b9f89d0092
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02a7b59d54862a0ca175393f2a7f6ae8c2a3eabcb876d78099157512c18e1fa1
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e44d86ae4695cd217f4cbe149c2822a38bad3d2db57b9d0bc7a48c5f181d9914
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3576cca3b6a084e5b9dbc713d787dac1e4381b121fdf3f476ee9adbb805713a7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24b79c0dbdbaf1db6f5e9f86b4075e23cb507805053cd78cf5bfb81ecd493496
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.9411764705882355,
5
  "eval_steps": 7,
6
- "global_step": 75,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -620,6 +620,28 @@
620
  "learning_rate": 2.1970089890509527e-07,
621
  "loss": 0.3324,
622
  "step": 75
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
623
  }
624
  ],
625
  "logging_steps": 1,
@@ -634,12 +656,12 @@
634
  "should_evaluate": false,
635
  "should_log": false,
636
  "should_save": true,
637
- "should_training_stop": false
638
  },
639
  "attributes": {}
640
  }
641
  },
642
- "total_flos": 2.0956683733408154e+17,
643
  "train_batch_size": 8,
644
  "trial_name": null,
645
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.019607843137255,
5
  "eval_steps": 7,
6
+ "global_step": 77,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
620
  "learning_rate": 2.1970089890509527e-07,
621
  "loss": 0.3324,
622
  "step": 75
623
+ },
624
+ {
625
+ "epoch": 2.980392156862745,
626
+ "grad_norm": 0.11286412179470062,
627
+ "learning_rate": 5.4955425714431353e-08,
628
+ "loss": 0.4175,
629
+ "step": 76
630
+ },
631
+ {
632
+ "epoch": 3.019607843137255,
633
+ "grad_norm": 0.16945837438106537,
634
+ "learning_rate": 0.0,
635
+ "loss": 0.5248,
636
+ "step": 77
637
+ },
638
+ {
639
+ "epoch": 3.019607843137255,
640
+ "eval_loss": 0.41082337498664856,
641
+ "eval_runtime": 1.7311,
642
+ "eval_samples_per_second": 49.679,
643
+ "eval_steps_per_second": 1.733,
644
+ "step": 77
645
  }
646
  ],
647
  "logging_steps": 1,
 
656
  "should_evaluate": false,
657
  "should_log": false,
658
  "should_save": true,
659
+ "should_training_stop": true
660
  },
661
  "attributes": {}
662
  }
663
  },
664
+ "total_flos": 2.1485559026915738e+17,
665
  "train_batch_size": 8,
666
  "trial_name": null,
667
  "trial_params": null