rootxhacker commited on
Commit
b7d96d9
·
verified ·
1 Parent(s): 890fef1

Training in progress, step 27301, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ecb2f2e99a3f55ce283ec3c73dc04b2a38b8d596c5eb8a739f6b0463f816d0e
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c0c310c1ea72db9327b79c3262d5c740e995fdf0b4ee984a5e16a1808195ffd
3
  size 36730224
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4aa7532d5b46ff1991d1c3ddb490b4cebca7a510adb0c584bc416f8e750a93e4
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18e6a3fff60354b408c8d516a28100919c40cc962e313e3c5944958f8dce11df
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7cb9cecde71619f5455094db9dbc10b01ced14b7fff166fcfd1f46df6e480f1
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a29b39a8e376f23acf3c1b4114f67a384379a770783936ae950c5b920178bb90
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38e8022c7f3002679e6fa3f97f4fe89fb5c796e6e8d168c42ccf78f18e8bd32d
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:119728a071df48b2f95f13bda28fdcc42605f68fc14083a4d008966987fd7a1b
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84d9c773d9d655234bd445b24c5fab29b1818f6d34a0b08096443007d2a42d37
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f622dd98ef6fc2bcd7320e2559be8d58ca57d1000667a66610f8a68cd0ffa59
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 24500,
3
  "best_metric": 1.4431298971176147,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints/checkpoint-24500",
5
- "epoch": 2.076763325898008,
6
  "eval_steps": 250,
7
- "global_step": 27000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4652,6 +4652,56 @@
4652
  "eval_samples_per_second": 55.107,
4653
  "eval_steps_per_second": 13.777,
4654
  "step": 27000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4655
  }
4656
  ],
4657
  "logging_steps": 50,
@@ -4666,7 +4716,7 @@
4666
  "should_evaluate": false,
4667
  "should_log": false,
4668
  "should_save": true,
4669
- "should_training_stop": false
4670
  },
4671
  "attributes": {}
4672
  }
 
2
  "best_global_step": 24500,
3
  "best_metric": 1.4431298971176147,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints/checkpoint-24500",
5
+ "epoch": 2.09991539112376,
6
  "eval_steps": 250,
7
+ "global_step": 27301,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4652
  "eval_samples_per_second": 55.107,
4653
  "eval_steps_per_second": 13.777,
4654
  "step": 27000
4655
+ },
4656
+ {
4657
+ "epoch": 2.0806091839089302,
4658
+ "grad_norm": 0.9924139380455017,
4659
+ "learning_rate": 1.3587735745009373e-06,
4660
+ "loss": 1.5088,
4661
+ "step": 27050
4662
+ },
4663
+ {
4664
+ "epoch": 2.084455041919852,
4665
+ "grad_norm": 1.1177709102630615,
4666
+ "learning_rate": 1.1014300944818204e-06,
4667
+ "loss": 1.4285,
4668
+ "step": 27100
4669
+ },
4670
+ {
4671
+ "epoch": 2.0883008999307746,
4672
+ "grad_norm": 1.7112759351730347,
4673
+ "learning_rate": 8.440866144627034e-07,
4674
+ "loss": 1.433,
4675
+ "step": 27150
4676
+ },
4677
+ {
4678
+ "epoch": 2.0921467579416966,
4679
+ "grad_norm": 1.9338856935501099,
4680
+ "learning_rate": 5.867431344435866e-07,
4681
+ "loss": 1.4008,
4682
+ "step": 27200
4683
+ },
4684
+ {
4685
+ "epoch": 2.095992615952619,
4686
+ "grad_norm": 3.0200393199920654,
4687
+ "learning_rate": 3.2939965442446964e-07,
4688
+ "loss": 1.4285,
4689
+ "step": 27250
4690
+ },
4691
+ {
4692
+ "epoch": 2.095992615952619,
4693
+ "eval_loss": 1.4686814546585083,
4694
+ "eval_runtime": 18.028,
4695
+ "eval_samples_per_second": 55.469,
4696
+ "eval_steps_per_second": 13.867,
4697
+ "step": 27250
4698
+ },
4699
+ {
4700
+ "epoch": 2.0998384739635414,
4701
+ "grad_norm": 1.5137439966201782,
4702
+ "learning_rate": 7.205617440535274e-08,
4703
+ "loss": 1.4596,
4704
+ "step": 27300
4705
  }
4706
  ],
4707
  "logging_steps": 50,
 
4716
  "should_evaluate": false,
4717
  "should_log": false,
4718
  "should_save": true,
4719
+ "should_training_stop": true
4720
  },
4721
  "attributes": {}
4722
  }