rootxhacker commited on
Commit
2fbae45
·
verified ·
1 Parent(s): 3721712

Training in progress, step 38500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a045cd1651964484e35a7ee4cc80f394400bcf32d399ca366f907f0dafb8b29
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d8e43e89b9bebeb74f5a3f59777b202fc9109955aeb97f2af35e0e442d7a452
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47093e48c8dcb6ad57ae3eda9ce7141b8c756fad2f39a70827cbbb9ed49f5649
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fc4122df013355a6969e434d41cc8fcea9f612e4d30ef5a56450eacb41efce6
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b60bdca21a24c4c9f76b11b903c37c4127fc1f54a299af327f2fe260c58ff720
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e190ed0010bdd235ac8bd29945114b8053051431b822dc222d819209c07d8d07
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0df6fc486b7517363afca4fd7698726ecbf63a16d3ce84e06ce60f5376cd9b7e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbb02a8ec0b72b513f298ee44dab19beae5aff0d3cdf5658defb30f6a23c5a12
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97243af249b903bf91950a8fcb37e9bd58551a34f032c66a6b68e32bc4197313
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ccae9e6b2d4eb2fcfe967592fa19a2d659f2463aeb2c7a929d0ba46b4b319dc
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:541cb6dea9c80e2359e5134078f161ec83a5de3af8e29b3e9b6b880e5dd9058f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74b6ef3f8e20f0529905c960a3004917dd68d119006b5c8315cb84a5724c015e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 38000,
3
  "best_metric": 0.98431396484375,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-38000",
5
- "epoch": 2.9228520883008997,
6
  "eval_steps": 250,
7
- "global_step": 38000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6544,6 +6544,92 @@
6544
  "eval_samples_per_second": 57.482,
6545
  "eval_steps_per_second": 14.371,
6546
  "step": 38000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6547
  }
6548
  ],
6549
  "logging_steps": 50,
 
2
  "best_global_step": 38000,
3
  "best_metric": 0.98431396484375,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-38000",
5
+ "epoch": 2.961310668410122,
6
  "eval_steps": 250,
7
+ "global_step": 38500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6544
  "eval_samples_per_second": 57.482,
6545
  "eval_steps_per_second": 14.371,
6546
  "step": 38000
6547
+ },
6548
+ {
6549
+ "epoch": 2.926697946311822,
6550
+ "grad_norm": 0.9615415930747986,
6551
+ "learning_rate": 5.038568423239748e-06,
6552
+ "loss": 0.9715,
6553
+ "step": 38050
6554
+ },
6555
+ {
6556
+ "epoch": 2.9305438043227445,
6557
+ "grad_norm": 0.5959100127220154,
6558
+ "learning_rate": 4.778848401423266e-06,
6559
+ "loss": 0.936,
6560
+ "step": 38100
6561
+ },
6562
+ {
6563
+ "epoch": 2.9343896623336665,
6564
+ "grad_norm": 1.0181951522827148,
6565
+ "learning_rate": 4.519128379606784e-06,
6566
+ "loss": 0.969,
6567
+ "step": 38150
6568
+ },
6569
+ {
6570
+ "epoch": 2.938235520344589,
6571
+ "grad_norm": 0.8716458082199097,
6572
+ "learning_rate": 4.259408357790302e-06,
6573
+ "loss": 1.002,
6574
+ "step": 38200
6575
+ },
6576
+ {
6577
+ "epoch": 2.9420813783555113,
6578
+ "grad_norm": 1.6100435256958008,
6579
+ "learning_rate": 3.99968833597382e-06,
6580
+ "loss": 0.9425,
6581
+ "step": 38250
6582
+ },
6583
+ {
6584
+ "epoch": 2.9420813783555113,
6585
+ "eval_loss": 0.9931854009628296,
6586
+ "eval_runtime": 17.3406,
6587
+ "eval_samples_per_second": 57.668,
6588
+ "eval_steps_per_second": 14.417,
6589
+ "step": 38250
6590
+ },
6591
+ {
6592
+ "epoch": 2.9459272363664333,
6593
+ "grad_norm": 1.1552485227584839,
6594
+ "learning_rate": 3.7399683141573383e-06,
6595
+ "loss": 1.0424,
6596
+ "step": 38300
6597
+ },
6598
+ {
6599
+ "epoch": 2.9497730943773557,
6600
+ "grad_norm": 1.441148042678833,
6601
+ "learning_rate": 3.480248292340857e-06,
6602
+ "loss": 1.0688,
6603
+ "step": 38350
6604
+ },
6605
+ {
6606
+ "epoch": 2.953618952388278,
6607
+ "grad_norm": 0.8127447366714478,
6608
+ "learning_rate": 3.220528270524375e-06,
6609
+ "loss": 0.9497,
6610
+ "step": 38400
6611
+ },
6612
+ {
6613
+ "epoch": 2.9574648103992,
6614
+ "grad_norm": 0.9566346406936646,
6615
+ "learning_rate": 2.9608082487078933e-06,
6616
+ "loss": 0.9628,
6617
+ "step": 38450
6618
+ },
6619
+ {
6620
+ "epoch": 2.961310668410122,
6621
+ "grad_norm": 0.7955614924430847,
6622
+ "learning_rate": 2.7010882268914113e-06,
6623
+ "loss": 1.016,
6624
+ "step": 38500
6625
+ },
6626
+ {
6627
+ "epoch": 2.961310668410122,
6628
+ "eval_loss": 0.9919273257255554,
6629
+ "eval_runtime": 17.3829,
6630
+ "eval_samples_per_second": 57.528,
6631
+ "eval_steps_per_second": 14.382,
6632
+ "step": 38500
6633
  }
6634
  ],
6635
  "logging_steps": 50,