joe611 committed on
Commit
0fe2df4
·
verified ·
1 Parent(s): 193cb6c

Training in progress, epoch 47, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87ad9da164f90ea744048b81b6e35a735052df0bf62c64a7beaadf896e199c1a
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d5ce355db46607a95aec28c8b78c3595e784c5a4d7b633fba4e3a9ee15eb38c
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d08a40bb963af55260213aa96db9795ec46c8ced8e1e958c67197b7a6e73bdd
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ba6ec41c0dc6f0e349a76e70dac0de7bab1ad5a9835e860fb1ac13bdcf45e24
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f82f9668f7fedf5f119dd94c496b08d68f0842eece575c8646e2c5421dad242
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ad003c0a9f67fd2fbb27db20929ec58a84ae23e961e581a1f533296d899603
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23d8e99991fb0f832a4848719eeed140cdeda876cf038df0ed1de594bd36ed59
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa3fe3dee209f5f42e53fe323f65577065b213541550cd1190559073b9095da7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.29740211367607117,
3
- "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-21500",
4
- "epoch": 46.0,
5
  "eval_steps": 500,
6
- "global_step": 23000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -6565,6 +6565,151 @@
6565
  "eval_samples_per_second": 19.89,
6566
  "eval_steps_per_second": 2.586,
6567
  "step": 23000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6568
  }
6569
  ],
6570
  "logging_steps": 30,
@@ -6584,7 +6729,7 @@
6584
  "attributes": {}
6585
  }
6586
  },
6587
- "total_flos": 7.9125315969024e+18,
6588
  "train_batch_size": 2,
6589
  "trial_name": null,
6590
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.29506856203079224,
3
+ "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-23500",
4
+ "epoch": 47.0,
5
  "eval_steps": 500,
6
+ "global_step": 23500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
6565
  "eval_samples_per_second": 19.89,
6566
  "eval_steps_per_second": 2.586,
6567
  "step": 23000
6568
+ },
6569
+ {
6570
+ "epoch": 46.02,
6571
+ "grad_norm": 82.24079132080078,
6572
+ "learning_rate": 1.2807743509648745e-06,
6573
+ "loss": 0.459,
6574
+ "step": 23010
6575
+ },
6576
+ {
6577
+ "epoch": 46.08,
6578
+ "grad_norm": 35.353336334228516,
6579
+ "learning_rate": 1.2702942728790897e-06,
6580
+ "loss": 0.4215,
6581
+ "step": 23040
6582
+ },
6583
+ {
6584
+ "epoch": 46.14,
6585
+ "grad_norm": 38.322479248046875,
6586
+ "learning_rate": 1.2598510054830888e-06,
6587
+ "loss": 0.3925,
6588
+ "step": 23070
6589
+ },
6590
+ {
6591
+ "epoch": 46.2,
6592
+ "grad_norm": 53.787445068359375,
6593
+ "learning_rate": 1.2494446518477022e-06,
6594
+ "loss": 0.349,
6595
+ "step": 23100
6596
+ },
6597
+ {
6598
+ "epoch": 46.26,
6599
+ "grad_norm": 37.92025375366211,
6600
+ "learning_rate": 1.2390753146794438e-06,
6601
+ "loss": 0.3578,
6602
+ "step": 23130
6603
+ },
6604
+ {
6605
+ "epoch": 46.32,
6606
+ "grad_norm": 68.19427490234375,
6607
+ "learning_rate": 1.2287430963194807e-06,
6608
+ "loss": 0.4342,
6609
+ "step": 23160
6610
+ },
6611
+ {
6612
+ "epoch": 46.38,
6613
+ "grad_norm": 108.89007568359375,
6614
+ "learning_rate": 1.218448098742641e-06,
6615
+ "loss": 0.4607,
6616
+ "step": 23190
6617
+ },
6618
+ {
6619
+ "epoch": 46.44,
6620
+ "grad_norm": 83.83390808105469,
6621
+ "learning_rate": 1.2081904235563908e-06,
6622
+ "loss": 0.4169,
6623
+ "step": 23220
6624
+ },
6625
+ {
6626
+ "epoch": 46.5,
6627
+ "grad_norm": 46.47811508178711,
6628
+ "learning_rate": 1.1979701719998454e-06,
6629
+ "loss": 0.3965,
6630
+ "step": 23250
6631
+ },
6632
+ {
6633
+ "epoch": 46.56,
6634
+ "grad_norm": 83.35205841064453,
6635
+ "learning_rate": 1.18778744494276e-06,
6636
+ "loss": 0.685,
6637
+ "step": 23280
6638
+ },
6639
+ {
6640
+ "epoch": 46.62,
6641
+ "grad_norm": 61.895530700683594,
6642
+ "learning_rate": 1.1776423428845423e-06,
6643
+ "loss": 0.3723,
6644
+ "step": 23310
6645
+ },
6646
+ {
6647
+ "epoch": 46.68,
6648
+ "grad_norm": 68.6615982055664,
6649
+ "learning_rate": 1.1675349659532514e-06,
6650
+ "loss": 0.4277,
6651
+ "step": 23340
6652
+ },
6653
+ {
6654
+ "epoch": 46.74,
6655
+ "grad_norm": 34.00867462158203,
6656
+ "learning_rate": 1.1574654139046171e-06,
6657
+ "loss": 0.4321,
6658
+ "step": 23370
6659
+ },
6660
+ {
6661
+ "epoch": 46.8,
6662
+ "grad_norm": 40.27052688598633,
6663
+ "learning_rate": 1.1474337861210543e-06,
6664
+ "loss": 0.3798,
6665
+ "step": 23400
6666
+ },
6667
+ {
6668
+ "epoch": 46.86,
6669
+ "grad_norm": 58.309085845947266,
6670
+ "learning_rate": 1.1374401816106778e-06,
6671
+ "loss": 0.4083,
6672
+ "step": 23430
6673
+ },
6674
+ {
6675
+ "epoch": 46.92,
6676
+ "grad_norm": 43.79540252685547,
6677
+ "learning_rate": 1.1274846990063314e-06,
6678
+ "loss": 0.3961,
6679
+ "step": 23460
6680
+ },
6681
+ {
6682
+ "epoch": 46.98,
6683
+ "grad_norm": 48.5699462890625,
6684
+ "learning_rate": 1.1175674365646067e-06,
6685
+ "loss": 0.4257,
6686
+ "step": 23490
6687
+ },
6688
+ {
6689
+ "epoch": 47.0,
6690
+ "eval_loss": 0.29506856203079224,
6691
+ "eval_map": 0.792,
6692
+ "eval_map_50": 0.9625,
6693
+ "eval_map_75": 0.9172,
6694
+ "eval_map_chicken": 0.7961,
6695
+ "eval_map_duck": 0.7572,
6696
+ "eval_map_large": 0.8802,
6697
+ "eval_map_medium": 0.7855,
6698
+ "eval_map_plant": 0.8226,
6699
+ "eval_map_small": 0.2075,
6700
+ "eval_mar_1": 0.3067,
6701
+ "eval_mar_10": 0.8262,
6702
+ "eval_mar_100": 0.8309,
6703
+ "eval_mar_100_chicken": 0.8338,
6704
+ "eval_mar_100_duck": 0.7907,
6705
+ "eval_mar_100_plant": 0.8683,
6706
+ "eval_mar_large": 0.9197,
6707
+ "eval_mar_medium": 0.836,
6708
+ "eval_mar_small": 0.3468,
6709
+ "eval_runtime": 5.0742,
6710
+ "eval_samples_per_second": 19.708,
6711
+ "eval_steps_per_second": 2.562,
6712
+ "step": 23500
6713
  }
6714
  ],
6715
  "logging_steps": 30,
 
6729
  "attributes": {}
6730
  }
6731
  },
6732
+ "total_flos": 8.0845431533568e+18,
6733
  "train_batch_size": 2,
6734
  "trial_name": null,
6735
  "trial_params": null