joe611 commited on
Commit
c3ad3b1
·
verified ·
1 Parent(s): 1b9cb19

Training in progress, epoch 43, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:848953d25d5a9f4f9b7b663d111bb668c6455ace866e6c0d8c2d2253dcd1b6f9
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d69a853ce44d2a4c6a1f289809b194fbf5a858060c6c022ed50371f82355daf
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fa989f187882ac7dd49a61086937b636de2892613dde482a88e0faf39426ed5
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8897b9557334ef700d8217bf78bf859bb2374469468874a040168b0470cc76f
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0d931d489a6ecaf38c7d11c5f9d1ed6d115bfa7679ca5bd4cd5a652e7c55db7
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85e4133488da63327fc9ea031838bb6fd69fb43cc377eec164eb44278dfb4b45
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91946c64eb5ced4862f474458840a35ce7039f1ebfd0264eda91b7e2f3af5260
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:545d510515f5179456e33cb07c6feb588b2ff2a682f4164e86878f83fb45a36d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.30137816071510315,
3
- "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-21000",
4
- "epoch": 42.0,
5
  "eval_steps": 500,
6
- "global_step": 21000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5999,6 +5999,144 @@
5999
  "eval_samples_per_second": 19.708,
6000
  "eval_steps_per_second": 2.562,
6001
  "step": 21000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6002
  }
6003
  ],
6004
  "logging_steps": 30,
@@ -6018,7 +6156,7 @@
6018
  "attributes": {}
6019
  }
6020
  },
6021
- "total_flos": 7.2244853710848e+18,
6022
  "train_batch_size": 2,
6023
  "trial_name": null,
6024
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.29740211367607117,
3
+ "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-21500",
4
+ "epoch": 43.0,
5
  "eval_steps": 500,
6
+ "global_step": 21500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5999
  "eval_samples_per_second": 19.708,
6000
  "eval_steps_per_second": 2.562,
6001
  "step": 21000
6002
+ },
6003
+ {
6004
+ "epoch": 42.06,
6005
+ "grad_norm": 41.583213806152344,
6006
+ "learning_rate": 2.0483802532185286e-06,
6007
+ "loss": 0.4022,
6008
+ "step": 21030
6009
+ },
6010
+ {
6011
+ "epoch": 42.12,
6012
+ "grad_norm": 320.62518310546875,
6013
+ "learning_rate": 2.035715899194704e-06,
6014
+ "loss": 0.4408,
6015
+ "step": 21060
6016
+ },
6017
+ {
6018
+ "epoch": 42.18,
6019
+ "grad_norm": 42.51158142089844,
6020
+ "learning_rate": 2.0230808014582265e-06,
6021
+ "loss": 0.4566,
6022
+ "step": 21090
6023
+ },
6024
+ {
6025
+ "epoch": 42.24,
6026
+ "grad_norm": 0.00034786213655024767,
6027
+ "learning_rate": 2.0104750847124075e-06,
6028
+ "loss": 0.5319,
6029
+ "step": 21120
6030
+ },
6031
+ {
6032
+ "epoch": 42.3,
6033
+ "grad_norm": 93.6717529296875,
6034
+ "learning_rate": 1.9978988733705807e-06,
6035
+ "loss": 0.4083,
6036
+ "step": 21150
6037
+ },
6038
+ {
6039
+ "epoch": 42.36,
6040
+ "grad_norm": 52.52644348144531,
6041
+ "learning_rate": 1.9853522915548777e-06,
6042
+ "loss": 0.4354,
6043
+ "step": 21180
6044
+ },
6045
+ {
6046
+ "epoch": 42.42,
6047
+ "grad_norm": 36.161460876464844,
6048
+ "learning_rate": 1.9728354630949935e-06,
6049
+ "loss": 0.4591,
6050
+ "step": 21210
6051
+ },
6052
+ {
6053
+ "epoch": 42.48,
6054
+ "grad_norm": 60.393306732177734,
6055
+ "learning_rate": 1.9603485115269743e-06,
6056
+ "loss": 0.5063,
6057
+ "step": 21240
6058
+ },
6059
+ {
6060
+ "epoch": 42.54,
6061
+ "grad_norm": 223.328857421875,
6062
+ "learning_rate": 1.9478915600919877e-06,
6063
+ "loss": 0.4404,
6064
+ "step": 21270
6065
+ },
6066
+ {
6067
+ "epoch": 42.6,
6068
+ "grad_norm": 42.48649215698242,
6069
+ "learning_rate": 1.9354647317351187e-06,
6070
+ "loss": 0.4508,
6071
+ "step": 21300
6072
+ },
6073
+ {
6074
+ "epoch": 42.66,
6075
+ "grad_norm": 46.062191009521484,
6076
+ "learning_rate": 1.9230681491041425e-06,
6077
+ "loss": 0.4275,
6078
+ "step": 21330
6079
+ },
6080
+ {
6081
+ "epoch": 42.72,
6082
+ "grad_norm": 0.0008085273439064622,
6083
+ "learning_rate": 1.910701934548329e-06,
6084
+ "loss": 0.4588,
6085
+ "step": 21360
6086
+ },
6087
+ {
6088
+ "epoch": 42.78,
6089
+ "grad_norm": 44.36118698120117,
6090
+ "learning_rate": 1.8983662101172217e-06,
6091
+ "loss": 0.4563,
6092
+ "step": 21390
6093
+ },
6094
+ {
6095
+ "epoch": 42.84,
6096
+ "grad_norm": 139.61676025390625,
6097
+ "learning_rate": 1.8860610975594384e-06,
6098
+ "loss": 0.3606,
6099
+ "step": 21420
6100
+ },
6101
+ {
6102
+ "epoch": 42.9,
6103
+ "grad_norm": 37.38964080810547,
6104
+ "learning_rate": 1.873786718321476e-06,
6105
+ "loss": 0.4464,
6106
+ "step": 21450
6107
+ },
6108
+ {
6109
+ "epoch": 42.96,
6110
+ "grad_norm": 72.3614730834961,
6111
+ "learning_rate": 1.8615431935464984e-06,
6112
+ "loss": 0.4322,
6113
+ "step": 21480
6114
+ },
6115
+ {
6116
+ "epoch": 43.0,
6117
+ "eval_loss": 0.29740211367607117,
6118
+ "eval_map": 0.7974,
6119
+ "eval_map_50": 0.9595,
6120
+ "eval_map_75": 0.9169,
6121
+ "eval_map_chicken": 0.8005,
6122
+ "eval_map_duck": 0.7586,
6123
+ "eval_map_large": 0.8951,
6124
+ "eval_map_medium": 0.7927,
6125
+ "eval_map_plant": 0.8331,
6126
+ "eval_map_small": 0.1879,
6127
+ "eval_mar_1": 0.3078,
6128
+ "eval_mar_10": 0.8296,
6129
+ "eval_mar_100": 0.834,
6130
+ "eval_mar_100_chicken": 0.8369,
6131
+ "eval_mar_100_duck": 0.7876,
6132
+ "eval_mar_100_plant": 0.8775,
6133
+ "eval_mar_large": 0.931,
6134
+ "eval_mar_medium": 0.8411,
6135
+ "eval_mar_small": 0.3085,
6136
+ "eval_runtime": 5.6419,
6137
+ "eval_samples_per_second": 17.724,
6138
+ "eval_steps_per_second": 2.304,
6139
+ "step": 21500
6140
  }
6141
  ],
6142
  "logging_steps": 30,
 
6156
  "attributes": {}
6157
  }
6158
  },
6159
+ "total_flos": 7.3964969275392e+18,
6160
  "train_batch_size": 2,
6161
  "trial_name": null,
6162
  "trial_params": null