Training in progress, epoch 43, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 166496880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d69a853ce44d2a4c6a1f289809b194fbf5a858060c6c022ed50371f82355daf
|
3 |
size 166496880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 330495866
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8897b9557334ef700d8217bf78bf859bb2374469468874a040168b0470cc76f
|
3 |
size 330495866
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85e4133488da63327fc9ea031838bb6fd69fb43cc377eec164eb44278dfb4b45
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:545d510515f5179456e33cb07c6feb588b2ff2a682f4164e86878f83fb45a36d
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -5999,6 +5999,144 @@
|
|
5999 |
"eval_samples_per_second": 19.708,
|
6000 |
"eval_steps_per_second": 2.562,
|
6001 |
"step": 21000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6002 |
}
|
6003 |
],
|
6004 |
"logging_steps": 30,
|
@@ -6018,7 +6156,7 @@
|
|
6018 |
"attributes": {}
|
6019 |
}
|
6020 |
},
|
6021 |
-
"total_flos": 7.
|
6022 |
"train_batch_size": 2,
|
6023 |
"trial_name": null,
|
6024 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.29740211367607117,
|
3 |
+
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-21500",
|
4 |
+
"epoch": 43.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 21500,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
5999 |
"eval_samples_per_second": 19.708,
|
6000 |
"eval_steps_per_second": 2.562,
|
6001 |
"step": 21000
|
6002 |
+
},
|
6003 |
+
{
|
6004 |
+
"epoch": 42.06,
|
6005 |
+
"grad_norm": 41.583213806152344,
|
6006 |
+
"learning_rate": 2.0483802532185286e-06,
|
6007 |
+
"loss": 0.4022,
|
6008 |
+
"step": 21030
|
6009 |
+
},
|
6010 |
+
{
|
6011 |
+
"epoch": 42.12,
|
6012 |
+
"grad_norm": 320.62518310546875,
|
6013 |
+
"learning_rate": 2.035715899194704e-06,
|
6014 |
+
"loss": 0.4408,
|
6015 |
+
"step": 21060
|
6016 |
+
},
|
6017 |
+
{
|
6018 |
+
"epoch": 42.18,
|
6019 |
+
"grad_norm": 42.51158142089844,
|
6020 |
+
"learning_rate": 2.0230808014582265e-06,
|
6021 |
+
"loss": 0.4566,
|
6022 |
+
"step": 21090
|
6023 |
+
},
|
6024 |
+
{
|
6025 |
+
"epoch": 42.24,
|
6026 |
+
"grad_norm": 0.00034786213655024767,
|
6027 |
+
"learning_rate": 2.0104750847124075e-06,
|
6028 |
+
"loss": 0.5319,
|
6029 |
+
"step": 21120
|
6030 |
+
},
|
6031 |
+
{
|
6032 |
+
"epoch": 42.3,
|
6033 |
+
"grad_norm": 93.6717529296875,
|
6034 |
+
"learning_rate": 1.9978988733705807e-06,
|
6035 |
+
"loss": 0.4083,
|
6036 |
+
"step": 21150
|
6037 |
+
},
|
6038 |
+
{
|
6039 |
+
"epoch": 42.36,
|
6040 |
+
"grad_norm": 52.52644348144531,
|
6041 |
+
"learning_rate": 1.9853522915548777e-06,
|
6042 |
+
"loss": 0.4354,
|
6043 |
+
"step": 21180
|
6044 |
+
},
|
6045 |
+
{
|
6046 |
+
"epoch": 42.42,
|
6047 |
+
"grad_norm": 36.161460876464844,
|
6048 |
+
"learning_rate": 1.9728354630949935e-06,
|
6049 |
+
"loss": 0.4591,
|
6050 |
+
"step": 21210
|
6051 |
+
},
|
6052 |
+
{
|
6053 |
+
"epoch": 42.48,
|
6054 |
+
"grad_norm": 60.393306732177734,
|
6055 |
+
"learning_rate": 1.9603485115269743e-06,
|
6056 |
+
"loss": 0.5063,
|
6057 |
+
"step": 21240
|
6058 |
+
},
|
6059 |
+
{
|
6060 |
+
"epoch": 42.54,
|
6061 |
+
"grad_norm": 223.328857421875,
|
6062 |
+
"learning_rate": 1.9478915600919877e-06,
|
6063 |
+
"loss": 0.4404,
|
6064 |
+
"step": 21270
|
6065 |
+
},
|
6066 |
+
{
|
6067 |
+
"epoch": 42.6,
|
6068 |
+
"grad_norm": 42.48649215698242,
|
6069 |
+
"learning_rate": 1.9354647317351187e-06,
|
6070 |
+
"loss": 0.4508,
|
6071 |
+
"step": 21300
|
6072 |
+
},
|
6073 |
+
{
|
6074 |
+
"epoch": 42.66,
|
6075 |
+
"grad_norm": 46.062191009521484,
|
6076 |
+
"learning_rate": 1.9230681491041425e-06,
|
6077 |
+
"loss": 0.4275,
|
6078 |
+
"step": 21330
|
6079 |
+
},
|
6080 |
+
{
|
6081 |
+
"epoch": 42.72,
|
6082 |
+
"grad_norm": 0.0008085273439064622,
|
6083 |
+
"learning_rate": 1.910701934548329e-06,
|
6084 |
+
"loss": 0.4588,
|
6085 |
+
"step": 21360
|
6086 |
+
},
|
6087 |
+
{
|
6088 |
+
"epoch": 42.78,
|
6089 |
+
"grad_norm": 44.36118698120117,
|
6090 |
+
"learning_rate": 1.8983662101172217e-06,
|
6091 |
+
"loss": 0.4563,
|
6092 |
+
"step": 21390
|
6093 |
+
},
|
6094 |
+
{
|
6095 |
+
"epoch": 42.84,
|
6096 |
+
"grad_norm": 139.61676025390625,
|
6097 |
+
"learning_rate": 1.8860610975594384e-06,
|
6098 |
+
"loss": 0.3606,
|
6099 |
+
"step": 21420
|
6100 |
+
},
|
6101 |
+
{
|
6102 |
+
"epoch": 42.9,
|
6103 |
+
"grad_norm": 37.38964080810547,
|
6104 |
+
"learning_rate": 1.873786718321476e-06,
|
6105 |
+
"loss": 0.4464,
|
6106 |
+
"step": 21450
|
6107 |
+
},
|
6108 |
+
{
|
6109 |
+
"epoch": 42.96,
|
6110 |
+
"grad_norm": 72.3614730834961,
|
6111 |
+
"learning_rate": 1.8615431935464984e-06,
|
6112 |
+
"loss": 0.4322,
|
6113 |
+
"step": 21480
|
6114 |
+
},
|
6115 |
+
{
|
6116 |
+
"epoch": 43.0,
|
6117 |
+
"eval_loss": 0.29740211367607117,
|
6118 |
+
"eval_map": 0.7974,
|
6119 |
+
"eval_map_50": 0.9595,
|
6120 |
+
"eval_map_75": 0.9169,
|
6121 |
+
"eval_map_chicken": 0.8005,
|
6122 |
+
"eval_map_duck": 0.7586,
|
6123 |
+
"eval_map_large": 0.8951,
|
6124 |
+
"eval_map_medium": 0.7927,
|
6125 |
+
"eval_map_plant": 0.8331,
|
6126 |
+
"eval_map_small": 0.1879,
|
6127 |
+
"eval_mar_1": 0.3078,
|
6128 |
+
"eval_mar_10": 0.8296,
|
6129 |
+
"eval_mar_100": 0.834,
|
6130 |
+
"eval_mar_100_chicken": 0.8369,
|
6131 |
+
"eval_mar_100_duck": 0.7876,
|
6132 |
+
"eval_mar_100_plant": 0.8775,
|
6133 |
+
"eval_mar_large": 0.931,
|
6134 |
+
"eval_mar_medium": 0.8411,
|
6135 |
+
"eval_mar_small": 0.3085,
|
6136 |
+
"eval_runtime": 5.6419,
|
6137 |
+
"eval_samples_per_second": 17.724,
|
6138 |
+
"eval_steps_per_second": 2.304,
|
6139 |
+
"step": 21500
|
6140 |
}
|
6141 |
],
|
6142 |
"logging_steps": 30,
|
|
|
6156 |
"attributes": {}
|
6157 |
}
|
6158 |
},
|
6159 |
+
"total_flos": 7.3964969275392e+18,
|
6160 |
"train_batch_size": 2,
|
6161 |
"trial_name": null,
|
6162 |
"trial_params": null
|