Training in progress, epoch 44, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 166496880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf72785f9e61f422066d5a55b0560c4c8a69464b26be32f4db1debc616942689
|
3 |
size 166496880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 330495866
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a41339ed91a0fc5aebfb27479aad8c07d748b799c7840c36fbe1be25b37e1ab
|
3 |
size 330495866
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef8c417a427a4d61d5632cb068a6069c159668c42d4b0b7a6a15b8a00b11eecc
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fa74708df9c1325cdd60797f5ccc467462cf147fdacd71b5f8d7ef24d6392cd
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.29740211367607117,
|
3 |
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-21500",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -6137,6 +6137,151 @@
|
|
6137 |
"eval_samples_per_second": 17.724,
|
6138 |
"eval_steps_per_second": 2.304,
|
6139 |
"step": 21500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6140 |
}
|
6141 |
],
|
6142 |
"logging_steps": 30,
|
@@ -6156,7 +6301,7 @@
|
|
6156 |
"attributes": {}
|
6157 |
}
|
6158 |
},
|
6159 |
-
"total_flos": 7.
|
6160 |
"train_batch_size": 2,
|
6161 |
"trial_name": null,
|
6162 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.29740211367607117,
|
3 |
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-21500",
|
4 |
+
"epoch": 44.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 22000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
6137 |
"eval_samples_per_second": 17.724,
|
6138 |
"eval_steps_per_second": 2.304,
|
6139 |
"step": 21500
|
6140 |
+
},
|
6141 |
+
{
|
6142 |
+
"epoch": 43.02,
|
6143 |
+
"grad_norm": 44.15309143066406,
|
6144 |
+
"learning_rate": 1.8493306440731557e-06,
|
6145 |
+
"loss": 0.4896,
|
6146 |
+
"step": 21510
|
6147 |
+
},
|
6148 |
+
{
|
6149 |
+
"epoch": 43.08,
|
6150 |
+
"grad_norm": 35.48102951049805,
|
6151 |
+
"learning_rate": 1.837149190434378e-06,
|
6152 |
+
"loss": 0.5013,
|
6153 |
+
"step": 21540
|
6154 |
+
},
|
6155 |
+
{
|
6156 |
+
"epoch": 43.14,
|
6157 |
+
"grad_norm": 35.87041473388672,
|
6158 |
+
"learning_rate": 1.824998952856198e-06,
|
6159 |
+
"loss": 0.4439,
|
6160 |
+
"step": 21570
|
6161 |
+
},
|
6162 |
+
{
|
6163 |
+
"epoch": 43.2,
|
6164 |
+
"grad_norm": 26.650522232055664,
|
6165 |
+
"learning_rate": 1.8128800512565514e-06,
|
6166 |
+
"loss": 0.4186,
|
6167 |
+
"step": 21600
|
6168 |
+
},
|
6169 |
+
{
|
6170 |
+
"epoch": 43.26,
|
6171 |
+
"grad_norm": 48.30433654785156,
|
6172 |
+
"learning_rate": 1.800792605244109e-06,
|
6173 |
+
"loss": 0.4345,
|
6174 |
+
"step": 21630
|
6175 |
+
},
|
6176 |
+
{
|
6177 |
+
"epoch": 43.32,
|
6178 |
+
"grad_norm": 70.63233184814453,
|
6179 |
+
"learning_rate": 1.7887367341170781e-06,
|
6180 |
+
"loss": 0.4639,
|
6181 |
+
"step": 21660
|
6182 |
+
},
|
6183 |
+
{
|
6184 |
+
"epoch": 43.38,
|
6185 |
+
"grad_norm": 29.950109481811523,
|
6186 |
+
"learning_rate": 1.7767125568620442e-06,
|
6187 |
+
"loss": 0.3931,
|
6188 |
+
"step": 21690
|
6189 |
+
},
|
6190 |
+
{
|
6191 |
+
"epoch": 43.44,
|
6192 |
+
"grad_norm": 40.98532485961914,
|
6193 |
+
"learning_rate": 1.7647201921527802e-06,
|
6194 |
+
"loss": 0.3728,
|
6195 |
+
"step": 21720
|
6196 |
+
},
|
6197 |
+
{
|
6198 |
+
"epoch": 43.5,
|
6199 |
+
"grad_norm": 107.21430969238281,
|
6200 |
+
"learning_rate": 1.7527597583490825e-06,
|
6201 |
+
"loss": 0.3679,
|
6202 |
+
"step": 21750
|
6203 |
+
},
|
6204 |
+
{
|
6205 |
+
"epoch": 43.56,
|
6206 |
+
"grad_norm": 41.53556442260742,
|
6207 |
+
"learning_rate": 1.7408313734956074e-06,
|
6208 |
+
"loss": 0.4278,
|
6209 |
+
"step": 21780
|
6210 |
+
},
|
6211 |
+
{
|
6212 |
+
"epoch": 43.62,
|
6213 |
+
"grad_norm": 30.475116729736328,
|
6214 |
+
"learning_rate": 1.7289351553206952e-06,
|
6215 |
+
"loss": 0.4995,
|
6216 |
+
"step": 21810
|
6217 |
+
},
|
6218 |
+
{
|
6219 |
+
"epoch": 43.68,
|
6220 |
+
"grad_norm": 65.69325256347656,
|
6221 |
+
"learning_rate": 1.7170712212352187e-06,
|
6222 |
+
"loss": 0.4236,
|
6223 |
+
"step": 21840
|
6224 |
+
},
|
6225 |
+
{
|
6226 |
+
"epoch": 43.74,
|
6227 |
+
"grad_norm": 83.24858856201172,
|
6228 |
+
"learning_rate": 1.7052396883314154e-06,
|
6229 |
+
"loss": 0.4865,
|
6230 |
+
"step": 21870
|
6231 |
+
},
|
6232 |
+
{
|
6233 |
+
"epoch": 43.8,
|
6234 |
+
"grad_norm": 49.75985336303711,
|
6235 |
+
"learning_rate": 1.6934406733817417e-06,
|
6236 |
+
"loss": 0.4061,
|
6237 |
+
"step": 21900
|
6238 |
+
},
|
6239 |
+
{
|
6240 |
+
"epoch": 43.86,
|
6241 |
+
"grad_norm": 0.0012297651264816523,
|
6242 |
+
"learning_rate": 1.6816742928377072e-06,
|
6243 |
+
"loss": 0.4391,
|
6244 |
+
"step": 21930
|
6245 |
+
},
|
6246 |
+
{
|
6247 |
+
"epoch": 43.92,
|
6248 |
+
"grad_norm": 107.39283752441406,
|
6249 |
+
"learning_rate": 1.6699406628287423e-06,
|
6250 |
+
"loss": 0.4027,
|
6251 |
+
"step": 21960
|
6252 |
+
},
|
6253 |
+
{
|
6254 |
+
"epoch": 43.98,
|
6255 |
+
"grad_norm": 53.299110412597656,
|
6256 |
+
"learning_rate": 1.658239899161036e-06,
|
6257 |
+
"loss": 0.7057,
|
6258 |
+
"step": 21990
|
6259 |
+
},
|
6260 |
+
{
|
6261 |
+
"epoch": 44.0,
|
6262 |
+
"eval_loss": 0.3092344403266907,
|
6263 |
+
"eval_map": 0.7822,
|
6264 |
+
"eval_map_50": 0.9563,
|
6265 |
+
"eval_map_75": 0.9171,
|
6266 |
+
"eval_map_chicken": 0.7941,
|
6267 |
+
"eval_map_duck": 0.7348,
|
6268 |
+
"eval_map_large": 0.8688,
|
6269 |
+
"eval_map_medium": 0.7813,
|
6270 |
+
"eval_map_plant": 0.8177,
|
6271 |
+
"eval_map_small": 0.1985,
|
6272 |
+
"eval_mar_1": 0.3003,
|
6273 |
+
"eval_mar_10": 0.8165,
|
6274 |
+
"eval_mar_100": 0.821,
|
6275 |
+
"eval_mar_100_chicken": 0.8307,
|
6276 |
+
"eval_mar_100_duck": 0.766,
|
6277 |
+
"eval_mar_100_plant": 0.8663,
|
6278 |
+
"eval_mar_large": 0.9117,
|
6279 |
+
"eval_mar_medium": 0.8292,
|
6280 |
+
"eval_mar_small": 0.3663,
|
6281 |
+
"eval_runtime": 5.0773,
|
6282 |
+
"eval_samples_per_second": 19.696,
|
6283 |
+
"eval_steps_per_second": 2.56,
|
6284 |
+
"step": 22000
|
6285 |
}
|
6286 |
],
|
6287 |
"logging_steps": 30,
|
|
|
6301 |
"attributes": {}
|
6302 |
}
|
6303 |
},
|
6304 |
+
"total_flos": 7.5685084839936e+18,
|
6305 |
"train_batch_size": 2,
|
6306 |
"trial_name": null,
|
6307 |
"trial_params": null
|