Training in progress, epoch 24, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 166496880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31fa9c03b236f3326abdb4196194072fbc949d245254e9cdd13231fc0ff9b3a1
|
3 |
size 166496880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 330495866
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e06dc7f754a56ad9ba987b678b0f2d0c44a55075024d1d86ef926192c38101b
|
3 |
size 330495866
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83af2978e1223e5ba59e9c2a394b19ba33d5e55d1f204b990d525feddec0613f
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a639bc5a01160d5eb2cc6041c59f4ef1d6b5b5f12eeaae15618a65a0588847a
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -3286,6 +3286,151 @@
|
|
3286 |
"eval_samples_per_second": 19.71,
|
3287 |
"eval_steps_per_second": 2.562,
|
3288 |
"step": 11500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3289 |
}
|
3290 |
],
|
3291 |
"logging_steps": 30,
|
@@ -3305,7 +3450,7 @@
|
|
3305 |
"attributes": {}
|
3306 |
}
|
3307 |
},
|
3308 |
-
"total_flos":
|
3309 |
"train_batch_size": 2,
|
3310 |
"trial_name": null,
|
3311 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.4076879024505615,
|
3 |
+
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-12000",
|
4 |
+
"epoch": 24.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 12000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
3286 |
"eval_samples_per_second": 19.71,
|
3287 |
"eval_steps_per_second": 2.562,
|
3288 |
"step": 11500
|
3289 |
+
},
|
3290 |
+
{
|
3291 |
+
"epoch": 23.04,
|
3292 |
+
"grad_norm": 42.534297943115234,
|
3293 |
+
"learning_rate": 6.782059393566254e-06,
|
3294 |
+
"loss": 0.4992,
|
3295 |
+
"step": 11520
|
3296 |
+
},
|
3297 |
+
{
|
3298 |
+
"epoch": 23.1,
|
3299 |
+
"grad_norm": 0.002314250450581312,
|
3300 |
+
"learning_rate": 6.767374218896286e-06,
|
3301 |
+
"loss": 0.474,
|
3302 |
+
"step": 11550
|
3303 |
+
},
|
3304 |
+
{
|
3305 |
+
"epoch": 23.16,
|
3306 |
+
"grad_norm": 33.95319366455078,
|
3307 |
+
"learning_rate": 6.752671600956295e-06,
|
3308 |
+
"loss": 0.5098,
|
3309 |
+
"step": 11580
|
3310 |
+
},
|
3311 |
+
{
|
3312 |
+
"epoch": 23.22,
|
3313 |
+
"grad_norm": 65.58226013183594,
|
3314 |
+
"learning_rate": 6.737951684855185e-06,
|
3315 |
+
"loss": 0.6279,
|
3316 |
+
"step": 11610
|
3317 |
+
},
|
3318 |
+
{
|
3319 |
+
"epoch": 23.28,
|
3320 |
+
"grad_norm": 38.85221481323242,
|
3321 |
+
"learning_rate": 6.723214615872585e-06,
|
3322 |
+
"loss": 0.5288,
|
3323 |
+
"step": 11640
|
3324 |
+
},
|
3325 |
+
{
|
3326 |
+
"epoch": 23.34,
|
3327 |
+
"grad_norm": 31.03350067138672,
|
3328 |
+
"learning_rate": 6.708460539457418e-06,
|
3329 |
+
"loss": 0.5167,
|
3330 |
+
"step": 11670
|
3331 |
+
},
|
3332 |
+
{
|
3333 |
+
"epoch": 23.4,
|
3334 |
+
"grad_norm": 74.7662353515625,
|
3335 |
+
"learning_rate": 6.693689601226458e-06,
|
3336 |
+
"loss": 0.5782,
|
3337 |
+
"step": 11700
|
3338 |
+
},
|
3339 |
+
{
|
3340 |
+
"epoch": 23.46,
|
3341 |
+
"grad_norm": 30.249208450317383,
|
3342 |
+
"learning_rate": 6.6789019469629034e-06,
|
3343 |
+
"loss": 0.4759,
|
3344 |
+
"step": 11730
|
3345 |
+
},
|
3346 |
+
{
|
3347 |
+
"epoch": 23.52,
|
3348 |
+
"grad_norm": 32.10087966918945,
|
3349 |
+
"learning_rate": 6.664097722614934e-06,
|
3350 |
+
"loss": 0.4923,
|
3351 |
+
"step": 11760
|
3352 |
+
},
|
3353 |
+
{
|
3354 |
+
"epoch": 23.58,
|
3355 |
+
"grad_norm": 129.60997009277344,
|
3356 |
+
"learning_rate": 6.649277074294265e-06,
|
3357 |
+
"loss": 0.5149,
|
3358 |
+
"step": 11790
|
3359 |
+
},
|
3360 |
+
{
|
3361 |
+
"epoch": 23.64,
|
3362 |
+
"grad_norm": 74.41838073730469,
|
3363 |
+
"learning_rate": 6.634440148274712e-06,
|
3364 |
+
"loss": 0.5063,
|
3365 |
+
"step": 11820
|
3366 |
+
},
|
3367 |
+
{
|
3368 |
+
"epoch": 23.7,
|
3369 |
+
"grad_norm": 37.93177032470703,
|
3370 |
+
"learning_rate": 6.619587090990748e-06,
|
3371 |
+
"loss": 0.4632,
|
3372 |
+
"step": 11850
|
3373 |
+
},
|
3374 |
+
{
|
3375 |
+
"epoch": 23.76,
|
3376 |
+
"grad_norm": 40.77086639404297,
|
3377 |
+
"learning_rate": 6.604718049036047e-06,
|
3378 |
+
"loss": 0.5137,
|
3379 |
+
"step": 11880
|
3380 |
+
},
|
3381 |
+
{
|
3382 |
+
"epoch": 23.82,
|
3383 |
+
"grad_norm": 29.192161560058594,
|
3384 |
+
"learning_rate": 6.589833169162055e-06,
|
3385 |
+
"loss": 0.5527,
|
3386 |
+
"step": 11910
|
3387 |
+
},
|
3388 |
+
{
|
3389 |
+
"epoch": 23.88,
|
3390 |
+
"grad_norm": 86.26991271972656,
|
3391 |
+
"learning_rate": 6.574932598276524e-06,
|
3392 |
+
"loss": 0.4662,
|
3393 |
+
"step": 11940
|
3394 |
+
},
|
3395 |
+
{
|
3396 |
+
"epoch": 23.94,
|
3397 |
+
"grad_norm": 35.82132339477539,
|
3398 |
+
"learning_rate": 6.5600164834420754e-06,
|
3399 |
+
"loss": 0.5318,
|
3400 |
+
"step": 11970
|
3401 |
+
},
|
3402 |
+
{
|
3403 |
+
"epoch": 24.0,
|
3404 |
+
"grad_norm": 53.413780212402344,
|
3405 |
+
"learning_rate": 6.545084971874738e-06,
|
3406 |
+
"loss": 0.5184,
|
3407 |
+
"step": 12000
|
3408 |
+
},
|
3409 |
+
{
|
3410 |
+
"epoch": 24.0,
|
3411 |
+
"eval_loss": 0.4076879024505615,
|
3412 |
+
"eval_map": 0.7097,
|
3413 |
+
"eval_map_50": 0.9464,
|
3414 |
+
"eval_map_75": 0.854,
|
3415 |
+
"eval_map_chicken": 0.7126,
|
3416 |
+
"eval_map_duck": 0.6338,
|
3417 |
+
"eval_map_large": 0.8335,
|
3418 |
+
"eval_map_medium": 0.7156,
|
3419 |
+
"eval_map_plant": 0.7828,
|
3420 |
+
"eval_map_small": 0.1197,
|
3421 |
+
"eval_mar_1": 0.2741,
|
3422 |
+
"eval_mar_10": 0.757,
|
3423 |
+
"eval_mar_100": 0.7607,
|
3424 |
+
"eval_mar_100_chicken": 0.7667,
|
3425 |
+
"eval_mar_100_duck": 0.6784,
|
3426 |
+
"eval_mar_100_plant": 0.8372,
|
3427 |
+
"eval_mar_large": 0.8828,
|
3428 |
+
"eval_mar_medium": 0.7738,
|
3429 |
+
"eval_mar_small": 0.2553,
|
3430 |
+
"eval_runtime": 4.9733,
|
3431 |
+
"eval_samples_per_second": 20.107,
|
3432 |
+
"eval_steps_per_second": 2.614,
|
3433 |
+
"step": 12000
|
3434 |
}
|
3435 |
],
|
3436 |
"logging_steps": 30,
|
|
|
3450 |
"attributes": {}
|
3451 |
}
|
3452 |
},
|
3453 |
+
"total_flos": 4.1282773549056e+18,
|
3454 |
"train_batch_size": 2,
|
3455 |
"trial_name": null,
|
3456 |
"trial_params": null
|