joe611 commited on
Commit
b75c95c
·
verified ·
1 Parent(s): 81851ad

Training in progress, epoch 24, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0b155b6c159aad5d499dbbfcd000f172ecfda66b201d4940a5f789194a7ca81
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31fa9c03b236f3326abdb4196194072fbc949d245254e9cdd13231fc0ff9b3a1
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93dc21f8623c3f6028f166852f07242a27af2a9e42ec647d8950119cb47b32d3
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e06dc7f754a56ad9ba987b678b0f2d0c44a55075024d1d86ef926192c38101b
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afe5f3e38edc53d84c568132d5a1fe6617c029725cb5ed6465b95e27267304ae
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83af2978e1223e5ba59e9c2a394b19ba33d5e55d1f204b990d525feddec0613f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:685c336afeba3f61098971b07e0888920b1e8afabd8b33c977a10c5f12a34b13
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a639bc5a01160d5eb2cc6041c59f4ef1d6b5b5f12eeaae15618a65a0588847a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.41423293948173523,
3
- "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-11000",
4
- "epoch": 23.0,
5
  "eval_steps": 500,
6
- "global_step": 11500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -3286,6 +3286,151 @@
3286
  "eval_samples_per_second": 19.71,
3287
  "eval_steps_per_second": 2.562,
3288
  "step": 11500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3289
  }
3290
  ],
3291
  "logging_steps": 30,
@@ -3305,7 +3450,7 @@
3305
  "attributes": {}
3306
  }
3307
  },
3308
- "total_flos": 3.9562657984512e+18,
3309
  "train_batch_size": 2,
3310
  "trial_name": null,
3311
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.4076879024505615,
3
+ "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-12000",
4
+ "epoch": 24.0,
5
  "eval_steps": 500,
6
+ "global_step": 12000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
3286
  "eval_samples_per_second": 19.71,
3287
  "eval_steps_per_second": 2.562,
3288
  "step": 11500
3289
+ },
3290
+ {
3291
+ "epoch": 23.04,
3292
+ "grad_norm": 42.534297943115234,
3293
+ "learning_rate": 6.782059393566254e-06,
3294
+ "loss": 0.4992,
3295
+ "step": 11520
3296
+ },
3297
+ {
3298
+ "epoch": 23.1,
3299
+ "grad_norm": 0.002314250450581312,
3300
+ "learning_rate": 6.767374218896286e-06,
3301
+ "loss": 0.474,
3302
+ "step": 11550
3303
+ },
3304
+ {
3305
+ "epoch": 23.16,
3306
+ "grad_norm": 33.95319366455078,
3307
+ "learning_rate": 6.752671600956295e-06,
3308
+ "loss": 0.5098,
3309
+ "step": 11580
3310
+ },
3311
+ {
3312
+ "epoch": 23.22,
3313
+ "grad_norm": 65.58226013183594,
3314
+ "learning_rate": 6.737951684855185e-06,
3315
+ "loss": 0.6279,
3316
+ "step": 11610
3317
+ },
3318
+ {
3319
+ "epoch": 23.28,
3320
+ "grad_norm": 38.85221481323242,
3321
+ "learning_rate": 6.723214615872585e-06,
3322
+ "loss": 0.5288,
3323
+ "step": 11640
3324
+ },
3325
+ {
3326
+ "epoch": 23.34,
3327
+ "grad_norm": 31.03350067138672,
3328
+ "learning_rate": 6.708460539457418e-06,
3329
+ "loss": 0.5167,
3330
+ "step": 11670
3331
+ },
3332
+ {
3333
+ "epoch": 23.4,
3334
+ "grad_norm": 74.7662353515625,
3335
+ "learning_rate": 6.693689601226458e-06,
3336
+ "loss": 0.5782,
3337
+ "step": 11700
3338
+ },
3339
+ {
3340
+ "epoch": 23.46,
3341
+ "grad_norm": 30.249208450317383,
3342
+ "learning_rate": 6.6789019469629034e-06,
3343
+ "loss": 0.4759,
3344
+ "step": 11730
3345
+ },
3346
+ {
3347
+ "epoch": 23.52,
3348
+ "grad_norm": 32.10087966918945,
3349
+ "learning_rate": 6.664097722614934e-06,
3350
+ "loss": 0.4923,
3351
+ "step": 11760
3352
+ },
3353
+ {
3354
+ "epoch": 23.58,
3355
+ "grad_norm": 129.60997009277344,
3356
+ "learning_rate": 6.649277074294265e-06,
3357
+ "loss": 0.5149,
3358
+ "step": 11790
3359
+ },
3360
+ {
3361
+ "epoch": 23.64,
3362
+ "grad_norm": 74.41838073730469,
3363
+ "learning_rate": 6.634440148274712e-06,
3364
+ "loss": 0.5063,
3365
+ "step": 11820
3366
+ },
3367
+ {
3368
+ "epoch": 23.7,
3369
+ "grad_norm": 37.93177032470703,
3370
+ "learning_rate": 6.619587090990748e-06,
3371
+ "loss": 0.4632,
3372
+ "step": 11850
3373
+ },
3374
+ {
3375
+ "epoch": 23.76,
3376
+ "grad_norm": 40.77086639404297,
3377
+ "learning_rate": 6.604718049036047e-06,
3378
+ "loss": 0.5137,
3379
+ "step": 11880
3380
+ },
3381
+ {
3382
+ "epoch": 23.82,
3383
+ "grad_norm": 29.192161560058594,
3384
+ "learning_rate": 6.589833169162055e-06,
3385
+ "loss": 0.5527,
3386
+ "step": 11910
3387
+ },
3388
+ {
3389
+ "epoch": 23.88,
3390
+ "grad_norm": 86.26991271972656,
3391
+ "learning_rate": 6.574932598276524e-06,
3392
+ "loss": 0.4662,
3393
+ "step": 11940
3394
+ },
3395
+ {
3396
+ "epoch": 23.94,
3397
+ "grad_norm": 35.82132339477539,
3398
+ "learning_rate": 6.5600164834420754e-06,
3399
+ "loss": 0.5318,
3400
+ "step": 11970
3401
+ },
3402
+ {
3403
+ "epoch": 24.0,
3404
+ "grad_norm": 53.413780212402344,
3405
+ "learning_rate": 6.545084971874738e-06,
3406
+ "loss": 0.5184,
3407
+ "step": 12000
3408
+ },
3409
+ {
3410
+ "epoch": 24.0,
3411
+ "eval_loss": 0.4076879024505615,
3412
+ "eval_map": 0.7097,
3413
+ "eval_map_50": 0.9464,
3414
+ "eval_map_75": 0.854,
3415
+ "eval_map_chicken": 0.7126,
3416
+ "eval_map_duck": 0.6338,
3417
+ "eval_map_large": 0.8335,
3418
+ "eval_map_medium": 0.7156,
3419
+ "eval_map_plant": 0.7828,
3420
+ "eval_map_small": 0.1197,
3421
+ "eval_mar_1": 0.2741,
3422
+ "eval_mar_10": 0.757,
3423
+ "eval_mar_100": 0.7607,
3424
+ "eval_mar_100_chicken": 0.7667,
3425
+ "eval_mar_100_duck": 0.6784,
3426
+ "eval_mar_100_plant": 0.8372,
3427
+ "eval_mar_large": 0.8828,
3428
+ "eval_mar_medium": 0.7738,
3429
+ "eval_mar_small": 0.2553,
3430
+ "eval_runtime": 4.9733,
3431
+ "eval_samples_per_second": 20.107,
3432
+ "eval_steps_per_second": 2.614,
3433
+ "step": 12000
3434
  }
3435
  ],
3436
  "logging_steps": 30,
 
3450
  "attributes": {}
3451
  }
3452
  },
3453
+ "total_flos": 4.1282773549056e+18,
3454
  "train_batch_size": 2,
3455
  "trial_name": null,
3456
  "trial_params": null