joe611 commited on
Commit
ea2ccfc
·
verified ·
1 Parent(s): 655cba4

Training in progress, epoch 25, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31fa9c03b236f3326abdb4196194072fbc949d245254e9cdd13231fc0ff9b3a1
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afd97dd8765dc1f4b908a232e8ef49fc36e02ae099f595ec2c827bde8c262164
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e06dc7f754a56ad9ba987b678b0f2d0c44a55075024d1d86ef926192c38101b
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf6542aefd316db02c22779974ccf65e3583e7b60d2968b36d4e35421d0930b8
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83af2978e1223e5ba59e9c2a394b19ba33d5e55d1f204b990d525feddec0613f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b45ae187a6921fbe09ae0badebce148b0a1efba8d5e43dc914da848aff37f805
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a639bc5a01160d5eb2cc6041c59f4ef1d6b5b5f12eeaae15618a65a0588847a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ea6dd56bd7b979b6581387262242dcc226985f82ef204d6b0a2805bc6677327
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.4076879024505615,
3
- "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-12000",
4
- "epoch": 24.0,
5
  "eval_steps": 500,
6
- "global_step": 12000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -3431,6 +3431,144 @@
3431
  "eval_samples_per_second": 20.107,
3432
  "eval_steps_per_second": 2.614,
3433
  "step": 12000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3434
  }
3435
  ],
3436
  "logging_steps": 30,
@@ -3450,7 +3588,7 @@
3450
  "attributes": {}
3451
  }
3452
  },
3453
- "total_flos": 4.1282773549056e+18,
3454
  "train_batch_size": 2,
3455
  "trial_name": null,
3456
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.4043169915676117,
3
+ "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-12500",
4
+ "epoch": 25.0,
5
  "eval_steps": 500,
6
+ "global_step": 12500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
3431
  "eval_samples_per_second": 20.107,
3432
  "eval_steps_per_second": 2.614,
3433
  "step": 12000
3434
+ },
3435
+ {
3436
+ "epoch": 24.06,
3437
+ "grad_norm": 52.72776412963867,
3438
+ "learning_rate": 6.530138210942505e-06,
3439
+ "loss": 0.5589,
3440
+ "step": 12030
3441
+ },
3442
+ {
3443
+ "epoch": 24.12,
3444
+ "grad_norm": 29.438343048095703,
3445
+ "learning_rate": 6.5151763481638705e-06,
3446
+ "loss": 0.5368,
3447
+ "step": 12060
3448
+ },
3449
+ {
3450
+ "epoch": 24.18,
3451
+ "grad_norm": 54.32796859741211,
3452
+ "learning_rate": 6.500199531206381e-06,
3453
+ "loss": 0.5092,
3454
+ "step": 12090
3455
+ },
3456
+ {
3457
+ "epoch": 24.24,
3458
+ "grad_norm": 69.30450439453125,
3459
+ "learning_rate": 6.485207907885175e-06,
3460
+ "loss": 0.4992,
3461
+ "step": 12120
3462
+ },
3463
+ {
3464
+ "epoch": 24.3,
3465
+ "grad_norm": 42.193634033203125,
3466
+ "learning_rate": 6.47020162616152e-06,
3467
+ "loss": 0.4091,
3468
+ "step": 12150
3469
+ },
3470
+ {
3471
+ "epoch": 24.36,
3472
+ "grad_norm": 30.120336532592773,
3473
+ "learning_rate": 6.455180834141359e-06,
3474
+ "loss": 0.471,
3475
+ "step": 12180
3476
+ },
3477
+ {
3478
+ "epoch": 24.42,
3479
+ "grad_norm": 30.613067626953125,
3480
+ "learning_rate": 6.440145680073847e-06,
3481
+ "loss": 0.5791,
3482
+ "step": 12210
3483
+ },
3484
+ {
3485
+ "epoch": 24.48,
3486
+ "grad_norm": 38.11183166503906,
3487
+ "learning_rate": 6.425096312349881e-06,
3488
+ "loss": 0.4348,
3489
+ "step": 12240
3490
+ },
3491
+ {
3492
+ "epoch": 24.54,
3493
+ "grad_norm": 46.21797180175781,
3494
+ "learning_rate": 6.410032879500647e-06,
3495
+ "loss": 0.5827,
3496
+ "step": 12270
3497
+ },
3498
+ {
3499
+ "epoch": 24.6,
3500
+ "grad_norm": 39.75735855102539,
3501
+ "learning_rate": 6.3949555301961474e-06,
3502
+ "loss": 0.4915,
3503
+ "step": 12300
3504
+ },
3505
+ {
3506
+ "epoch": 24.66,
3507
+ "grad_norm": 55.170345306396484,
3508
+ "learning_rate": 6.3798644132437304e-06,
3509
+ "loss": 0.4253,
3510
+ "step": 12330
3511
+ },
3512
+ {
3513
+ "epoch": 24.72,
3514
+ "grad_norm": 30.651851654052734,
3515
+ "learning_rate": 6.364759677586627e-06,
3516
+ "loss": 0.5383,
3517
+ "step": 12360
3518
+ },
3519
+ {
3520
+ "epoch": 24.78,
3521
+ "grad_norm": 110.5732421875,
3522
+ "learning_rate": 6.349641472302484e-06,
3523
+ "loss": 0.4379,
3524
+ "step": 12390
3525
+ },
3526
+ {
3527
+ "epoch": 24.84,
3528
+ "grad_norm": 37.65018081665039,
3529
+ "learning_rate": 6.334509946601879e-06,
3530
+ "loss": 0.4374,
3531
+ "step": 12420
3532
+ },
3533
+ {
3534
+ "epoch": 24.9,
3535
+ "grad_norm": 48.68293762207031,
3536
+ "learning_rate": 6.3193652498268656e-06,
3537
+ "loss": 0.5241,
3538
+ "step": 12450
3539
+ },
3540
+ {
3541
+ "epoch": 24.96,
3542
+ "grad_norm": 131.17486572265625,
3543
+ "learning_rate": 6.304207531449486e-06,
3544
+ "loss": 0.4849,
3545
+ "step": 12480
3546
+ },
3547
+ {
3548
+ "epoch": 25.0,
3549
+ "eval_loss": 0.4043169915676117,
3550
+ "eval_map": 0.7096,
3551
+ "eval_map_50": 0.949,
3552
+ "eval_map_75": 0.8366,
3553
+ "eval_map_chicken": 0.7483,
3554
+ "eval_map_duck": 0.596,
3555
+ "eval_map_large": 0.8412,
3556
+ "eval_map_medium": 0.7084,
3557
+ "eval_map_plant": 0.7843,
3558
+ "eval_map_small": 0.1234,
3559
+ "eval_mar_1": 0.2739,
3560
+ "eval_mar_10": 0.7538,
3561
+ "eval_mar_100": 0.7611,
3562
+ "eval_mar_100_chicken": 0.7902,
3563
+ "eval_mar_100_duck": 0.6546,
3564
+ "eval_mar_100_plant": 0.8383,
3565
+ "eval_mar_large": 0.8891,
3566
+ "eval_mar_medium": 0.7703,
3567
+ "eval_mar_small": 0.258,
3568
+ "eval_runtime": 5.051,
3569
+ "eval_samples_per_second": 19.798,
3570
+ "eval_steps_per_second": 2.574,
3571
+ "step": 12500
3572
  }
3573
  ],
3574
  "logging_steps": 30,
 
3588
  "attributes": {}
3589
  }
3590
  },
3591
+ "total_flos": 4.30028891136e+18,
3592
  "train_batch_size": 2,
3593
  "trial_name": null,
3594
  "trial_params": null