joe611 committed on
Commit
dcd85d9
·
verified ·
1 Parent(s): 2096a9f

Training in progress, epoch 3, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91f65e969be4028fe272c5483c861732ab6037b3ce2126b309ae32a493ba3d05
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:196cc2cfcc2664c4fd5cf36c41954ce899b20038eb4dc555ce085b5683692307
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94bf5a4b75c7e86d1548a14506e57038d254b2ba030b41984e3d46327faaaab7
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33f735862ccde6d0b31db8e86029731e0868fe7eade6541461c4ecdf8a55753b
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cff47de40d69968bf56457151c7d483f89f49db23f02a8d0ea32914d1d258248
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33f5213c99792362a6ad6f5e9bebafef268fa11b8180f752f261508437c870dc
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4033ac437c9bdc023a8e8010339474a4e6dc76e6f5e0758831867a9a3f523e9
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0568bedf04967b808836c597b9b41e2761cceefa383ed9c5db4174e2423ab9f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.1410857439041138,
3
  "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-1000",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -290,6 +290,151 @@
290
  "eval_samples_per_second": 20.183,
291
  "eval_steps_per_second": 2.624,
292
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
293
  }
294
  ],
295
  "logging_steps": 30,
@@ -309,7 +454,7 @@
309
  "attributes": {}
310
  }
311
  },
312
- "total_flos": 3.440231129088e+17,
313
  "train_batch_size": 2,
314
  "trial_name": null,
315
  "trial_params": null
 
1
  {
2
  "best_metric": 1.1410857439041138,
3
  "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-1000",
4
+ "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 1500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
290
  "eval_samples_per_second": 20.183,
291
  "eval_steps_per_second": 2.624,
292
  "step": 1000
293
+ },
294
+ {
295
+ "epoch": 2.04,
296
+ "grad_norm": 69.85189056396484,
297
+ "learning_rate": 9.971503951984996e-06,
298
+ "loss": 1.1616,
299
+ "step": 1020
300
+ },
301
+ {
302
+ "epoch": 2.1,
303
+ "grad_norm": 37.134403228759766,
304
+ "learning_rate": 9.9698047772759e-06,
305
+ "loss": 1.0393,
306
+ "step": 1050
307
+ },
308
+ {
309
+ "epoch": 2.16,
310
+ "grad_norm": 52.74504852294922,
311
+ "learning_rate": 9.968056552600043e-06,
312
+ "loss": 1.1147,
313
+ "step": 1080
314
+ },
315
+ {
316
+ "epoch": 2.22,
317
+ "grad_norm": 70.72219848632812,
318
+ "learning_rate": 9.966259295211698e-06,
319
+ "loss": 1.0797,
320
+ "step": 1110
321
+ },
322
+ {
323
+ "epoch": 2.2800000000000002,
324
+ "grad_norm": 104.32415771484375,
325
+ "learning_rate": 9.964413022849069e-06,
326
+ "loss": 0.9984,
327
+ "step": 1140
328
+ },
329
+ {
330
+ "epoch": 2.34,
331
+ "grad_norm": 65.52819061279297,
332
+ "learning_rate": 9.96251775373412e-06,
333
+ "loss": 1.036,
334
+ "step": 1170
335
+ },
336
+ {
337
+ "epoch": 2.4,
338
+ "grad_norm": 43.15259552001953,
339
+ "learning_rate": 9.960573506572391e-06,
340
+ "loss": 1.3154,
341
+ "step": 1200
342
+ },
343
+ {
344
+ "epoch": 2.46,
345
+ "grad_norm": 76.51600646972656,
346
+ "learning_rate": 9.958580300552816e-06,
347
+ "loss": 1.1412,
348
+ "step": 1230
349
+ },
350
+ {
351
+ "epoch": 2.52,
352
+ "grad_norm": 0.6177086234092712,
353
+ "learning_rate": 9.956538155347534e-06,
354
+ "loss": 1.2674,
355
+ "step": 1260
356
+ },
357
+ {
358
+ "epoch": 2.58,
359
+ "grad_norm": 53.222103118896484,
360
+ "learning_rate": 9.954447091111695e-06,
361
+ "loss": 1.1138,
362
+ "step": 1290
363
+ },
364
+ {
365
+ "epoch": 2.64,
366
+ "grad_norm": 94.70368194580078,
367
+ "learning_rate": 9.952307128483257e-06,
368
+ "loss": 1.0613,
369
+ "step": 1320
370
+ },
371
+ {
372
+ "epoch": 2.7,
373
+ "grad_norm": 89.58301544189453,
374
+ "learning_rate": 9.95011828858279e-06,
375
+ "loss": 1.0912,
376
+ "step": 1350
377
+ },
378
+ {
379
+ "epoch": 2.76,
380
+ "grad_norm": 43.07695388793945,
381
+ "learning_rate": 9.947880593013256e-06,
382
+ "loss": 1.1115,
383
+ "step": 1380
384
+ },
385
+ {
386
+ "epoch": 2.82,
387
+ "grad_norm": 52.474220275878906,
388
+ "learning_rate": 9.94559406385981e-06,
389
+ "loss": 0.9757,
390
+ "step": 1410
391
+ },
392
+ {
393
+ "epoch": 2.88,
394
+ "grad_norm": 46.698448181152344,
395
+ "learning_rate": 9.94325872368957e-06,
396
+ "loss": 1.1364,
397
+ "step": 1440
398
+ },
399
+ {
400
+ "epoch": 2.94,
401
+ "grad_norm": 49.13819885253906,
402
+ "learning_rate": 9.940874595551403e-06,
403
+ "loss": 0.9772,
404
+ "step": 1470
405
+ },
406
+ {
407
+ "epoch": 3.0,
408
+ "grad_norm": 101.07115173339844,
409
+ "learning_rate": 9.938441702975689e-06,
410
+ "loss": 1.06,
411
+ "step": 1500
412
+ },
413
+ {
414
+ "epoch": 3.0,
415
+ "eval_loss": 1.5299323797225952,
416
+ "eval_map": 0.1865,
417
+ "eval_map_50": 0.2571,
418
+ "eval_map_75": 0.2063,
419
+ "eval_map_chicken": 0.0,
420
+ "eval_map_duck": 0.0,
421
+ "eval_map_large": 0.6155,
422
+ "eval_map_medium": 0.1497,
423
+ "eval_map_plant": 0.5595,
424
+ "eval_map_small": 0.0172,
425
+ "eval_mar_1": 0.0695,
426
+ "eval_mar_10": 0.2154,
427
+ "eval_mar_100": 0.2187,
428
+ "eval_mar_100_chicken": 0.0,
429
+ "eval_mar_100_duck": 0.0,
430
+ "eval_mar_100_plant": 0.6562,
431
+ "eval_mar_large": 0.6971,
432
+ "eval_mar_medium": 0.199,
433
+ "eval_mar_small": 0.0583,
434
+ "eval_runtime": 4.9962,
435
+ "eval_samples_per_second": 20.015,
436
+ "eval_steps_per_second": 2.602,
437
+ "step": 1500
438
  }
439
  ],
440
  "logging_steps": 30,
 
454
  "attributes": {}
455
  }
456
  },
457
+ "total_flos": 5.160346693632e+17,
458
  "train_batch_size": 2,
459
  "trial_name": null,
460
  "trial_params": null