Training in progress, epoch 47, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 166496880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d5ce355db46607a95aec28c8b78c3595e784c5a4d7b633fba4e3a9ee15eb38c
|
3 |
size 166496880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 330495866
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ba6ec41c0dc6f0e349a76e70dac0de7bab1ad5a9835e860fb1ac13bdcf45e24
|
3 |
size 330495866
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02ad003c0a9f67fd2fbb27db20929ec58a84ae23e961e581a1f533296d899603
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa3fe3dee209f5f42e53fe323f65577065b213541550cd1190559073b9095da7
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -6565,6 +6565,151 @@
|
|
6565 |
"eval_samples_per_second": 19.89,
|
6566 |
"eval_steps_per_second": 2.586,
|
6567 |
"step": 23000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6568 |
}
|
6569 |
],
|
6570 |
"logging_steps": 30,
|
@@ -6584,7 +6729,7 @@
|
|
6584 |
"attributes": {}
|
6585 |
}
|
6586 |
},
|
6587 |
-
"total_flos":
|
6588 |
"train_batch_size": 2,
|
6589 |
"trial_name": null,
|
6590 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.29506856203079224,
|
3 |
+
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-23500",
|
4 |
+
"epoch": 47.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 23500,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
6565 |
"eval_samples_per_second": 19.89,
|
6566 |
"eval_steps_per_second": 2.586,
|
6567 |
"step": 23000
|
6568 |
+
},
|
6569 |
+
{
|
6570 |
+
"epoch": 46.02,
|
6571 |
+
"grad_norm": 82.24079132080078,
|
6572 |
+
"learning_rate": 1.2807743509648745e-06,
|
6573 |
+
"loss": 0.459,
|
6574 |
+
"step": 23010
|
6575 |
+
},
|
6576 |
+
{
|
6577 |
+
"epoch": 46.08,
|
6578 |
+
"grad_norm": 35.353336334228516,
|
6579 |
+
"learning_rate": 1.2702942728790897e-06,
|
6580 |
+
"loss": 0.4215,
|
6581 |
+
"step": 23040
|
6582 |
+
},
|
6583 |
+
{
|
6584 |
+
"epoch": 46.14,
|
6585 |
+
"grad_norm": 38.322479248046875,
|
6586 |
+
"learning_rate": 1.2598510054830888e-06,
|
6587 |
+
"loss": 0.3925,
|
6588 |
+
"step": 23070
|
6589 |
+
},
|
6590 |
+
{
|
6591 |
+
"epoch": 46.2,
|
6592 |
+
"grad_norm": 53.787445068359375,
|
6593 |
+
"learning_rate": 1.2494446518477022e-06,
|
6594 |
+
"loss": 0.349,
|
6595 |
+
"step": 23100
|
6596 |
+
},
|
6597 |
+
{
|
6598 |
+
"epoch": 46.26,
|
6599 |
+
"grad_norm": 37.92025375366211,
|
6600 |
+
"learning_rate": 1.2390753146794438e-06,
|
6601 |
+
"loss": 0.3578,
|
6602 |
+
"step": 23130
|
6603 |
+
},
|
6604 |
+
{
|
6605 |
+
"epoch": 46.32,
|
6606 |
+
"grad_norm": 68.19427490234375,
|
6607 |
+
"learning_rate": 1.2287430963194807e-06,
|
6608 |
+
"loss": 0.4342,
|
6609 |
+
"step": 23160
|
6610 |
+
},
|
6611 |
+
{
|
6612 |
+
"epoch": 46.38,
|
6613 |
+
"grad_norm": 108.89007568359375,
|
6614 |
+
"learning_rate": 1.218448098742641e-06,
|
6615 |
+
"loss": 0.4607,
|
6616 |
+
"step": 23190
|
6617 |
+
},
|
6618 |
+
{
|
6619 |
+
"epoch": 46.44,
|
6620 |
+
"grad_norm": 83.83390808105469,
|
6621 |
+
"learning_rate": 1.2081904235563908e-06,
|
6622 |
+
"loss": 0.4169,
|
6623 |
+
"step": 23220
|
6624 |
+
},
|
6625 |
+
{
|
6626 |
+
"epoch": 46.5,
|
6627 |
+
"grad_norm": 46.47811508178711,
|
6628 |
+
"learning_rate": 1.1979701719998454e-06,
|
6629 |
+
"loss": 0.3965,
|
6630 |
+
"step": 23250
|
6631 |
+
},
|
6632 |
+
{
|
6633 |
+
"epoch": 46.56,
|
6634 |
+
"grad_norm": 83.35205841064453,
|
6635 |
+
"learning_rate": 1.18778744494276e-06,
|
6636 |
+
"loss": 0.685,
|
6637 |
+
"step": 23280
|
6638 |
+
},
|
6639 |
+
{
|
6640 |
+
"epoch": 46.62,
|
6641 |
+
"grad_norm": 61.895530700683594,
|
6642 |
+
"learning_rate": 1.1776423428845423e-06,
|
6643 |
+
"loss": 0.3723,
|
6644 |
+
"step": 23310
|
6645 |
+
},
|
6646 |
+
{
|
6647 |
+
"epoch": 46.68,
|
6648 |
+
"grad_norm": 68.6615982055664,
|
6649 |
+
"learning_rate": 1.1675349659532514e-06,
|
6650 |
+
"loss": 0.4277,
|
6651 |
+
"step": 23340
|
6652 |
+
},
|
6653 |
+
{
|
6654 |
+
"epoch": 46.74,
|
6655 |
+
"grad_norm": 34.00867462158203,
|
6656 |
+
"learning_rate": 1.1574654139046171e-06,
|
6657 |
+
"loss": 0.4321,
|
6658 |
+
"step": 23370
|
6659 |
+
},
|
6660 |
+
{
|
6661 |
+
"epoch": 46.8,
|
6662 |
+
"grad_norm": 40.27052688598633,
|
6663 |
+
"learning_rate": 1.1474337861210543e-06,
|
6664 |
+
"loss": 0.3798,
|
6665 |
+
"step": 23400
|
6666 |
+
},
|
6667 |
+
{
|
6668 |
+
"epoch": 46.86,
|
6669 |
+
"grad_norm": 58.309085845947266,
|
6670 |
+
"learning_rate": 1.1374401816106778e-06,
|
6671 |
+
"loss": 0.4083,
|
6672 |
+
"step": 23430
|
6673 |
+
},
|
6674 |
+
{
|
6675 |
+
"epoch": 46.92,
|
6676 |
+
"grad_norm": 43.79540252685547,
|
6677 |
+
"learning_rate": 1.1274846990063314e-06,
|
6678 |
+
"loss": 0.3961,
|
6679 |
+
"step": 23460
|
6680 |
+
},
|
6681 |
+
{
|
6682 |
+
"epoch": 46.98,
|
6683 |
+
"grad_norm": 48.5699462890625,
|
6684 |
+
"learning_rate": 1.1175674365646067e-06,
|
6685 |
+
"loss": 0.4257,
|
6686 |
+
"step": 23490
|
6687 |
+
},
|
6688 |
+
{
|
6689 |
+
"epoch": 47.0,
|
6690 |
+
"eval_loss": 0.29506856203079224,
|
6691 |
+
"eval_map": 0.792,
|
6692 |
+
"eval_map_50": 0.9625,
|
6693 |
+
"eval_map_75": 0.9172,
|
6694 |
+
"eval_map_chicken": 0.7961,
|
6695 |
+
"eval_map_duck": 0.7572,
|
6696 |
+
"eval_map_large": 0.8802,
|
6697 |
+
"eval_map_medium": 0.7855,
|
6698 |
+
"eval_map_plant": 0.8226,
|
6699 |
+
"eval_map_small": 0.2075,
|
6700 |
+
"eval_mar_1": 0.3067,
|
6701 |
+
"eval_mar_10": 0.8262,
|
6702 |
+
"eval_mar_100": 0.8309,
|
6703 |
+
"eval_mar_100_chicken": 0.8338,
|
6704 |
+
"eval_mar_100_duck": 0.7907,
|
6705 |
+
"eval_mar_100_plant": 0.8683,
|
6706 |
+
"eval_mar_large": 0.9197,
|
6707 |
+
"eval_mar_medium": 0.836,
|
6708 |
+
"eval_mar_small": 0.3468,
|
6709 |
+
"eval_runtime": 5.0742,
|
6710 |
+
"eval_samples_per_second": 19.708,
|
6711 |
+
"eval_steps_per_second": 2.562,
|
6712 |
+
"step": 23500
|
6713 |
}
|
6714 |
],
|
6715 |
"logging_steps": 30,
|
|
|
6729 |
"attributes": {}
|
6730 |
}
|
6731 |
},
|
6732 |
+
"total_flos": 8.0845431533568e+18,
|
6733 |
"train_batch_size": 2,
|
6734 |
"trial_name": null,
|
6735 |
"trial_params": null
|