Training in progress, step 11550, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step11550/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step11550/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step11550/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step11550/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step11550/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step11550/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step11550/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step11550/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +93 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae3dba71cea82a584554baed057ef094a4a0c81e9d6ef8aa7cd0b7236e1db1c1
|
3 |
size 29034840
|
last-checkpoint/global_step11550/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f6f8d26d4803e154978ffc0ad9329e13d748fb90c2b01949e5601aa7d3d7f75
|
3 |
+
size 43429616
|
last-checkpoint/global_step11550/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8925be9e1eb9cc71b3fd7218b01dfcd6e9a5dec3c1ac4b469a9b9269ad6a797
|
3 |
+
size 43429616
|
last-checkpoint/global_step11550/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea99df20ac5a646e735c351a7bb0859b35893fd1e67214b44a37168cb804a51f
|
3 |
+
size 43429616
|
last-checkpoint/global_step11550/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b538162e2368499119146bd683a4249328468b5519e13f930b2aa4544e18afc9
|
3 |
+
size 43429616
|
last-checkpoint/global_step11550/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a7afd712c05bdae33641390ba9250cc3896e22737dd0b6d8b186f70f51a7534
|
3 |
+
size 637299
|
last-checkpoint/global_step11550/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c71da68a4033276f1cedba39da5ccad002229c19ee1019021b5f511073c967e5
|
3 |
+
size 637171
|
last-checkpoint/global_step11550/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d9d3de3e18198eadde56b4608a4231aeb1788c377d49b7302d16bf8fb50aa09
|
3 |
+
size 637171
|
last-checkpoint/global_step11550/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f93ea92ad36b68577557993beae89aac2ee6194908244499a399fef1acc03dce
|
3 |
+
size 637171
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step11550
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78499bb2ea148823b7ab171c76eb915f9b4158c659a14c00b9e84ea5435d9cad
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99fce99abc20eefca679982890ea61d2ccdf9eee0cda977258a51a9304bf23ad
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaaee2368ce6f4ddaa847a6a36f132ea0ce34cdf12bf9b7eac5575e8743efd9
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e37b120cfd3886c6a8c324f0d433c2c4559046d72ce821cae05d8193c7218bd
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28dcc470b84c7d0033a14ee408e549a0b0e725782552f4d7cadd6cdebf0f14cf
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.04092838987708092,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
|
4 |
-
"epoch": 1.
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -20477,11 +20477,100 @@
|
|
20477 |
"eval_steps_per_second": 0.763,
|
20478 |
"num_input_tokens_seen": 76876640,
|
20479 |
"step": 11500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
20480 |
}
|
20481 |
],
|
20482 |
"logging_steps": 5,
|
20483 |
"max_steps": 16324,
|
20484 |
-
"num_input_tokens_seen":
|
20485 |
"num_train_epochs": 2,
|
20486 |
"save_steps": 50,
|
20487 |
"stateful_callbacks": {
|
@@ -20496,7 +20585,7 @@
|
|
20496 |
"attributes": {}
|
20497 |
}
|
20498 |
},
|
20499 |
-
"total_flos":
|
20500 |
"train_batch_size": 1,
|
20501 |
"trial_name": null,
|
20502 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.04092838987708092,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
|
4 |
+
"epoch": 1.4150562004226517,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 11550,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
20477 |
"eval_steps_per_second": 0.763,
|
20478 |
"num_input_tokens_seen": 76876640,
|
20479 |
"step": 11500
|
20480 |
+
},
|
20481 |
+
{
|
20482 |
+
"epoch": 1.4095433524241217,
|
20483 |
+
"grad_norm": 1.9377460735178373,
|
20484 |
+
"learning_rate": 2.199502336588885e-05,
|
20485 |
+
"loss": 0.2269,
|
20486 |
+
"num_input_tokens_seen": 76910112,
|
20487 |
+
"step": 11505
|
20488 |
+
},
|
20489 |
+
{
|
20490 |
+
"epoch": 1.4101558910906251,
|
20491 |
+
"grad_norm": 1.2074376841787913,
|
20492 |
+
"learning_rate": 2.1953079675050498e-05,
|
20493 |
+
"loss": 0.2547,
|
20494 |
+
"num_input_tokens_seen": 76943248,
|
20495 |
+
"step": 11510
|
20496 |
+
},
|
20497 |
+
{
|
20498 |
+
"epoch": 1.4107684297571284,
|
20499 |
+
"grad_norm": 1.6673139338465959,
|
20500 |
+
"learning_rate": 2.1911164762789682e-05,
|
20501 |
+
"loss": 0.2192,
|
20502 |
+
"num_input_tokens_seen": 76976416,
|
20503 |
+
"step": 11515
|
20504 |
+
},
|
20505 |
+
{
|
20506 |
+
"epoch": 1.4113809684236318,
|
20507 |
+
"grad_norm": 1.0347317776135743,
|
20508 |
+
"learning_rate": 2.1869278672114762e-05,
|
20509 |
+
"loss": 0.1972,
|
20510 |
+
"num_input_tokens_seen": 77010144,
|
20511 |
+
"step": 11520
|
20512 |
+
},
|
20513 |
+
{
|
20514 |
+
"epoch": 1.411993507090135,
|
20515 |
+
"grad_norm": 1.0706084397278428,
|
20516 |
+
"learning_rate": 2.182742144600448e-05,
|
20517 |
+
"loss": 0.1968,
|
20518 |
+
"num_input_tokens_seen": 77044016,
|
20519 |
+
"step": 11525
|
20520 |
+
},
|
20521 |
+
{
|
20522 |
+
"epoch": 1.4126060457566383,
|
20523 |
+
"grad_norm": 1.3935001170007235,
|
20524 |
+
"learning_rate": 2.1785593127407993e-05,
|
20525 |
+
"loss": 0.1695,
|
20526 |
+
"num_input_tokens_seen": 77077688,
|
20527 |
+
"step": 11530
|
20528 |
+
},
|
20529 |
+
{
|
20530 |
+
"epoch": 1.4132185844231417,
|
20531 |
+
"grad_norm": 1.0019449876645863,
|
20532 |
+
"learning_rate": 2.1743793759244807e-05,
|
20533 |
+
"loss": 0.2303,
|
20534 |
+
"num_input_tokens_seen": 77111176,
|
20535 |
+
"step": 11535
|
20536 |
+
},
|
20537 |
+
{
|
20538 |
+
"epoch": 1.413831123089645,
|
20539 |
+
"grad_norm": 1.522429135029562,
|
20540 |
+
"learning_rate": 2.1702023384404706e-05,
|
20541 |
+
"loss": 0.2219,
|
20542 |
+
"num_input_tokens_seen": 77144408,
|
20543 |
+
"step": 11540
|
20544 |
+
},
|
20545 |
+
{
|
20546 |
+
"epoch": 1.4144436617561484,
|
20547 |
+
"grad_norm": 1.1253675763175544,
|
20548 |
+
"learning_rate": 2.1660282045747698e-05,
|
20549 |
+
"loss": 0.2047,
|
20550 |
+
"num_input_tokens_seen": 77177960,
|
20551 |
+
"step": 11545
|
20552 |
+
},
|
20553 |
+
{
|
20554 |
+
"epoch": 1.4150562004226517,
|
20555 |
+
"grad_norm": 1.163967526127202,
|
20556 |
+
"learning_rate": 2.1618569786104063e-05,
|
20557 |
+
"loss": 0.2299,
|
20558 |
+
"num_input_tokens_seen": 77211216,
|
20559 |
+
"step": 11550
|
20560 |
+
},
|
20561 |
+
{
|
20562 |
+
"epoch": 1.4150562004226517,
|
20563 |
+
"eval_loss": 0.18886250257492065,
|
20564 |
+
"eval_runtime": 19.3477,
|
20565 |
+
"eval_samples_per_second": 3.101,
|
20566 |
+
"eval_steps_per_second": 0.775,
|
20567 |
+
"num_input_tokens_seen": 77211216,
|
20568 |
+
"step": 11550
|
20569 |
}
|
20570 |
],
|
20571 |
"logging_steps": 5,
|
20572 |
"max_steps": 16324,
|
20573 |
+
"num_input_tokens_seen": 77211216,
|
20574 |
"num_train_epochs": 2,
|
20575 |
"save_steps": 50,
|
20576 |
"stateful_callbacks": {
|
|
|
20585 |
"attributes": {}
|
20586 |
}
|
20587 |
},
|
20588 |
+
"total_flos": 4842978796765184.0,
|
20589 |
"train_batch_size": 1,
|
20590 |
"trial_name": null,
|
20591 |
"trial_params": null
|