Training in progress, step 11300, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step11300/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step11300/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step11300/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step11300/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step11300/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step11300/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step11300/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step11300/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +93 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13efb40e4419c7d85f3627cf4be90e793b7c958c288dd93caa0f9742cf099b52
|
3 |
size 29034840
|
last-checkpoint/global_step11300/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb802d8b86235178665864fbb8ac0a2d8cc103f64e9d72caf23fb6e3b30bc173
|
3 |
+
size 43429616
|
last-checkpoint/global_step11300/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d59663bafaeadc76928159ee71b811e9501b3da4277d8cdaee213beabf2b9da
|
3 |
+
size 43429616
|
last-checkpoint/global_step11300/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da9971a5df55a8e75ba053ab35e571ac89307b948c81e7a459ad4aa7166413a9
|
3 |
+
size 43429616
|
last-checkpoint/global_step11300/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c931493e3d1843ce7136cc5454793b356933d0859834a642a3af1f1f57ab815d
|
3 |
+
size 43429616
|
last-checkpoint/global_step11300/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d27a356619bf2aeb319d6d4b36b16a211f3a00d7a8ad3d979ab97bca0449c25
|
3 |
+
size 637299
|
last-checkpoint/global_step11300/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f06f9ad45b985bd13fd66edcf8c3140a7e5152c4e23ca926082bba24d7b4ae58
|
3 |
+
size 637171
|
last-checkpoint/global_step11300/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03d1a707bf667b2d3b242904ce05774deae98948c837620280dc3f5caa5763cd
|
3 |
+
size 637171
|
last-checkpoint/global_step11300/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db77e63a3d2d066be9e5b032ea872110bfdda0f062186f69470d70f45fd00b4a
|
3 |
+
size 637171
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step11300
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:858ef8d7925623c0290dd48d3c1775956d2df1380248fe1e7339f8a0b415d547
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab44a085ef8790893a6f0df127f223489bfbeac213c9397164eddee9bc6c25eb
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c469fffe8e3187c4d889f94a989ff4da7c85bf387c16e6fe1df6bccdda364757
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee1750daf75d7819cbd209b848de90eebc52fd951d1456db1e437c3e2e58a878
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f966d63b3b12fcd2b927c440da7d42e743950f341fa7654264fd2798d3e54a64
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.04092838987708092,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
|
4 |
-
"epoch": 1.
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -20032,11 +20032,100 @@
|
|
20032 |
"eval_steps_per_second": 0.738,
|
20033 |
"num_input_tokens_seen": 75199264,
|
20034 |
"step": 11250
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
20035 |
}
|
20036 |
],
|
20037 |
"logging_steps": 5,
|
20038 |
"max_steps": 16324,
|
20039 |
-
"num_input_tokens_seen":
|
20040 |
"num_train_epochs": 2,
|
20041 |
"save_steps": 50,
|
20042 |
"stateful_callbacks": {
|
@@ -20051,7 +20140,7 @@
|
|
20051 |
"attributes": {}
|
20052 |
}
|
20053 |
},
|
20054 |
-
"total_flos":
|
20055 |
"train_batch_size": 1,
|
20056 |
"trial_name": null,
|
20057 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.04092838987708092,
|
3 |
"best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
|
4 |
+
"epoch": 1.3844292670974856,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 11300,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
20032 |
"eval_steps_per_second": 0.738,
|
20033 |
"num_input_tokens_seen": 75199264,
|
20034 |
"step": 11250
|
20035 |
+
},
|
20036 |
+
{
|
20037 |
+
"epoch": 1.3789164190989556,
|
20038 |
+
"grad_norm": 2.338623943755047,
|
20039 |
+
"learning_rate": 2.4127941590292225e-05,
|
20040 |
+
"loss": 0.2058,
|
20041 |
+
"num_input_tokens_seen": 75232800,
|
20042 |
+
"step": 11255
|
20043 |
+
},
|
20044 |
+
{
|
20045 |
+
"epoch": 1.379528957765459,
|
20046 |
+
"grad_norm": 1.2367938341116378,
|
20047 |
+
"learning_rate": 2.408461444677841e-05,
|
20048 |
+
"loss": 0.2428,
|
20049 |
+
"num_input_tokens_seen": 75266240,
|
20050 |
+
"step": 11260
|
20051 |
+
},
|
20052 |
+
{
|
20053 |
+
"epoch": 1.3801414964319623,
|
20054 |
+
"grad_norm": 1.2910846803839258,
|
20055 |
+
"learning_rate": 2.404131389470223e-05,
|
20056 |
+
"loss": 0.1717,
|
20057 |
+
"num_input_tokens_seen": 75300144,
|
20058 |
+
"step": 11265
|
20059 |
+
},
|
20060 |
+
{
|
20061 |
+
"epoch": 1.3807540350984655,
|
20062 |
+
"grad_norm": 30.973267810423224,
|
20063 |
+
"learning_rate": 2.399803997849381e-05,
|
20064 |
+
"loss": 0.2426,
|
20065 |
+
"num_input_tokens_seen": 75333520,
|
20066 |
+
"step": 11270
|
20067 |
+
},
|
20068 |
+
{
|
20069 |
+
"epoch": 1.381366573764969,
|
20070 |
+
"grad_norm": 1.8951469707567008,
|
20071 |
+
"learning_rate": 2.3954792742555964e-05,
|
20072 |
+
"loss": 0.2372,
|
20073 |
+
"num_input_tokens_seen": 75367128,
|
20074 |
+
"step": 11275
|
20075 |
+
},
|
20076 |
+
{
|
20077 |
+
"epoch": 1.3819791124314722,
|
20078 |
+
"grad_norm": 0.9192799991547025,
|
20079 |
+
"learning_rate": 2.391157223126409e-05,
|
20080 |
+
"loss": 0.1993,
|
20081 |
+
"num_input_tokens_seen": 75400848,
|
20082 |
+
"step": 11280
|
20083 |
+
},
|
20084 |
+
{
|
20085 |
+
"epoch": 1.3825916510979757,
|
20086 |
+
"grad_norm": 1.2457276675807318,
|
20087 |
+
"learning_rate": 2.386837848896619e-05,
|
20088 |
+
"loss": 0.2131,
|
20089 |
+
"num_input_tokens_seen": 75433880,
|
20090 |
+
"step": 11285
|
20091 |
+
},
|
20092 |
+
{
|
20093 |
+
"epoch": 1.383204189764479,
|
20094 |
+
"grad_norm": 1.3290748045560505,
|
20095 |
+
"learning_rate": 2.382521155998283e-05,
|
20096 |
+
"loss": 0.1944,
|
20097 |
+
"num_input_tokens_seen": 75467816,
|
20098 |
+
"step": 11290
|
20099 |
+
},
|
20100 |
+
{
|
20101 |
+
"epoch": 1.3838167284309821,
|
20102 |
+
"grad_norm": 1.4277851260847876,
|
20103 |
+
"learning_rate": 2.378207148860699e-05,
|
20104 |
+
"loss": 0.2091,
|
20105 |
+
"num_input_tokens_seen": 75501792,
|
20106 |
+
"step": 11295
|
20107 |
+
},
|
20108 |
+
{
|
20109 |
+
"epoch": 1.3844292670974856,
|
20110 |
+
"grad_norm": 1.0730262567819877,
|
20111 |
+
"learning_rate": 2.3738958319104145e-05,
|
20112 |
+
"loss": 0.1914,
|
20113 |
+
"num_input_tokens_seen": 75535760,
|
20114 |
+
"step": 11300
|
20115 |
+
},
|
20116 |
+
{
|
20117 |
+
"epoch": 1.3844292670974856,
|
20118 |
+
"eval_loss": 0.12553976476192474,
|
20119 |
+
"eval_runtime": 19.7973,
|
20120 |
+
"eval_samples_per_second": 3.031,
|
20121 |
+
"eval_steps_per_second": 0.758,
|
20122 |
+
"num_input_tokens_seen": 75535760,
|
20123 |
+
"step": 11300
|
20124 |
}
|
20125 |
],
|
20126 |
"logging_steps": 5,
|
20127 |
"max_steps": 16324,
|
20128 |
+
"num_input_tokens_seen": 75535760,
|
20129 |
"num_train_epochs": 2,
|
20130 |
"save_steps": 50,
|
20131 |
"stateful_callbacks": {
|
|
|
20140 |
"attributes": {}
|
20141 |
}
|
20142 |
},
|
20143 |
+
"total_flos": 4737864310456320.0,
|
20144 |
"train_batch_size": 1,
|
20145 |
"trial_name": null,
|
20146 |
"trial_params": null
|