ben81828 committed on
Commit
bc78679
·
verified ·
1 Parent(s): e61069c

Training in progress, step 11300, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90d81778cc2ef2c0aaa7e9d5a71c766e915039a5b82802bed36df17267327dab
3
  size 29034840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13efb40e4419c7d85f3627cf4be90e793b7c958c288dd93caa0f9742cf099b52
3
  size 29034840
last-checkpoint/global_step11300/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb802d8b86235178665864fbb8ac0a2d8cc103f64e9d72caf23fb6e3b30bc173
3
+ size 43429616
last-checkpoint/global_step11300/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d59663bafaeadc76928159ee71b811e9501b3da4277d8cdaee213beabf2b9da
3
+ size 43429616
last-checkpoint/global_step11300/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da9971a5df55a8e75ba053ab35e571ac89307b948c81e7a459ad4aa7166413a9
3
+ size 43429616
last-checkpoint/global_step11300/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c931493e3d1843ce7136cc5454793b356933d0859834a642a3af1f1f57ab815d
3
+ size 43429616
last-checkpoint/global_step11300/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d27a356619bf2aeb319d6d4b36b16a211f3a00d7a8ad3d979ab97bca0449c25
3
+ size 637299
last-checkpoint/global_step11300/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f06f9ad45b985bd13fd66edcf8c3140a7e5152c4e23ca926082bba24d7b4ae58
3
+ size 637171
last-checkpoint/global_step11300/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03d1a707bf667b2d3b242904ce05774deae98948c837620280dc3f5caa5763cd
3
+ size 637171
last-checkpoint/global_step11300/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db77e63a3d2d066be9e5b032ea872110bfdda0f062186f69470d70f45fd00b4a
3
+ size 637171
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step11250
 
1
+ global_step11300
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9391df12420771e7a23f32c8c5b113ad4ba3e3b50a3af0ebc693d5897bac878c
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:858ef8d7925623c0290dd48d3c1775956d2df1380248fe1e7339f8a0b415d547
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b40ebbcfd0ebca5d6541a1ff18ce4792f88fde2908fabcabe69adab7e824a131
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab44a085ef8790893a6f0df127f223489bfbeac213c9397164eddee9bc6c25eb
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f69c0d167e1a2d884bd8d50f1c2aab03354407d35f58d8f1af272c5a22f54a6
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c469fffe8e3187c4d889f94a989ff4da7c85bf387c16e6fe1df6bccdda364757
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38b96cd40243779805fff577c7aff03639ba272fbec3e396db7be9f3c4eeb72a
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee1750daf75d7819cbd209b848de90eebc52fd951d1456db1e437c3e2e58a878
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc6d4bc5d8885e14143685c986f72b4c0e5389631fdc959ac8dbb2e59c4e74f3
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f966d63b3b12fcd2b927c440da7d42e743950f341fa7654264fd2798d3e54a64
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.04092838987708092,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
4
- "epoch": 1.3783038804324523,
5
  "eval_steps": 50,
6
- "global_step": 11250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -20032,11 +20032,100 @@
20032
  "eval_steps_per_second": 0.738,
20033
  "num_input_tokens_seen": 75199264,
20034
  "step": 11250
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20035
  }
20036
  ],
20037
  "logging_steps": 5,
20038
  "max_steps": 16324,
20039
- "num_input_tokens_seen": 75199264,
20040
  "num_train_epochs": 2,
20041
  "save_steps": 50,
20042
  "stateful_callbacks": {
@@ -20051,7 +20140,7 @@
20051
  "attributes": {}
20052
  }
20053
  },
20054
- "total_flos": 4716812931301376.0,
20055
  "train_batch_size": 1,
20056
  "trial_name": null,
20057
  "trial_params": null
 
1
  {
2
  "best_metric": 0.04092838987708092,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_detect_classify_augmented/lora/sft/checkpoint-9050",
4
+ "epoch": 1.3844292670974856,
5
  "eval_steps": 50,
6
+ "global_step": 11300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
20032
  "eval_steps_per_second": 0.738,
20033
  "num_input_tokens_seen": 75199264,
20034
  "step": 11250
20035
+ },
20036
+ {
20037
+ "epoch": 1.3789164190989556,
20038
+ "grad_norm": 2.338623943755047,
20039
+ "learning_rate": 2.4127941590292225e-05,
20040
+ "loss": 0.2058,
20041
+ "num_input_tokens_seen": 75232800,
20042
+ "step": 11255
20043
+ },
20044
+ {
20045
+ "epoch": 1.379528957765459,
20046
+ "grad_norm": 1.2367938341116378,
20047
+ "learning_rate": 2.408461444677841e-05,
20048
+ "loss": 0.2428,
20049
+ "num_input_tokens_seen": 75266240,
20050
+ "step": 11260
20051
+ },
20052
+ {
20053
+ "epoch": 1.3801414964319623,
20054
+ "grad_norm": 1.2910846803839258,
20055
+ "learning_rate": 2.404131389470223e-05,
20056
+ "loss": 0.1717,
20057
+ "num_input_tokens_seen": 75300144,
20058
+ "step": 11265
20059
+ },
20060
+ {
20061
+ "epoch": 1.3807540350984655,
20062
+ "grad_norm": 30.973267810423224,
20063
+ "learning_rate": 2.399803997849381e-05,
20064
+ "loss": 0.2426,
20065
+ "num_input_tokens_seen": 75333520,
20066
+ "step": 11270
20067
+ },
20068
+ {
20069
+ "epoch": 1.381366573764969,
20070
+ "grad_norm": 1.8951469707567008,
20071
+ "learning_rate": 2.3954792742555964e-05,
20072
+ "loss": 0.2372,
20073
+ "num_input_tokens_seen": 75367128,
20074
+ "step": 11275
20075
+ },
20076
+ {
20077
+ "epoch": 1.3819791124314722,
20078
+ "grad_norm": 0.9192799991547025,
20079
+ "learning_rate": 2.391157223126409e-05,
20080
+ "loss": 0.1993,
20081
+ "num_input_tokens_seen": 75400848,
20082
+ "step": 11280
20083
+ },
20084
+ {
20085
+ "epoch": 1.3825916510979757,
20086
+ "grad_norm": 1.2457276675807318,
20087
+ "learning_rate": 2.386837848896619e-05,
20088
+ "loss": 0.2131,
20089
+ "num_input_tokens_seen": 75433880,
20090
+ "step": 11285
20091
+ },
20092
+ {
20093
+ "epoch": 1.383204189764479,
20094
+ "grad_norm": 1.3290748045560505,
20095
+ "learning_rate": 2.382521155998283e-05,
20096
+ "loss": 0.1944,
20097
+ "num_input_tokens_seen": 75467816,
20098
+ "step": 11290
20099
+ },
20100
+ {
20101
+ "epoch": 1.3838167284309821,
20102
+ "grad_norm": 1.4277851260847876,
20103
+ "learning_rate": 2.378207148860699e-05,
20104
+ "loss": 0.2091,
20105
+ "num_input_tokens_seen": 75501792,
20106
+ "step": 11295
20107
+ },
20108
+ {
20109
+ "epoch": 1.3844292670974856,
20110
+ "grad_norm": 1.0730262567819877,
20111
+ "learning_rate": 2.3738958319104145e-05,
20112
+ "loss": 0.1914,
20113
+ "num_input_tokens_seen": 75535760,
20114
+ "step": 11300
20115
+ },
20116
+ {
20117
+ "epoch": 1.3844292670974856,
20118
+ "eval_loss": 0.12553976476192474,
20119
+ "eval_runtime": 19.7973,
20120
+ "eval_samples_per_second": 3.031,
20121
+ "eval_steps_per_second": 0.758,
20122
+ "num_input_tokens_seen": 75535760,
20123
+ "step": 11300
20124
  }
20125
  ],
20126
  "logging_steps": 5,
20127
  "max_steps": 16324,
20128
+ "num_input_tokens_seen": 75535760,
20129
  "num_train_epochs": 2,
20130
  "save_steps": 50,
20131
  "stateful_callbacks": {
 
20140
  "attributes": {}
20141
  }
20142
  },
20143
+ "total_flos": 4737864310456320.0,
20144
  "train_batch_size": 1,
20145
  "trial_name": null,
20146
  "trial_params": null