RodrigoSalazar-U committed on
Commit
775afe4
·
verified ·
1 Parent(s): 13f44cb

Training in progress, step 2500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4380650dcb89ea554e8e522387212bf4d52c5c83459f83e79d11aeaa75e938f3
3
  size 4785762744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55fb81428939778dab08e7922db21d016e3f504c05107e029c92f5fce46fe882
3
  size 4785762744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6265fff472063a8acba8dfd3c39858c1d92510671c7894dd6142eea88a2418a
3
  size 3497859804
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a229809403e9c000da99928a1a77232623f005939cd31324d820e5637351f23b
3
  size 3497859804
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2b5794f891efa039dc7974b27a227de46156bc8c7ebd7ea9d3d86467b6bab57
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eba198d9667b25aa3e1e3ed428937b84fcb61b09b165df40f8a2db486d218cb8
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.095290251916758,
5
  "eval_steps": 500,
6
- "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -147,6 +147,41 @@
147
  "learning_rate": 9.574389385212366e-05,
148
  "loss": 1.1348,
149
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
150
  }
151
  ],
152
  "logging_steps": 100,
@@ -166,7 +201,7 @@
166
  "attributes": {}
167
  }
168
  },
169
- "total_flos": 9.642466312538358e+17,
170
  "train_batch_size": 16,
171
  "trial_name": null,
172
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.3691128148959475,
5
  "eval_steps": 500,
6
+ "global_step": 2500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
147
  "learning_rate": 9.574389385212366e-05,
148
  "loss": 1.1348,
149
  "step": 2000
150
+ },
151
+ {
152
+ "epoch": 1.1500547645125958,
153
+ "grad_norm": 2.488781213760376,
154
+ "learning_rate": 9.493886427336657e-05,
155
+ "loss": 1.1794,
156
+ "step": 2100
157
+ },
158
+ {
159
+ "epoch": 1.2048192771084336,
160
+ "grad_norm": 2.216630697250366,
161
+ "learning_rate": 9.406815330073244e-05,
162
+ "loss": 1.1533,
163
+ "step": 2200
164
+ },
165
+ {
166
+ "epoch": 1.2595837897042717,
167
+ "grad_norm": 2.5205495357513428,
168
+ "learning_rate": 9.313303354115677e-05,
169
+ "loss": 1.1383,
170
+ "step": 2300
171
+ },
172
+ {
173
+ "epoch": 1.3143483023001095,
174
+ "grad_norm": 2.7046151161193848,
175
+ "learning_rate": 9.213487173966623e-05,
176
+ "loss": 1.1639,
177
+ "step": 2400
178
+ },
179
+ {
180
+ "epoch": 1.3691128148959475,
181
+ "grad_norm": 2.2721831798553467,
182
+ "learning_rate": 9.107512678178223e-05,
183
+ "loss": 1.1572,
184
+ "step": 2500
185
  }
186
  ],
187
  "logging_steps": 100,
 
201
  "attributes": {}
202
  }
203
  },
204
+ "total_flos": 1.2070042691739648e+18,
205
  "train_batch_size": 16,
206
  "trial_name": null,
207
  "trial_params": null