joe611 committed on
Commit
28ae9e0
·
verified ·
1 Parent(s): bd09b4b

Training in progress, epoch 44, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d69a853ce44d2a4c6a1f289809b194fbf5a858060c6c022ed50371f82355daf
3
  size 166496880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf72785f9e61f422066d5a55b0560c4c8a69464b26be32f4db1debc616942689
3
  size 166496880
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8897b9557334ef700d8217bf78bf859bb2374469468874a040168b0470cc76f
3
  size 330495866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a41339ed91a0fc5aebfb27479aad8c07d748b799c7840c36fbe1be25b37e1ab
3
  size 330495866
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85e4133488da63327fc9ea031838bb6fd69fb43cc377eec164eb44278dfb4b45
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef8c417a427a4d61d5632cb068a6069c159668c42d4b0b7a6a15b8a00b11eecc
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:545d510515f5179456e33cb07c6feb588b2ff2a682f4164e86878f83fb45a36d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fa74708df9c1325cdd60797f5ccc467462cf147fdacd71b5f8d7ef24d6392cd
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.29740211367607117,
3
  "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-21500",
4
- "epoch": 43.0,
5
  "eval_steps": 500,
6
- "global_step": 21500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -6137,6 +6137,151 @@
6137
  "eval_samples_per_second": 17.724,
6138
  "eval_steps_per_second": 2.304,
6139
  "step": 21500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6140
  }
6141
  ],
6142
  "logging_steps": 30,
@@ -6156,7 +6301,7 @@
6156
  "attributes": {}
6157
  }
6158
  },
6159
- "total_flos": 7.3964969275392e+18,
6160
  "train_batch_size": 2,
6161
  "trial_name": null,
6162
  "trial_params": null
 
1
  {
2
  "best_metric": 0.29740211367607117,
3
  "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-21500",
4
+ "epoch": 44.0,
5
  "eval_steps": 500,
6
+ "global_step": 22000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
6137
  "eval_samples_per_second": 17.724,
6138
  "eval_steps_per_second": 2.304,
6139
  "step": 21500
6140
+ },
6141
+ {
6142
+ "epoch": 43.02,
6143
+ "grad_norm": 44.15309143066406,
6144
+ "learning_rate": 1.8493306440731557e-06,
6145
+ "loss": 0.4896,
6146
+ "step": 21510
6147
+ },
6148
+ {
6149
+ "epoch": 43.08,
6150
+ "grad_norm": 35.48102951049805,
6151
+ "learning_rate": 1.837149190434378e-06,
6152
+ "loss": 0.5013,
6153
+ "step": 21540
6154
+ },
6155
+ {
6156
+ "epoch": 43.14,
6157
+ "grad_norm": 35.87041473388672,
6158
+ "learning_rate": 1.824998952856198e-06,
6159
+ "loss": 0.4439,
6160
+ "step": 21570
6161
+ },
6162
+ {
6163
+ "epoch": 43.2,
6164
+ "grad_norm": 26.650522232055664,
6165
+ "learning_rate": 1.8128800512565514e-06,
6166
+ "loss": 0.4186,
6167
+ "step": 21600
6168
+ },
6169
+ {
6170
+ "epoch": 43.26,
6171
+ "grad_norm": 48.30433654785156,
6172
+ "learning_rate": 1.800792605244109e-06,
6173
+ "loss": 0.4345,
6174
+ "step": 21630
6175
+ },
6176
+ {
6177
+ "epoch": 43.32,
6178
+ "grad_norm": 70.63233184814453,
6179
+ "learning_rate": 1.7887367341170781e-06,
6180
+ "loss": 0.4639,
6181
+ "step": 21660
6182
+ },
6183
+ {
6184
+ "epoch": 43.38,
6185
+ "grad_norm": 29.950109481811523,
6186
+ "learning_rate": 1.7767125568620442e-06,
6187
+ "loss": 0.3931,
6188
+ "step": 21690
6189
+ },
6190
+ {
6191
+ "epoch": 43.44,
6192
+ "grad_norm": 40.98532485961914,
6193
+ "learning_rate": 1.7647201921527802e-06,
6194
+ "loss": 0.3728,
6195
+ "step": 21720
6196
+ },
6197
+ {
6198
+ "epoch": 43.5,
6199
+ "grad_norm": 107.21430969238281,
6200
+ "learning_rate": 1.7527597583490825e-06,
6201
+ "loss": 0.3679,
6202
+ "step": 21750
6203
+ },
6204
+ {
6205
+ "epoch": 43.56,
6206
+ "grad_norm": 41.53556442260742,
6207
+ "learning_rate": 1.7408313734956074e-06,
6208
+ "loss": 0.4278,
6209
+ "step": 21780
6210
+ },
6211
+ {
6212
+ "epoch": 43.62,
6213
+ "grad_norm": 30.475116729736328,
6214
+ "learning_rate": 1.7289351553206952e-06,
6215
+ "loss": 0.4995,
6216
+ "step": 21810
6217
+ },
6218
+ {
6219
+ "epoch": 43.68,
6220
+ "grad_norm": 65.69325256347656,
6221
+ "learning_rate": 1.7170712212352187e-06,
6222
+ "loss": 0.4236,
6223
+ "step": 21840
6224
+ },
6225
+ {
6226
+ "epoch": 43.74,
6227
+ "grad_norm": 83.24858856201172,
6228
+ "learning_rate": 1.7052396883314154e-06,
6229
+ "loss": 0.4865,
6230
+ "step": 21870
6231
+ },
6232
+ {
6233
+ "epoch": 43.8,
6234
+ "grad_norm": 49.75985336303711,
6235
+ "learning_rate": 1.6934406733817417e-06,
6236
+ "loss": 0.4061,
6237
+ "step": 21900
6238
+ },
6239
+ {
6240
+ "epoch": 43.86,
6241
+ "grad_norm": 0.0012297651264816523,
6242
+ "learning_rate": 1.6816742928377072e-06,
6243
+ "loss": 0.4391,
6244
+ "step": 21930
6245
+ },
6246
+ {
6247
+ "epoch": 43.92,
6248
+ "grad_norm": 107.39283752441406,
6249
+ "learning_rate": 1.6699406628287423e-06,
6250
+ "loss": 0.4027,
6251
+ "step": 21960
6252
+ },
6253
+ {
6254
+ "epoch": 43.98,
6255
+ "grad_norm": 53.299110412597656,
6256
+ "learning_rate": 1.658239899161036e-06,
6257
+ "loss": 0.7057,
6258
+ "step": 21990
6259
+ },
6260
+ {
6261
+ "epoch": 44.0,
6262
+ "eval_loss": 0.3092344403266907,
6263
+ "eval_map": 0.7822,
6264
+ "eval_map_50": 0.9563,
6265
+ "eval_map_75": 0.9171,
6266
+ "eval_map_chicken": 0.7941,
6267
+ "eval_map_duck": 0.7348,
6268
+ "eval_map_large": 0.8688,
6269
+ "eval_map_medium": 0.7813,
6270
+ "eval_map_plant": 0.8177,
6271
+ "eval_map_small": 0.1985,
6272
+ "eval_mar_1": 0.3003,
6273
+ "eval_mar_10": 0.8165,
6274
+ "eval_mar_100": 0.821,
6275
+ "eval_mar_100_chicken": 0.8307,
6276
+ "eval_mar_100_duck": 0.766,
6277
+ "eval_mar_100_plant": 0.8663,
6278
+ "eval_mar_large": 0.9117,
6279
+ "eval_mar_medium": 0.8292,
6280
+ "eval_mar_small": 0.3663,
6281
+ "eval_runtime": 5.0773,
6282
+ "eval_samples_per_second": 19.696,
6283
+ "eval_steps_per_second": 2.56,
6284
+ "step": 22000
6285
  }
6286
  ],
6287
  "logging_steps": 30,
 
6301
  "attributes": {}
6302
  }
6303
  },
6304
+ "total_flos": 7.5685084839936e+18,
6305
  "train_batch_size": 2,
6306
  "trial_name": null,
6307
  "trial_params": null