lesso committed on
Commit
2e77f5d
·
verified ·
1 Parent(s): d924fe0

Training in progress, step 200, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2b7fab8e5c707684dd7dcf2acfeef02dc66a45c810d37881d6d35ab0138813e
3
  size 338298
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9ac74b39f72854d193986d03bc840a1c04412975226a003ddf6f9712ea85a29
3
  size 338298
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cadb54f5b4b7cf6e5570f8b8aa5d66a30d9e31f2de3c6b5c891900bdb9053acc
3
  size 418030
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:543b0438259af00bb05f335870bb7e86c3bf831f69c1ab4c7de1da70e4df1a1a
3
  size 418030
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:039fcb416f3a29717abd0881d31fed0ae41a339ceb603e8a0d9a2989535c8efc
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0fa569ae9431ecec1ad250d458bd97a0680dbd03fc69e453a6363003309127e
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:921ab0de3764126581ec39378879cb5b5f7b00db4d38a319c5350418d3b5b284
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25f5be5717b8cedfd0ed40abce613b5b748b90320bdb20c1f1ab3a4f8a9f9654
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 6.850296497344971,
3
- "best_model_checkpoint": "miner_id_24/checkpoint-150",
4
- "epoch": 1.4527845036319613,
5
  "eval_steps": 50,
6
- "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -60,6 +60,21 @@
60
  "eval_samples_per_second": 1326.165,
61
  "eval_steps_per_second": 41.979,
62
  "step": 150
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  }
64
  ],
65
  "logging_steps": 50,
@@ -88,7 +103,7 @@
88
  "attributes": {}
89
  }
90
  },
91
- "total_flos": 6325423902720.0,
92
  "train_batch_size": 32,
93
  "trial_name": null,
94
  "trial_params": null
 
1
  {
2
+ "best_metric": 6.843703746795654,
3
+ "best_model_checkpoint": "miner_id_24/checkpoint-200",
4
+ "epoch": 1.937046004842615,
5
  "eval_steps": 50,
6
+ "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
60
  "eval_samples_per_second": 1326.165,
61
  "eval_steps_per_second": 41.979,
62
  "step": 150
63
+ },
64
+ {
65
+ "epoch": 1.937046004842615,
66
+ "grad_norm": 0.13267219066619873,
67
+ "learning_rate": 0.000202,
68
+ "loss": 6.8475,
69
+ "step": 200
70
+ },
71
+ {
72
+ "epoch": 1.937046004842615,
73
+ "eval_loss": 6.843703746795654,
74
+ "eval_runtime": 0.7287,
75
+ "eval_samples_per_second": 953.768,
76
+ "eval_steps_per_second": 30.191,
77
+ "step": 200
78
  }
79
  ],
80
  "logging_steps": 50,
 
103
  "attributes": {}
104
  }
105
  },
106
+ "total_flos": 8430294306816.0,
107
  "train_batch_size": 32,
108
  "trial_name": null,
109
  "trial_params": null