CocoRoF commited on
Commit
a9bcdd1
·
verified ·
1 Parent(s): 5417c2b

Training in progress, step 188, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44422a94a97be5919c4f8acf50c2d6cc910db29c178068c091ab4d9dfb7add7f
3
  size 368988278
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5fee9b3be3ceee10186d35e87ac0167e8f551634db0ee10b7fd71dcdb471a64
3
  size 368988278
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27486bbb86c05ad439b79d09b4e894cab395d3edf735d4ca92b233100a99ffac
3
  size 1107079290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3edc9997421f59a2bab339723bfa57da56d3a3caeb07533babc705299d70ed21
3
  size 1107079290
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d9b86dea31fa233a9cd83c58b8309c25b99ab9d7e9c98c615fdb07adc8f1bd6
3
  size 1000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:906448df3b925c4237703b09a08232c313d6b304e3d61120e14d73631f8cabd0
3
  size 1000
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5304600082884376,
5
  "eval_steps": 100,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -85,6 +85,62 @@
85
  "eval_samples_per_second": 821.122,
86
  "eval_steps_per_second": 25.712,
87
  "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
88
  }
89
  ],
90
  "logging_steps": 10,
@@ -99,12 +155,12 @@
99
  "should_evaluate": false,
100
  "should_log": false,
101
  "should_save": true,
102
- "should_training_stop": false
103
  },
104
  "attributes": {}
105
  }
106
  },
107
- "total_flos": 2.7611165777461248e+17,
108
  "train_batch_size": 4,
109
  "trial_name": null,
110
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9972648155822628,
5
  "eval_steps": 100,
6
+ "global_step": 188,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
85
  "eval_samples_per_second": 821.122,
86
  "eval_steps_per_second": 25.712,
87
  "step": 100
88
+ },
89
+ {
90
+ "epoch": 0.5835060091172813,
91
+ "grad_norm": 13.484375,
92
+ "learning_rate": 9.988603516333233e-07,
93
+ "loss": 24.8423,
94
+ "step": 110
95
+ },
96
+ {
97
+ "epoch": 0.6365520099461252,
98
+ "grad_norm": 12.78125,
99
+ "learning_rate": 9.987567472363527e-07,
100
+ "loss": 24.5701,
101
+ "step": 120
102
+ },
103
+ {
104
+ "epoch": 0.689598010774969,
105
+ "grad_norm": 13.5625,
106
+ "learning_rate": 9.98653142839382e-07,
107
+ "loss": 24.5008,
108
+ "step": 130
109
+ },
110
+ {
111
+ "epoch": 0.7426440116038127,
112
+ "grad_norm": 10.8046875,
113
+ "learning_rate": 9.985495384424114e-07,
114
+ "loss": 24.1657,
115
+ "step": 140
116
+ },
117
+ {
118
+ "epoch": 0.7956900124326565,
119
+ "grad_norm": 15.5078125,
120
+ "learning_rate": 9.984459340454408e-07,
121
+ "loss": 24.2864,
122
+ "step": 150
123
+ },
124
+ {
125
+ "epoch": 0.8487360132615002,
126
+ "grad_norm": 11.609375,
127
+ "learning_rate": 9.983423296484702e-07,
128
+ "loss": 24.0425,
129
+ "step": 160
130
+ },
131
+ {
132
+ "epoch": 0.901782014090344,
133
+ "grad_norm": 11.1171875,
134
+ "learning_rate": 9.982387252514998e-07,
135
+ "loss": 24.1412,
136
+ "step": 170
137
+ },
138
+ {
139
+ "epoch": 0.9548280149191878,
140
+ "grad_norm": 15.390625,
141
+ "learning_rate": 9.98135120854529e-07,
142
+ "loss": 23.766,
143
+ "step": 180
144
  }
145
  ],
146
  "logging_steps": 10,
 
155
  "should_evaluate": false,
156
  "should_log": false,
157
  "should_save": true,
158
+ "should_training_stop": true
159
  },
160
  "attributes": {}
161
  }
162
  },
163
+ "total_flos": 5.1908991489828454e+17,
164
  "train_batch_size": 4,
165
  "trial_name": null,
166
  "trial_params": null