YYYYYYibo committed on
Commit
b0b9891
·
verified ·
1 Parent(s): 00cf010

Model save

Browse files
README.md CHANGED
@@ -2,14 +2,9 @@
2
  license: apache-2.0
3
  base_model: YYYYYYibo/full_vanilla_dpo_iter_1
4
  tags:
5
- - alignment-handbook
6
- - generated_from_trainer
7
  - trl
8
  - dpo
9
  - generated_from_trainer
10
- datasets:
11
- - updated
12
- - original
13
  model-index:
14
  - name: full_simple_online_iter_2
15
  results: []
@@ -20,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  # full_simple_online_iter_2
22
 
23
- This model is a fine-tuned version of [YYYYYYibo/full_vanilla_dpo_iter_1](https://huggingface.co/YYYYYYibo/full_vanilla_dpo_iter_1) on the updated and the original datasets.
24
 
25
  ## Model description
26
 
 
2
  license: apache-2.0
3
  base_model: YYYYYYibo/full_vanilla_dpo_iter_1
4
  tags:
 
 
5
  - trl
6
  - dpo
7
  - generated_from_trainer
 
 
 
8
  model-index:
9
  - name: full_simple_online_iter_2
10
  results: []
 
15
 
16
  # full_simple_online_iter_2
17
 
18
+ This model is a fine-tuned version of [YYYYYYibo/full_vanilla_dpo_iter_1](https://huggingface.co/YYYYYYibo/full_vanilla_dpo_iter_1) on the None dataset.
19
 
20
  ## Model description
21
 
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.6894009854342487,
4
- "train_runtime": 9025.6123,
5
- "train_samples": 19000,
6
- "train_samples_per_second": 2.105,
7
  "train_steps_per_second": 0.016
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 0.5776262069359804,
4
+ "train_runtime": 9474.0276,
5
+ "train_samples": 20000,
6
+ "train_samples_per_second": 2.111,
7
  "train_steps_per_second": 0.016
8
  }
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe86e2c25ad9ae983c498811e5a480ac3727f642766fef0236a11db3e13dcab0
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48cf9bd654703f1ed9fef98526910ec9c025c0d695da0b63c75a56bcd66db8fb
3
  size 4943162336
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:307c5e0242d47c8559d5c54f0a41b72bd4bc5610338b0aa2e8a209cfe8d24638
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcb19293e1e1d6426e90b5a675ba75b3277ca27d3bf76b59acb6072c131a4432
3
  size 4999819336
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00c242505930094b5941241990bc3657e0a553a43da834b995015f08c0718f9d
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2366e046327d3da5e5c7b3a83c25c1d3e1f07246246f7c73ac37b26d9f758300
3
  size 4540516344
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.6894009854342487,
4
- "train_runtime": 9025.6123,
5
- "train_samples": 19000,
6
- "train_samples_per_second": 2.105,
7
  "train_steps_per_second": 0.016
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 0.5776262069359804,
4
+ "train_runtime": 9474.0276,
5
+ "train_samples": 20000,
6
+ "train_samples_per_second": 2.111,
7
  "train_steps_per_second": 0.016
8
  }
trainer_state.json CHANGED
@@ -1,20 +1,20 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9966329966329966,
5
  "eval_steps": 500,
6
- "global_step": 148,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.01,
13
- "learning_rate": 3.3333333333333334e-08,
14
- "logits/chosen": -2.023646593093872,
15
- "logits/rejected": -1.861999750137329,
16
- "logps/chosen": -160.15196228027344,
17
- "logps/rejected": -164.30947875976562,
18
  "loss": 0.6931,
19
  "rewards/accuracies": 0.0,
20
  "rewards/chosen": 0.0,
@@ -23,213 +23,227 @@
23
  "step": 1
24
  },
25
  {
26
- "epoch": 0.07,
27
- "learning_rate": 3.333333333333333e-07,
28
- "logits/chosen": -1.8246960639953613,
29
- "logits/rejected": -1.874166488647461,
30
- "logps/chosen": -186.62855529785156,
31
- "logps/rejected": -191.06869506835938,
32
- "loss": 0.693,
33
- "rewards/accuracies": 0.4513888955116272,
34
- "rewards/chosen": -0.0028373675886541605,
35
- "rewards/margins": -9.477811545366421e-06,
36
- "rewards/rejected": -0.002827889285981655,
37
  "step": 10
38
  },
39
  {
40
  "epoch": 0.13,
41
- "learning_rate": 4.98258427321406e-07,
42
- "logits/chosen": -1.5834639072418213,
43
- "logits/rejected": -1.6468555927276611,
44
- "logps/chosen": -191.36276245117188,
45
- "logps/rejected": -201.68360900878906,
46
- "loss": 0.6936,
47
- "rewards/accuracies": 0.606249988079071,
48
- "rewards/chosen": -0.09236270189285278,
49
- "rewards/margins": 0.01027429848909378,
50
- "rewards/rejected": -0.10263700783252716,
51
  "step": 20
52
  },
53
  {
54
- "epoch": 0.2,
55
- "learning_rate": 4.844710954430464e-07,
56
- "logits/chosen": -1.572912335395813,
57
- "logits/rejected": -1.6341121196746826,
58
- "logps/chosen": -189.92250061035156,
59
- "logps/rejected": -188.98448181152344,
60
- "loss": 0.6947,
61
- "rewards/accuracies": 0.48750001192092896,
62
- "rewards/chosen": -0.10429297387599945,
63
- "rewards/margins": -0.007742973975837231,
64
- "rewards/rejected": -0.09655000269412994,
65
  "step": 30
66
  },
67
  {
68
- "epoch": 0.27,
69
- "learning_rate": 4.576621278295557e-07,
70
- "logits/chosen": -1.6369476318359375,
71
- "logits/rejected": -1.5702846050262451,
72
- "logps/chosen": -203.3102264404297,
73
- "logps/rejected": -203.18093872070312,
74
- "loss": 0.6897,
75
- "rewards/accuracies": 0.550000011920929,
76
- "rewards/chosen": -0.03835677355527878,
77
- "rewards/margins": 0.012528707273304462,
78
- "rewards/rejected": -0.05088547617197037,
79
  "step": 40
80
  },
81
  {
82
- "epoch": 0.34,
83
- "learning_rate": 4.193203929064353e-07,
84
- "logits/chosen": -1.3983080387115479,
85
- "logits/rejected": -1.405611276626587,
86
- "logps/chosen": -200.58035278320312,
87
- "logps/rejected": -205.0247802734375,
88
- "loss": 0.6879,
89
- "rewards/accuracies": 0.4749999940395355,
90
- "rewards/chosen": -0.2730618119239807,
91
- "rewards/margins": 0.03439151123166084,
92
- "rewards/rejected": -0.30745333433151245,
93
  "step": 50
94
  },
95
  {
96
- "epoch": 0.4,
97
- "learning_rate": 3.715752452735703e-07,
98
- "logits/chosen": -1.2504160404205322,
99
- "logits/rejected": -1.3270930051803589,
100
- "logps/chosen": -236.2527313232422,
101
- "logps/rejected": -239.9370574951172,
102
- "loss": 0.6856,
103
- "rewards/accuracies": 0.48750001192092896,
104
- "rewards/chosen": -0.5804754495620728,
105
- "rewards/margins": 0.015670539811253548,
106
- "rewards/rejected": -0.5961459279060364,
107
  "step": 60
108
  },
109
  {
110
- "epoch": 0.47,
111
- "learning_rate": 3.170782694233712e-07,
112
- "logits/chosen": -1.1783835887908936,
113
- "logits/rejected": -1.141601800918579,
114
- "logps/chosen": -263.32073974609375,
115
- "logps/rejected": -272.93450927734375,
116
- "loss": 0.6956,
117
- "rewards/accuracies": 0.612500011920929,
118
- "rewards/chosen": -0.9808699488639832,
119
- "rewards/margins": 0.05901496857404709,
120
- "rewards/rejected": -1.0398849248886108,
121
  "step": 70
122
  },
123
  {
124
- "epoch": 0.54,
125
- "learning_rate": 2.588560207905135e-07,
126
- "logits/chosen": -1.2210887670516968,
127
- "logits/rejected": -1.3275476694107056,
128
- "logps/chosen": -277.7283020019531,
129
- "logps/rejected": -284.2450256347656,
130
- "loss": 0.6953,
131
- "rewards/accuracies": 0.48750001192092896,
132
- "rewards/chosen": -0.8450358510017395,
133
- "rewards/margins": -0.01733619160950184,
134
- "rewards/rejected": -0.8276995420455933,
135
  "step": 80
136
  },
137
  {
138
- "epoch": 0.61,
139
- "learning_rate": 2.001419423371019e-07,
140
- "logits/chosen": -1.2033240795135498,
141
- "logits/rejected": -1.2934813499450684,
142
- "logps/chosen": -233.0209197998047,
143
- "logps/rejected": -232.87161254882812,
144
- "loss": 0.6984,
145
- "rewards/accuracies": 0.5062500238418579,
146
- "rewards/chosen": -0.7631824612617493,
147
- "rewards/margins": -0.014957061037421227,
148
- "rewards/rejected": -0.7482253313064575,
149
  "step": 90
150
  },
151
  {
152
- "epoch": 0.67,
153
- "learning_rate": 1.4419679138889375e-07,
154
- "logits/chosen": -1.5676350593566895,
155
- "logits/rejected": -1.5352352857589722,
156
- "logps/chosen": -243.58340454101562,
157
- "logps/rejected": -249.83670043945312,
158
- "loss": 0.6839,
159
- "rewards/accuracies": 0.6000000238418579,
160
- "rewards/chosen": -0.431363046169281,
161
- "rewards/margins": 0.026667874306440353,
162
- "rewards/rejected": -0.45803093910217285,
163
  "step": 100
164
  },
165
  {
166
- "epoch": 0.74,
167
- "learning_rate": 9.412754953531663e-08,
168
- "logits/chosen": -1.4186036586761475,
169
- "logits/rejected": -1.4321409463882446,
170
- "logps/chosen": -207.4648895263672,
171
- "logps/rejected": -220.63540649414062,
172
- "loss": 0.6783,
173
- "rewards/accuracies": 0.606249988079071,
174
- "rewards/chosen": -0.3499959409236908,
175
- "rewards/margins": 0.08647538721561432,
176
- "rewards/rejected": -0.4364713132381439,
177
  "step": 110
178
  },
179
  {
180
- "epoch": 0.81,
181
- "learning_rate": 5.271487265090163e-08,
182
- "logits/chosen": -1.3899421691894531,
183
- "logits/rejected": -1.4946931600570679,
184
- "logps/chosen": -199.7452392578125,
185
- "logps/rejected": -206.2049102783203,
186
- "loss": 0.6857,
187
- "rewards/accuracies": 0.550000011920929,
188
- "rewards/chosen": -0.31818634271621704,
189
- "rewards/margins": 0.03093295730650425,
190
- "rewards/rejected": -0.34911927580833435,
191
  "step": 120
192
  },
193
  {
194
- "epoch": 0.88,
195
- "learning_rate": 2.2258663809784888e-08,
196
- "logits/chosen": -1.5326082706451416,
197
- "logits/rejected": -1.4976835250854492,
198
- "logps/chosen": -203.8050079345703,
199
- "logps/rejected": -208.89431762695312,
200
- "loss": 0.6865,
201
- "rewards/accuracies": 0.5874999761581421,
202
- "rewards/chosen": -0.27058011293411255,
203
- "rewards/margins": 0.03228816017508507,
204
- "rewards/rejected": -0.3028682768344879,
205
  "step": 130
206
  },
207
  {
208
- "epoch": 0.94,
209
- "learning_rate": 4.45034538815614e-09,
210
- "logits/chosen": -1.4072165489196777,
211
- "logits/rejected": -1.4480218887329102,
212
- "logps/chosen": -210.232666015625,
213
- "logps/rejected": -218.79763793945312,
214
- "loss": 0.6827,
215
- "rewards/accuracies": 0.5625,
216
- "rewards/chosen": -0.29495373368263245,
217
- "rewards/margins": 0.03974684700369835,
218
- "rewards/rejected": -0.3347005844116211,
219
  "step": 140
220
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
221
  {
222
  "epoch": 1.0,
223
- "step": 148,
224
  "total_flos": 0.0,
225
- "train_loss": 0.6894009854342487,
226
- "train_runtime": 9025.6123,
227
- "train_samples_per_second": 2.105,
228
  "train_steps_per_second": 0.016
229
  }
230
  ],
231
  "logging_steps": 10,
232
- "max_steps": 148,
233
  "num_input_tokens_seen": 0,
234
  "num_train_epochs": 1,
235
  "save_steps": 100,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9984,
5
  "eval_steps": 500,
6
+ "global_step": 156,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.01,
13
+ "learning_rate": 3.125e-08,
14
+ "logits/chosen": -1.4567933082580566,
15
+ "logits/rejected": -0.871229887008667,
16
+ "logps/chosen": -244.365234375,
17
+ "logps/rejected": -212.26486206054688,
18
  "loss": 0.6931,
19
  "rewards/accuracies": 0.0,
20
  "rewards/chosen": 0.0,
 
23
  "step": 1
24
  },
25
  {
26
+ "epoch": 0.06,
27
+ "learning_rate": 3.1249999999999997e-07,
28
+ "logits/chosen": -1.83387291431427,
29
+ "logits/rejected": -1.0804697275161743,
30
+ "logps/chosen": -206.00912475585938,
31
+ "logps/rejected": -202.784912109375,
32
+ "loss": 0.6817,
33
+ "rewards/accuracies": 0.5486111044883728,
34
+ "rewards/chosen": -0.039022047072649,
35
+ "rewards/margins": 0.04178649187088013,
36
+ "rewards/rejected": -0.08080853521823883,
37
  "step": 10
38
  },
39
  {
40
  "epoch": 0.13,
41
+ "learning_rate": 4.989935734988097e-07,
42
+ "logits/chosen": -1.0675297975540161,
43
+ "logits/rejected": -0.5359733700752258,
44
+ "logps/chosen": -237.27444458007812,
45
+ "logps/rejected": -251.00753784179688,
46
+ "loss": 0.6561,
47
+ "rewards/accuracies": 0.581250011920929,
48
+ "rewards/chosen": -0.7787758111953735,
49
+ "rewards/margins": 0.11565746366977692,
50
+ "rewards/rejected": -0.8944332003593445,
51
  "step": 20
52
  },
53
  {
54
+ "epoch": 0.19,
55
+ "learning_rate": 4.877641290737883e-07,
56
+ "logits/chosen": -1.095473289489746,
57
+ "logits/rejected": -0.37094515562057495,
58
+ "logps/chosen": -244.32162475585938,
59
+ "logps/rejected": -296.1733703613281,
60
+ "loss": 0.5953,
61
+ "rewards/accuracies": 0.731249988079071,
62
+ "rewards/chosen": -0.6706979870796204,
63
+ "rewards/margins": 0.5164287090301514,
64
+ "rewards/rejected": -1.187126636505127,
65
  "step": 30
66
  },
67
  {
68
+ "epoch": 0.26,
69
+ "learning_rate": 4.646121984004665e-07,
70
+ "logits/chosen": -0.8634458780288696,
71
+ "logits/rejected": 0.12595783174037933,
72
+ "logps/chosen": -242.0459442138672,
73
+ "logps/rejected": -296.41595458984375,
74
+ "loss": 0.5648,
75
+ "rewards/accuracies": 0.78125,
76
+ "rewards/chosen": -0.5677449703216553,
77
+ "rewards/margins": 0.5976042747497559,
78
+ "rewards/rejected": -1.1653492450714111,
79
  "step": 40
80
  },
81
  {
82
+ "epoch": 0.32,
83
+ "learning_rate": 4.3069871595684787e-07,
84
+ "logits/chosen": -0.6954927444458008,
85
+ "logits/rejected": 0.03154268115758896,
86
+ "logps/chosen": -246.68258666992188,
87
+ "logps/rejected": -295.62884521484375,
88
+ "loss": 0.5913,
89
+ "rewards/accuracies": 0.71875,
90
+ "rewards/chosen": -0.8166979551315308,
91
+ "rewards/margins": 0.5098680257797241,
92
+ "rewards/rejected": -1.3265659809112549,
93
  "step": 50
94
  },
95
  {
96
+ "epoch": 0.38,
97
+ "learning_rate": 3.877242453630256e-07,
98
+ "logits/chosen": -0.768271267414093,
99
+ "logits/rejected": 0.022685179486870766,
100
+ "logps/chosen": -245.92782592773438,
101
+ "logps/rejected": -300.2510681152344,
102
+ "loss": 0.5887,
103
+ "rewards/accuracies": 0.731249988079071,
104
+ "rewards/chosen": -0.7170382738113403,
105
+ "rewards/margins": 0.5133967399597168,
106
+ "rewards/rejected": -1.2304350137710571,
107
  "step": 60
108
  },
109
  {
110
+ "epoch": 0.45,
111
+ "learning_rate": 3.378437060203357e-07,
112
+ "logits/chosen": -0.5168389081954956,
113
+ "logits/rejected": 0.45852264761924744,
114
+ "logps/chosen": -256.852294921875,
115
+ "logps/rejected": -309.4953308105469,
116
+ "loss": 0.5836,
117
+ "rewards/accuracies": 0.6875,
118
+ "rewards/chosen": -0.9044780731201172,
119
+ "rewards/margins": 0.5655065178871155,
120
+ "rewards/rejected": -1.4699846506118774,
121
  "step": 70
122
  },
123
  {
124
+ "epoch": 0.51,
125
+ "learning_rate": 2.8355831645441387e-07,
126
+ "logits/chosen": -0.3654092848300934,
127
+ "logits/rejected": 0.10795004665851593,
128
+ "logps/chosen": -251.9696502685547,
129
+ "logps/rejected": -292.9334716796875,
130
+ "loss": 0.5522,
131
+ "rewards/accuracies": 0.675000011920929,
132
+ "rewards/chosen": -0.7978931069374084,
133
+ "rewards/margins": 0.38232654333114624,
134
+ "rewards/rejected": -1.1802196502685547,
135
  "step": 80
136
  },
137
  {
138
+ "epoch": 0.58,
139
+ "learning_rate": 2.2759017277414164e-07,
140
+ "logits/chosen": -0.8108726739883423,
141
+ "logits/rejected": 0.14660978317260742,
142
+ "logps/chosen": -273.36419677734375,
143
+ "logps/rejected": -320.58209228515625,
144
+ "loss": 0.5671,
145
+ "rewards/accuracies": 0.7437499761581421,
146
+ "rewards/chosen": -0.6586915254592896,
147
+ "rewards/margins": 0.6224299669265747,
148
+ "rewards/rejected": -1.2811213731765747,
149
  "step": 90
150
  },
151
  {
152
+ "epoch": 0.64,
153
+ "learning_rate": 1.7274575140626315e-07,
154
+ "logits/chosen": -0.46979203820228577,
155
+ "logits/rejected": 0.5494852066040039,
156
+ "logps/chosen": -272.69427490234375,
157
+ "logps/rejected": -317.7990417480469,
158
+ "loss": 0.5547,
159
+ "rewards/accuracies": 0.706250011920929,
160
+ "rewards/chosen": -0.9002830386161804,
161
+ "rewards/margins": 0.5319327116012573,
162
+ "rewards/rejected": -1.432215690612793,
163
  "step": 100
164
  },
165
  {
166
+ "epoch": 0.7,
167
+ "learning_rate": 1.2177518064852348e-07,
168
+ "logits/chosen": -0.3219306170940399,
169
+ "logits/rejected": 0.26910799741744995,
170
+ "logps/chosen": -251.5453338623047,
171
+ "logps/rejected": -299.8834533691406,
172
+ "loss": 0.56,
173
+ "rewards/accuracies": 0.65625,
174
+ "rewards/chosen": -0.7972058057785034,
175
+ "rewards/margins": 0.43246564269065857,
176
+ "rewards/rejected": -1.2296714782714844,
177
  "step": 110
178
  },
179
  {
180
+ "epoch": 0.77,
181
+ "learning_rate": 7.723433775328384e-08,
182
+ "logits/chosen": -0.37325382232666016,
183
+ "logits/rejected": 0.5774334669113159,
184
+ "logps/chosen": -233.79562377929688,
185
+ "logps/rejected": -328.5582580566406,
186
+ "loss": 0.5585,
187
+ "rewards/accuracies": 0.7749999761581421,
188
+ "rewards/chosen": -0.6402639150619507,
189
+ "rewards/margins": 0.7515830397605896,
190
+ "rewards/rejected": -1.3918468952178955,
191
  "step": 120
192
  },
193
  {
194
+ "epoch": 0.83,
195
+ "learning_rate": 4.1356686569674335e-08,
196
+ "logits/chosen": -0.3119003176689148,
197
+ "logits/rejected": 0.8427650332450867,
198
+ "logps/chosen": -233.98971557617188,
199
+ "logps/rejected": -324.93316650390625,
200
+ "loss": 0.5265,
201
+ "rewards/accuracies": 0.762499988079071,
202
+ "rewards/chosen": -0.7347938418388367,
203
+ "rewards/margins": 0.7224765419960022,
204
+ "rewards/rejected": -1.4572702646255493,
205
  "step": 130
206
  },
207
  {
208
+ "epoch": 0.9,
209
+ "learning_rate": 1.5941282340065697e-08,
210
+ "logits/chosen": -0.20903070271015167,
211
+ "logits/rejected": 0.7928945422172546,
212
+ "logps/chosen": -274.28704833984375,
213
+ "logps/rejected": -331.6188049316406,
214
+ "loss": 0.5484,
215
+ "rewards/accuracies": 0.71875,
216
+ "rewards/chosen": -0.9145911931991577,
217
+ "rewards/margins": 0.5992218255996704,
218
+ "rewards/rejected": -1.5138130187988281,
219
  "step": 140
220
  },
221
+ {
222
+ "epoch": 0.96,
223
+ "learning_rate": 2.2625595580163247e-09,
224
+ "logits/chosen": 0.10685434192419052,
225
+ "logits/rejected": 0.766906201839447,
226
+ "logps/chosen": -257.482666015625,
227
+ "logps/rejected": -326.8499450683594,
228
+ "loss": 0.5539,
229
+ "rewards/accuracies": 0.7250000238418579,
230
+ "rewards/chosen": -0.9127100706100464,
231
+ "rewards/margins": 0.6432833075523376,
232
+ "rewards/rejected": -1.5559935569763184,
233
+ "step": 150
234
+ },
235
  {
236
  "epoch": 1.0,
237
+ "step": 156,
238
  "total_flos": 0.0,
239
+ "train_loss": 0.5776262069359804,
240
+ "train_runtime": 9474.0276,
241
+ "train_samples_per_second": 2.111,
242
  "train_steps_per_second": 0.016
243
  }
244
  ],
245
  "logging_steps": 10,
246
+ "max_steps": 156,
247
  "num_input_tokens_seen": 0,
248
  "num_train_epochs": 1,
249
  "save_steps": 100,