mengshyu committed on
Commit
9bebc2c
1 Parent(s): ad4b6fa

Initial commit

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
added_tokens.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<|endoftext|>": 32000,
3
+ "<|assistant|>": 32001,
4
+ "<|placeholder1|>": 32002,
5
+ "<|placeholder2|>": 32003,
6
+ "<|placeholder3|>": 32004,
7
+ "<|placeholder4|>": 32005,
8
+ "<|system|>": 32006,
9
+ "<|end|>": 32007,
10
+ "<|placeholder5|>": 32008,
11
+ "<|placeholder6|>": 32009,
12
+ "<|user|>": 32010
13
+ }
logs.txt ADDED
@@ -0,0 +1,262 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/195 [00:00<?, ?it/s]
1
 
 
2
  0%| | 0/195 [00:00<?, ?it/s]
3
 
 
4
  0%| | 0/195 [00:00<?, ?it/s]/home/msyu/workspace/venv/lib/python3.10/site-packages/numpy/core/getlimits.py:549: UserWarning: The value of the smallest subnormal for <class 'numpy.float32'> type is zero.
 
 
 
 
5
  1%| | 1/195 [00:01<05:23, 1.67s/it]
6
 
 
7
  1%| | 1/195 [00:01<05:23, 1.67s/it]
8
 
 
9
  1%| | 1/195 [00:01<05:23, 1.67s/it]
10
  2%|▏ | 3/195 [00:01<01:40, 1.91it/s]
11
 
 
12
  2%|▏ | 3/195 [00:01<01:40, 1.91it/s]
13
  2%|▏ | 4/195 [00:02<01:36, 1.99it/s]
14
 
 
15
  2%|▏ | 4/195 [00:02<01:36, 1.99it/s]
16
 
 
17
  2%|▏ | 4/195 [00:02<01:36, 1.99it/s]
18
  3%|▎ | 6/195 [00:02<01:00, 3.13it/s]
19
 
 
20
  3%|▎ | 6/195 [00:02<01:00, 3.13it/s]
21
 
 
22
  3%|▎ | 6/195 [00:02<01:00, 3.13it/s]
23
  4%|▍ | 8/195 [00:02<00:44, 4.23it/s]
24
 
 
25
  4%|▍ | 8/195 [00:02<00:44, 4.23it/s]
26
  5%|▍ | 9/195 [00:03<00:53, 3.46it/s]
27
 
 
28
  5%|▍ | 9/195 [00:03<00:53, 3.46it/s]
29
 
 
30
  5%|▍ | 9/195 [00:03<00:53, 3.46it/s]
31
 
 
32
  5%|▍ | 9/195 [00:03<00:53, 3.46it/s]
33
  6%|▌ | 12/195 [00:03<00:36, 4.96it/s]
34
 
 
35
  6%|▌ | 12/195 [00:03<00:36, 4.96it/s]
36
 
 
37
  6%|▌ | 12/195 [00:03<00:36, 4.96it/s]
38
  7%|▋ | 14/195 [00:03<00:31, 5.70it/s]
39
 
 
40
  7%|▋ | 14/195 [00:03<00:31, 5.70it/s]
41
  8%|▊ | 15/195 [00:04<00:41, 4.35it/s]
42
 
 
43
  8%|▊ | 15/195 [00:04<00:41, 4.35it/s]
44
 
 
45
  8%|▊ | 15/195 [00:04<00:41, 4.35it/s]
46
 
 
47
  8%|▊ | 15/195 [00:04<00:41, 4.35it/s]
48
  9%|▉ | 18/195 [00:04<00:31, 5.56it/s]
49
 
 
50
  9%|▉ | 18/195 [00:04<00:31, 5.56it/s]
51
 
 
52
  9%|▉ | 18/195 [00:04<00:31, 5.56it/s]
53
  10%|█ | 20/195 [00:04<00:28, 6.18it/s]
54
 
 
55
  10%|█ | 20/195 [00:05<00:28, 6.18it/s]
56
  11%|█ | 21/195 [00:05<00:37, 4.64it/s]
57
 
 
58
  11%|█ | 21/195 [00:05<00:37, 4.64it/s]
59
 
 
60
  11%|█ | 21/195 [00:05<00:37, 4.64it/s]
61
 
 
62
  11%|█ | 21/195 [00:05<00:37, 4.64it/s]
63
  12%|█▏ | 24/195 [00:05<00:29, 5.77it/s]
64
 
 
65
  12%|█▏ | 24/195 [00:05<00:29, 5.77it/s]
66
 
 
67
  12%|█▏ | 24/195 [00:05<00:29, 5.77it/s]
68
  13%|█▎ | 26/195 [00:06<00:26, 6.34it/s]
69
 
 
70
  13%|█▎ | 26/195 [00:06<00:26, 6.34it/s]
71
  14%|█▍ | 27/195 [00:06<00:35, 4.75it/s]
72
 
 
73
  14%|█▍ | 27/195 [00:06<00:35, 4.75it/s]
74
 
 
75
  14%|█▍ | 27/195 [00:06<00:35, 4.75it/s]
76
 
 
77
  14%|█▍ | 27/195 [00:06<00:35, 4.75it/s]
78
  15%|█▌ | 30/195 [00:06<00:28, 5.85it/s]
79
 
 
80
  15%|█▌ | 30/195 [00:06<00:28, 5.85it/s]
81
 
 
82
  15%|█▌ | 30/195 [00:06<00:28, 5.85it/s]
83
  16%|█▋ | 32/195 [00:07<00:25, 6.41it/s]
84
 
 
85
  16%|█▋ | 32/195 [00:07<00:25, 6.41it/s]
86
  17%|█▋ | 33/195 [00:07<00:33, 4.78it/s]
87
 
 
88
  17%|█▋ | 33/195 [00:07<00:33, 4.78it/s]
89
 
 
90
  17%|█▋ | 33/195 [00:07<00:33, 4.78it/s]
91
 
 
92
  17%|█▋ | 33/195 [00:07<00:33, 4.78it/s]
93
  18%|█▊ | 36/195 [00:07<00:27, 5.88it/s]
94
 
 
95
  18%|█▊ | 36/195 [00:07<00:27, 5.88it/s]
96
 
 
97
  18%|█▊ | 36/195 [00:07<00:27, 5.88it/s]
98
  19%|█▉ | 38/195 [00:08<00:24, 6.43it/s]
99
 
 
100
  19%|█▉ | 38/195 [00:08<00:24, 6.43it/s]
101
  20%|██ | 39/195 [00:08<00:32, 4.80it/s]
102
 
 
103
  20%|██ | 39/195 [00:08<00:32, 4.80it/s]
104
 
 
105
  20%|██ | 39/195 [00:08<00:32, 4.80it/s]
106
 
 
107
  20%|██ | 39/195 [00:08<00:32, 4.80it/s]
108
  22%|██▏ | 42/195 [00:08<00:25, 5.90it/s]
109
 
 
110
  22%|██▏ | 42/195 [00:08<00:25, 5.90it/s]
111
 
 
112
  22%|██▏ | 42/195 [00:08<00:25, 5.90it/s]
113
  23%|██▎ | 44/195 [00:09<00:23, 6.44it/s]
114
 
 
115
  23%|██▎ | 44/195 [00:09<00:23, 6.44it/s]
116
  23%|██▎ | 45/195 [00:09<00:31, 4.81it/s]
117
 
 
118
  23%|██▎ | 45/195 [00:09<00:31, 4.81it/s]
119
 
 
120
  23%|██▎ | 45/195 [00:09<00:31, 4.81it/s]
121
 
 
122
  23%|██▎ | 45/195 [00:09<00:31, 4.81it/s]
123
  25%|██▍ | 48/195 [00:10<00:24, 5.90it/s]
124
 
 
125
  25%|██▍ | 48/195 [00:10<00:24, 5.90it/s]
126
 
 
127
  25%|██▍ | 48/195 [00:10<00:24, 5.90it/s]
128
  26%|██▌ | 50/195 [00:10<00:22, 6.44it/s]
129
 
 
130
  26%|██▌ | 50/195 [00:10<00:22, 6.44it/s]
131
  26%|██▌ | 51/195 [00:10<00:29, 4.80it/s]
132
 
 
133
  26%|██▌ | 51/195 [00:10<00:29, 4.80it/s]
134
 
 
135
  26%|██▌ | 51/195 [00:10<00:29, 4.80it/s]
136
 
 
137
  26%|██▌ | 51/195 [00:10<00:29, 4.80it/s]
138
  28%|██▊ | 54/195 [00:11<00:23, 5.89it/s]
139
 
 
140
  28%|██▊ | 54/195 [00:11<00:23, 5.89it/s]
141
 
 
142
  28%|██▊ | 54/195 [00:11<00:23, 5.89it/s]
143
  29%|██▊ | 56/195 [00:11<00:21, 6.44it/s]
144
 
 
145
  29%|██▊ | 56/195 [00:11<00:21, 6.44it/s]
146
  29%|██▉ | 57/195 [00:11<00:28, 4.81it/s]
147
 
 
148
  29%|██▉ | 57/195 [00:11<00:28, 4.81it/s]
149
 
 
150
  29%|██▉ | 57/195 [00:11<00:28, 4.81it/s]
151
 
 
152
  29%|██▉ | 57/195 [00:11<00:28, 4.81it/s]
153
  31%|███ | 60/195 [00:12<00:22, 5.89it/s]
154
 
 
155
  31%|███ | 60/195 [00:12<00:22, 5.89it/s]
156
 
 
157
  31%|███ | 60/195 [00:12<00:22, 5.89it/s]
158
  32%|███▏ | 62/195 [00:12<00:20, 6.38it/s]
159
 
 
160
  32%|███▏ | 62/195 [00:12<00:20, 6.38it/s]
161
  32%|███▏ | 63/195 [00:12<00:27, 4.74it/s]
162
 
 
163
  32%|███▏ | 63/195 [00:12<00:27, 4.74it/s]
164
 
 
165
  32%|███▏ | 63/195 [00:12<00:27, 4.74it/s]
166
 
 
167
  32%|███▏ | 63/195 [00:12<00:27, 4.74it/s]
168
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
169
 
 
170
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
171
 
 
172
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
173
 
 
174
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
175
 
 
176
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
177
  35%|███▍ | 68/195 [00:14<00:42, 3.02it/s]
178
 
 
179
  35%|███▍ | 68/195 [00:14<00:42, 3.02it/s]
180
 
 
181
  35%|███▍ | 68/195 [00:14<00:42, 3.02it/s]
182
  36%|███▌ | 70/195 [00:14<00:33, 3.71it/s]
183
 
 
184
  36%|███▌ | 70/195 [00:14<00:33, 3.71it/s]
185
  36%|███▋ | 71/195 [00:15<00:37, 3.30it/s]
186
 
 
187
  36%|███▋ | 71/195 [00:15<00:37, 3.30it/s]
188
 
 
189
  36%|███▋ | 71/195 [00:15<00:37, 3.30it/s]
190
 
 
191
  36%|███▋ | 71/195 [00:15<00:37, 3.30it/s]
192
  38%|███▊ | 74/195 [00:15<00:26, 4.51it/s]
193
 
 
194
  38%|███▊ | 74/195 [00:15<00:26, 4.51it/s]
195
 
 
196
  38%|███▊ | 74/195 [00:15<00:26, 4.51it/s]
197
  39%|███▉ | 76/195 [00:15<00:22, 5.23it/s]
198
 
 
199
  39%|███▉ | 76/195 [00:15<00:22, 5.23it/s]
200
  39%|███▉ | 77/195 [00:16<00:28, 4.16it/s]
201
 
 
202
  39%|███▉ | 77/195 [00:16<00:28, 4.16it/s]
203
 
 
204
  39%|███▉ | 77/195 [00:16<00:28, 4.16it/s]
205
 
 
206
  39%|███▉ | 77/195 [00:16<00:28, 4.16it/s]
207
  41%|████ | 80/195 [00:16<00:21, 5.31it/s]
208
 
 
209
  41%|████ | 80/195 [00:16<00:21, 5.31it/s]
210
 
 
211
  41%|████ | 80/195 [00:16<00:21, 5.31it/s]
212
  42%|████▏ | 82/195 [00:17<00:19, 5.92it/s]
213
 
 
214
  42%|████▏ | 82/195 [00:17<00:19, 5.92it/s]
215
  43%|████▎ | 83/195 [00:17<00:24, 4.50it/s]
216
 
 
217
  43%|████▎ | 83/195 [00:17<00:24, 4.50it/s]
218
 
 
219
  43%|████▎ | 83/195 [00:17<00:24, 4.50it/s]
220
 
 
221
  43%|████▎ | 83/195 [00:17<00:24, 4.50it/s]
222
  44%|████▍ | 86/195 [00:17<00:19, 5.62it/s]
223
 
 
224
  44%|████▍ | 86/195 [00:17<00:19, 5.62it/s]
225
 
 
226
  44%|████▍ | 86/195 [00:17<00:19, 5.62it/s]
227
  45%|████▌ | 88/195 [00:18<00:17, 6.25it/s]
228
 
 
229
  45%|████▌ | 88/195 [00:18<00:17, 6.25it/s]
230
  46%|████▌ | 89/195 [00:18<00:22, 4.73it/s]
231
 
 
232
  46%|████▌ | 89/195 [00:18<00:22, 4.73it/s]
233
 
 
234
  46%|████▌ | 89/195 [00:18<00:22, 4.73it/s]
235
 
 
236
  46%|████▌ | 89/195 [00:18<00:22, 4.73it/s]
237
  47%|████▋ | 92/195 [00:18<00:17, 5.90it/s]
238
 
 
239
  47%|████▋ | 92/195 [00:18<00:17, 5.90it/s]
240
 
 
241
  47%|████▋ | 92/195 [00:18<00:17, 5.90it/s]
242
  48%|████▊ | 94/195 [00:19<00:15, 6.49it/s]
243
 
 
244
  48%|████▊ | 94/195 [00:19<00:15, 6.49it/s]
245
  49%|████▊ | 95/195 [00:19<00:20, 4.85it/s]
246
 
 
247
  49%|████▊ | 95/195 [00:19<00:20, 4.85it/s]
248
 
 
249
  49%|████▊ | 95/195 [00:19<00:20, 4.85it/s]
250
 
 
251
  49%|████▊ | 95/195 [00:19<00:20, 4.85it/s]
252
  50%|█████ | 98/195 [00:19<00:16, 6.01it/s]
253
 
 
254
  50%|█████ | 98/195 [00:19<00:16, 6.01it/s]
255
 
 
256
  50%|█████ | 98/195 [00:19<00:16, 6.01it/s]
257
  51%|█████▏ | 100/195 [00:20<00:14, 6.57it/s]
258
 
 
259
  51%|█████▏ | 100/195 [00:20<00:14, 6.57it/s]
260
  52%|█████▏ | 101/195 [00:20<00:19, 4.88it/s]
261
 
 
262
  52%|█████▏ | 101/195 [00:20<00:19, 4.88it/s]
263
 
 
264
  52%|█████▏ | 101/195 [00:20<00:19, 4.88it/s]
265
 
 
266
  52%|█████▏ | 101/195 [00:20<00:19, 4.88it/s]
267
  53%|█████▎ | 104/195 [00:20<00:15, 6.04it/s]
268
 
 
269
  53%|█████▎ | 104/195 [00:20<00:15, 6.04it/s]
270
 
 
271
  53%|█████▎ | 104/195 [00:20<00:15, 6.04it/s]
272
  54%|█████▍ | 106/195 [00:21<00:13, 6.61it/s]
273
 
 
274
  54%|█████▍ | 106/195 [00:21<00:13, 6.61it/s]
275
  55%|█████▍ | 107/195 [00:21<00:17, 4.90it/s]
276
 
 
277
  55%|█████▍ | 107/195 [00:21<00:17, 4.90it/s]
278
 
 
279
  55%|█████▍ | 107/195 [00:21<00:17, 4.90it/s]
280
 
 
281
  55%|█████▍ | 107/195 [00:21<00:17, 4.90it/s]
282
  56%|█████▋ | 110/195 [00:21<00:14, 6.03it/s]
283
 
 
284
  56%|█████▋ | 110/195 [00:21<00:14, 6.03it/s]
285
 
 
286
  56%|█████▋ | 110/195 [00:21<00:14, 6.03it/s]
287
  57%|█████▋ | 112/195 [00:22<00:12, 6.54it/s]
288
 
 
289
  57%|█████▋ | 112/195 [00:22<00:12, 6.54it/s]
290
  58%|█████▊ | 113/195 [00:22<00:17, 4.79it/s]
291
 
 
292
  58%|█████▊ | 113/195 [00:22<00:17, 4.79it/s]
293
 
 
294
  58%|█████▊ | 113/195 [00:22<00:17, 4.79it/s]
295
 
 
296
  58%|█████▊ | 113/195 [00:22<00:17, 4.79it/s]
297
  59%|█████▉ | 116/195 [00:23<00:13, 5.93it/s]
298
 
 
299
  59%|█████▉ | 116/195 [00:23<00:13, 5.93it/s]
300
 
 
301
  59%|█████▉ | 116/195 [00:23<00:13, 5.93it/s]
302
  61%|██████ | 118/195 [00:23<00:11, 6.51it/s]
303
 
 
304
  61%|██████ | 118/195 [00:23<00:11, 6.51it/s]
305
  61%|██████ | 119/195 [00:23<00:15, 4.86it/s]
306
 
 
307
  61%|██████ | 119/195 [00:23<00:15, 4.86it/s]
308
 
 
309
  61%|██████ | 119/195 [00:23<00:15, 4.86it/s]
310
 
 
311
  61%|██████ | 119/195 [00:23<00:15, 4.86it/s]
312
  63%|██████▎ | 122/195 [00:24<00:12, 6.02it/s]
313
 
 
314
  63%|██████▎ | 122/195 [00:24<00:12, 6.02it/s]
315
 
 
316
  63%|██████▎ | 122/195 [00:24<00:12, 6.02it/s]
317
  64%|██████▎ | 124/195 [00:24<00:10, 6.59it/s]
318
 
 
319
  64%|██████▎ | 124/195 [00:24<00:10, 6.59it/s]
320
  64%|██████▍ | 125/195 [00:24<00:14, 4.89it/s]
321
 
 
322
  64%|██████▍ | 125/195 [00:24<00:14, 4.89it/s]
323
 
 
324
  64%|██████▍ | 125/195 [00:24<00:14, 4.89it/s]
325
 
 
326
  64%|██████▍ | 125/195 [00:24<00:14, 4.89it/s]
327
  66%|██████▌ | 128/195 [00:25<00:11, 6.05it/s]
328
 
 
329
  66%|██████▌ | 128/195 [00:25<00:11, 6.05it/s]
330
 
 
331
  66%|██████▌ | 128/195 [00:25<00:11, 6.05it/s]
332
  67%|██████▋ | 130/195 [00:25<00:09, 6.61it/s]
333
 
 
334
  67%|██████▋ | 130/195 [00:25<00:09, 6.61it/s]
335
  67%|██████▋ | 131/195 [00:25<00:13, 4.90it/s]
336
 
 
337
  67%|██████▋ | 131/195 [00:25<00:13, 4.90it/s]
338
 
 
339
  67%|██████▋ | 131/195 [00:25<00:13, 4.90it/s]
340
 
 
341
  67%|██████▋ | 131/195 [00:25<00:13, 4.90it/s]
342
  69%|██████▊ | 134/195 [00:26<00:10, 6.06it/s]
343
 
 
344
  69%|██████▊ | 134/195 [00:26<00:10, 6.06it/s]
345
 
 
346
  69%|██████▊ | 134/195 [00:26<00:10, 6.06it/s]
347
  70%|██████▉ | 136/195 [00:26<00:08, 6.63it/s]
348
 
 
349
  70%|██████▉ | 136/195 [00:26<00:08, 6.63it/s]
350
  70%|███████ | 137/195 [00:26<00:11, 4.91it/s]
351
 
 
352
  70%|███████ | 137/195 [00:26<00:11, 4.91it/s]
353
 
 
354
  70%|███████ | 137/195 [00:26<00:11, 4.91it/s]
355
 
 
356
  70%|███████ | 137/195 [00:26<00:11, 4.91it/s]
357
  72%|███████▏ | 140/195 [00:27<00:09, 6.05it/s]
358
 
 
359
  72%|███████▏ | 140/195 [00:27<00:09, 6.05it/s]
360
 
 
361
  72%|███████▏ | 140/195 [00:27<00:09, 6.05it/s]
362
  73%|███████▎ | 142/195 [00:27<00:08, 6.60it/s]
363
 
 
364
  73%|███████▎ | 142/195 [00:27<00:08, 6.60it/s]
365
  73%|███████▎ | 143/195 [00:27<00:10, 4.88it/s]
366
 
 
367
  73%|███████▎ | 143/195 [00:27<00:10, 4.88it/s]
368
 
 
369
  73%|███████▎ | 143/195 [00:27<00:10, 4.88it/s]
370
 
 
371
  73%|███████▎ | 143/195 [00:27<00:10, 4.88it/s]
372
  75%|███████▍ | 146/195 [00:28<00:08, 6.03it/s]
373
 
 
374
  75%|███████▍ | 146/195 [00:28<00:08, 6.03it/s]
375
 
 
376
  75%|███████▍ | 146/195 [00:28<00:08, 6.03it/s]
377
  76%|███████▌ | 148/195 [00:28<00:07, 6.58it/s]
378
 
 
379
  76%|███████▌ | 148/195 [00:28<00:07, 6.58it/s]
380
  76%|███████▋ | 149/195 [00:28<00:09, 4.85it/s]
381
 
 
382
  76%|███████▋ | 149/195 [00:28<00:09, 4.85it/s]
383
 
 
384
  76%|███████▋ | 149/195 [00:28<00:09, 4.85it/s]
385
 
 
386
  76%|███████▋ | 149/195 [00:28<00:09, 4.85it/s]
387
  78%|███████▊ | 152/195 [00:29<00:07, 6.00it/s]
388
 
 
389
  78%|███████▊ | 152/195 [00:29<00:07, 6.00it/s]
390
 
 
391
  78%|███████▊ | 152/195 [00:29<00:07, 6.00it/s]
392
 
 
393
  78%|███████▊ | 152/195 [00:29<00:07, 6.00it/s]
394
  79%|███████▉ | 155/195 [00:29<00:05, 6.97it/s]
395
 
 
396
  79%|███████▉ | 155/195 [00:29<00:05, 6.97it/s]
397
  80%|████████ | 156/195 [00:30<00:07, 5.22it/s]
398
 
 
399
  80%|████████ | 156/195 [00:30<00:07, 5.22it/s]
400
 
 
401
  80%|████████ | 156/195 [00:30<00:07, 5.22it/s]
402
 
 
403
  80%|████████ | 156/195 [00:30<00:07, 5.22it/s]
404
  82%|████████▏ | 159/195 [00:30<00:05, 6.24it/s]
405
 
 
406
  82%|████████▏ | 159/195 [00:30<00:05, 6.24it/s]
407
 
 
408
  82%|████████▏ | 159/195 [00:30<00:05, 6.24it/s]
409
  83%|████████▎ | 161/195 [00:30<00:05, 6.75it/s]
410
 
 
411
  83%|████████▎ | 161/195 [00:30<00:05, 6.75it/s]
412
  83%|████████▎ | 162/195 [00:31<00:06, 5.02it/s]
413
 
 
414
  83%|████████▎ | 162/195 [00:31<00:06, 5.02it/s]
415
 
 
416
  83%|████████▎ | 162/195 [00:31<00:06, 5.02it/s]
417
 
 
418
  83%|████████▎ | 162/195 [00:31<00:06, 5.02it/s]
419
  85%|████████▍ | 165/195 [00:31<00:04, 6.13it/s]
420
 
 
421
  85%|████████▍ | 165/195 [00:31<00:04, 6.13it/s]
422
 
 
423
  85%|████████▍ | 165/195 [00:31<00:04, 6.13it/s]
424
  86%|████████▌ | 167/195 [00:31<00:04, 6.67it/s]
425
 
 
426
  86%|████████▌ | 167/195 [00:31<00:04, 6.67it/s]
427
  86%|████████▌ | 168/195 [00:32<00:05, 4.95it/s]
428
 
 
429
  86%|████████▌ | 168/195 [00:32<00:05, 4.95it/s]
430
 
 
431
  86%|████████▌ | 168/195 [00:32<00:05, 4.95it/s]
432
 
 
433
  86%|████████▌ | 168/195 [00:32<00:05, 4.95it/s]
434
  88%|████████▊ | 171/195 [00:32<00:03, 6.09it/s]
435
 
 
436
  88%|████████▊ | 171/195 [00:32<00:03, 6.09it/s]
437
 
 
438
  88%|████████▊ | 171/195 [00:32<00:03, 6.09it/s]
439
  89%|████████▊ | 173/195 [00:32<00:03, 6.64it/s]
440
 
 
441
  89%|████████▊ | 173/195 [00:32<00:03, 6.64it/s]
442
  89%|████████▉ | 174/195 [00:33<00:04, 4.92it/s]
443
 
 
444
  89%|████████▉ | 174/195 [00:33<00:04, 4.92it/s]
445
 
 
446
  89%|████████▉ | 174/195 [00:33<00:04, 4.92it/s]
447
 
 
448
  89%|████████▉ | 174/195 [00:33<00:04, 4.92it/s]
449
  91%|█████████ | 177/195 [00:33<00:02, 6.07it/s]
450
 
 
451
  91%|█████████ | 177/195 [00:33<00:02, 6.07it/s]
452
 
 
453
  91%|█████████ | 177/195 [00:33<00:02, 6.07it/s]
454
  92%|█████████▏| 179/195 [00:33<00:02, 6.63it/s]
455
 
 
456
  92%|█████████▏| 179/195 [00:33<00:02, 6.63it/s]
457
  92%|█████████▏| 180/195 [00:34<00:03, 4.91it/s]
458
 
 
459
  92%|█████████▏| 180/195 [00:34<00:03, 4.91it/s]
460
 
 
461
  92%|█████████▏| 180/195 [00:34<00:03, 4.91it/s]
462
 
 
463
  92%|█████████▏| 180/195 [00:34<00:03, 4.91it/s]
464
  94%|█████████▍| 183/195 [00:34<00:01, 6.07it/s]
465
 
 
466
  94%|█████████▍| 183/195 [00:34<00:01, 6.07it/s]
467
 
 
468
  94%|█████████▍| 183/195 [00:34<00:01, 6.07it/s]
469
  95%|█████████▍| 185/195 [00:34<00:01, 6.63it/s]
470
 
 
471
  95%|█████████▍| 185/195 [00:34<00:01, 6.63it/s]
472
  95%|█████████▌| 186/195 [00:35<00:01, 4.92it/s]
473
 
 
474
  95%|█████████▌| 186/195 [00:35<00:01, 4.92it/s]
475
 
 
476
  95%|█████████▌| 186/195 [00:35<00:01, 4.92it/s]
477
 
 
478
  95%|█████████▌| 186/195 [00:35<00:01, 4.92it/s]
479
  97%|█████████▋| 189/195 [00:35<00:00, 6.07it/s]
480
 
 
481
  97%|█████████▋| 189/195 [00:35<00:00, 6.07it/s]
482
 
 
483
  97%|█████████▋| 189/195 [00:35<00:00, 6.07it/s]
484
  98%|█████████▊| 191/195 [00:35<00:00, 6.64it/s]
485
 
 
486
  98%|█████████▊| 191/195 [00:35<00:00, 6.64it/s]
487
  98%|█████████▊| 192/195 [00:36<00:00, 4.92it/s]
488
 
 
489
  98%|█████████▊| 192/195 [00:36<00:00, 4.92it/s]
490
 
 
491
  98%|█████████▊| 192/195 [00:36<00:00, 4.92it/s]
492
 
 
493
  98%|█████████▊| 192/195 [00:36<00:00, 4.92it/s]
 
 
 
 
 
 
 
 
 
 
 
1
+ /home/msyu/workspace/venv/bin/python -m mlc_llm gen_config /tmp/tmpom_oz7t5/repo --quantization q0f32 --conv-template phi-3 --output /tmp/tmpbu0nfi81
2
+ [2024-05-08 13:43:32] INFO auto_config.py:115: Found model configuration: /tmp/tmpom_oz7t5/repo/config.json
3
+ [2024-05-08 13:43:32] INFO auto_config.py:153: Found model type: phi3. Use `--model-type` to override.
4
+ [2024-05-08 13:43:32] INFO phi3_model.py:53: context_window_size not found in config.json. Falling back to max_position_embeddings (131072)
5
+ [2024-05-08 13:43:32] INFO phi3_model.py:68: prefill_chunk_size defaults to 2048
6
+ [2024-05-08 13:43:32] INFO config.py:106: Overriding max_batch_size from 1 to 80
7
+ [2024-05-08 13:43:32] INFO gen_config.py:255: [generation_config.json] Setting bos_token_id: 1
8
+ [2024-05-08 13:43:32] INFO gen_config.py:255: [generation_config.json] Setting eos_token_id: [32000, 32001, 32007]
9
+ [2024-05-08 13:43:32] INFO gen_config.py:255: [generation_config.json] Setting pad_token_id: 32000
10
+ [2024-05-08 13:43:32] INFO gen_config.py:267: Found tokenizer config: /tmp/tmpom_oz7t5/repo/tokenizer.model. Copying to /tmp/tmpbu0nfi81/tokenizer.model
11
+ [2024-05-08 13:43:32] INFO gen_config.py:267: Found tokenizer config: /tmp/tmpom_oz7t5/repo/tokenizer.json. Copying to /tmp/tmpbu0nfi81/tokenizer.json
12
+ [2024-05-08 13:43:32] INFO gen_config.py:269: Not found tokenizer config: /tmp/tmpom_oz7t5/repo/vocab.json
13
+ [2024-05-08 13:43:32] INFO gen_config.py:269: Not found tokenizer config: /tmp/tmpom_oz7t5/repo/merges.txt
14
+ [2024-05-08 13:43:32] INFO gen_config.py:267: Found tokenizer config: /tmp/tmpom_oz7t5/repo/added_tokens.json. Copying to /tmp/tmpbu0nfi81/added_tokens.json
15
+ [2024-05-08 13:43:32] INFO gen_config.py:267: Found tokenizer config: /tmp/tmpom_oz7t5/repo/tokenizer_config.json. Copying to /tmp/tmpbu0nfi81/tokenizer_config.json
16
+ [2024-05-08 13:43:32] INFO gen_config.py:80: [System default] Setting temperature: 0.7
17
+ [2024-05-08 13:43:32] INFO gen_config.py:80: [System default] Setting presence_penalty: 0.0
18
+ [2024-05-08 13:43:32] INFO gen_config.py:80: [System default] Setting frequency_penalty: 0.0
19
+ [2024-05-08 13:43:32] INFO gen_config.py:80: [System default] Setting repetition_penalty: 1.0
20
+ [2024-05-08 13:43:32] INFO gen_config.py:80: [System default] Setting top_p: 0.95
21
+ [2024-05-08 13:43:32] INFO gen_config.py:80: [System default] Setting mean_gen_len: 128
22
+ [2024-05-08 13:43:32] INFO gen_config.py:80: [System default] Setting max_gen_len: 512
23
+ [2024-05-08 13:43:32] INFO gen_config.py:80: [System default] Setting shift_fill_factor: 0.3
24
+ [2024-05-08 13:43:32] INFO gen_config.py:335: Dumping configuration file to: /tmp/tmpbu0nfi81/mlc-chat-config.json
25
+ /home/msyu/workspace/venv/bin/python -m mlc_llm convert_weight /tmp/tmpom_oz7t5/repo --quantization q0f32 --source-format auto --output /tmp/tmpbu0nfi81
26
+ [2024-05-08 13:43:33] INFO auto_config.py:115: Found model configuration: /tmp/tmpom_oz7t5/repo/config.json
27
+ [2024-05-08 13:43:33] INFO auto_device.py:79: Found device: cuda:0
28
+ [2024-05-08 13:43:34] INFO auto_device.py:88: Not found device: rocm:0
29
+ [2024-05-08 13:43:34] INFO auto_device.py:88: Not found device: metal:0
30
+ [2024-05-08 13:43:35] INFO auto_device.py:88: Not found device: vulkan:0
31
+ [2024-05-08 13:43:36] INFO auto_device.py:79: Found device: opencl:0
32
+ [2024-05-08 13:43:36] INFO auto_device.py:35: Using device: cuda:0
33
+ [2024-05-08 13:43:36] INFO auto_weight.py:70: Finding weights in: /tmp/tmpom_oz7t5/repo
34
+ [2024-05-08 13:43:36] INFO auto_weight.py:136: Not found Huggingface PyTorch
35
+ [2024-05-08 13:43:36] INFO auto_weight.py:143: Found source weight format: huggingface-safetensor. Source configuration: /tmp/tmpom_oz7t5/repo/model.safetensors.index.json
36
+ [2024-05-08 13:43:36] INFO auto_weight.py:106: Using source weight configuration: /tmp/tmpom_oz7t5/repo/model.safetensors.index.json. Use `--source` to override.
37
+ [2024-05-08 13:43:36] INFO auto_weight.py:110: Using source weight format: huggingface-safetensor. Use `--source-format` to override.
38
+ [2024-05-08 13:43:36] INFO auto_config.py:153: Found model type: phi3. Use `--model-type` to override.
39
+ [2024-05-08 13:43:36] INFO phi3_model.py:53: context_window_size not found in config.json. Falling back to max_position_embeddings (131072)
40
+ [2024-05-08 13:43:36] INFO phi3_model.py:68: prefill_chunk_size defaults to 2048
41
+ Weight conversion with arguments:
42
+ --config /tmp/tmpom_oz7t5/repo/config.json
43
+ --quantization NoQuantize(name='q0f32', kind='no-quant', model_dtype='float32')
44
+ --model-type phi3
45
+ --device cuda:0
46
+ --source /tmp/tmpom_oz7t5/repo/model.safetensors.index.json
47
+ --source-format huggingface-safetensor
48
+ --output /tmp/tmpbu0nfi81
49
+ Start storing to cache /tmp/tmpbu0nfi81
50
+
51
  0%| | 0/195 [00:00<?, ?it/s]
52
 
53
+
54
  0%| | 0/195 [00:00<?, ?it/s]
55
 
56
+
57
  0%| | 0/195 [00:00<?, ?it/s]/home/msyu/workspace/venv/lib/python3.10/site-packages/numpy/core/getlimits.py:549: UserWarning: The value of the smallest subnormal for <class 'numpy.float32'> type is zero.
58
+ setattr(self, word, getattr(machar, word).flat[0])
59
+ /home/msyu/workspace/venv/lib/python3.10/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for <class 'numpy.float32'> type is zero.
60
+ return self._float_to_str(self.smallest_subnormal)
61
+
62
  1%| | 1/195 [00:01<05:23, 1.67s/it]
63
 
64
+
65
  1%| | 1/195 [00:01<05:23, 1.67s/it]
66
 
67
+
68
  1%| | 1/195 [00:01<05:23, 1.67s/it]
69
  2%|▏ | 3/195 [00:01<01:40, 1.91it/s]
70
 
71
+
72
  2%|▏ | 3/195 [00:01<01:40, 1.91it/s]
73
  2%|▏ | 4/195 [00:02<01:36, 1.99it/s]
74
 
75
+
76
  2%|▏ | 4/195 [00:02<01:36, 1.99it/s]
77
 
78
+
79
  2%|▏ | 4/195 [00:02<01:36, 1.99it/s]
80
  3%|▎ | 6/195 [00:02<01:00, 3.13it/s]
81
 
82
+
83
  3%|▎ | 6/195 [00:02<01:00, 3.13it/s]
84
 
85
+
86
  3%|▎ | 6/195 [00:02<01:00, 3.13it/s]
87
  4%|▍ | 8/195 [00:02<00:44, 4.23it/s]
88
 
89
+
90
  4%|▍ | 8/195 [00:02<00:44, 4.23it/s]
91
  5%|▍ | 9/195 [00:03<00:53, 3.46it/s]
92
 
93
+
94
  5%|▍ | 9/195 [00:03<00:53, 3.46it/s]
95
 
96
+
97
  5%|▍ | 9/195 [00:03<00:53, 3.46it/s]
98
 
99
+
100
  5%|▍ | 9/195 [00:03<00:53, 3.46it/s]
101
  6%|▌ | 12/195 [00:03<00:36, 4.96it/s]
102
 
103
+
104
  6%|▌ | 12/195 [00:03<00:36, 4.96it/s]
105
 
106
+
107
  6%|▌ | 12/195 [00:03<00:36, 4.96it/s]
108
  7%|▋ | 14/195 [00:03<00:31, 5.70it/s]
109
 
110
+
111
  7%|▋ | 14/195 [00:03<00:31, 5.70it/s]
112
  8%|▊ | 15/195 [00:04<00:41, 4.35it/s]
113
 
114
+
115
  8%|▊ | 15/195 [00:04<00:41, 4.35it/s]
116
 
117
+
118
  8%|▊ | 15/195 [00:04<00:41, 4.35it/s]
119
 
120
+
121
  8%|▊ | 15/195 [00:04<00:41, 4.35it/s]
122
  9%|▉ | 18/195 [00:04<00:31, 5.56it/s]
123
 
124
+
125
  9%|▉ | 18/195 [00:04<00:31, 5.56it/s]
126
 
127
+
128
  9%|▉ | 18/195 [00:04<00:31, 5.56it/s]
129
  10%|█ | 20/195 [00:04<00:28, 6.18it/s]
130
 
131
+
132
  10%|█ | 20/195 [00:05<00:28, 6.18it/s]
133
  11%|█ | 21/195 [00:05<00:37, 4.64it/s]
134
 
135
+
136
  11%|█ | 21/195 [00:05<00:37, 4.64it/s]
137
 
138
+
139
  11%|█ | 21/195 [00:05<00:37, 4.64it/s]
140
 
141
+
142
  11%|█ | 21/195 [00:05<00:37, 4.64it/s]
143
  12%|█▏ | 24/195 [00:05<00:29, 5.77it/s]
144
 
145
+
146
  12%|█▏ | 24/195 [00:05<00:29, 5.77it/s]
147
 
148
+
149
  12%|█▏ | 24/195 [00:05<00:29, 5.77it/s]
150
  13%|█▎ | 26/195 [00:06<00:26, 6.34it/s]
151
 
152
+
153
  13%|█▎ | 26/195 [00:06<00:26, 6.34it/s]
154
  14%|█▍ | 27/195 [00:06<00:35, 4.75it/s]
155
 
156
+
157
  14%|█▍ | 27/195 [00:06<00:35, 4.75it/s]
158
 
159
+
160
  14%|█▍ | 27/195 [00:06<00:35, 4.75it/s]
161
 
162
+
163
  14%|█▍ | 27/195 [00:06<00:35, 4.75it/s]
164
  15%|█▌ | 30/195 [00:06<00:28, 5.85it/s]
165
 
166
+
167
  15%|█▌ | 30/195 [00:06<00:28, 5.85it/s]
168
 
169
+
170
  15%|█▌ | 30/195 [00:06<00:28, 5.85it/s]
171
  16%|█▋ | 32/195 [00:07<00:25, 6.41it/s]
172
 
173
+
174
  16%|█▋ | 32/195 [00:07<00:25, 6.41it/s]
175
  17%|█▋ | 33/195 [00:07<00:33, 4.78it/s]
176
 
177
+
178
  17%|█▋ | 33/195 [00:07<00:33, 4.78it/s]
179
 
180
+
181
  17%|█▋ | 33/195 [00:07<00:33, 4.78it/s]
182
 
183
+
184
  17%|█▋ | 33/195 [00:07<00:33, 4.78it/s]
185
  18%|█▊ | 36/195 [00:07<00:27, 5.88it/s]
186
 
187
+
188
  18%|█▊ | 36/195 [00:07<00:27, 5.88it/s]
189
 
190
+
191
  18%|█▊ | 36/195 [00:07<00:27, 5.88it/s]
192
  19%|█▉ | 38/195 [00:08<00:24, 6.43it/s]
193
 
194
+
195
  19%|█▉ | 38/195 [00:08<00:24, 6.43it/s]
196
  20%|██ | 39/195 [00:08<00:32, 4.80it/s]
197
 
198
+
199
  20%|██ | 39/195 [00:08<00:32, 4.80it/s]
200
 
201
+
202
  20%|██ | 39/195 [00:08<00:32, 4.80it/s]
203
 
204
+
205
  20%|██ | 39/195 [00:08<00:32, 4.80it/s]
206
  22%|██▏ | 42/195 [00:08<00:25, 5.90it/s]
207
 
208
+
209
  22%|██▏ | 42/195 [00:08<00:25, 5.90it/s]
210
 
211
+
212
  22%|██▏ | 42/195 [00:08<00:25, 5.90it/s]
213
  23%|██▎ | 44/195 [00:09<00:23, 6.44it/s]
214
 
215
+
216
  23%|██▎ | 44/195 [00:09<00:23, 6.44it/s]
217
  23%|██▎ | 45/195 [00:09<00:31, 4.81it/s]
218
 
219
+
220
  23%|██▎ | 45/195 [00:09<00:31, 4.81it/s]
221
 
222
+
223
  23%|██▎ | 45/195 [00:09<00:31, 4.81it/s]
224
 
225
+
226
  23%|██▎ | 45/195 [00:09<00:31, 4.81it/s]
227
  25%|██▍ | 48/195 [00:10<00:24, 5.90it/s]
228
 
229
+
230
  25%|██▍ | 48/195 [00:10<00:24, 5.90it/s]
231
 
232
+
233
  25%|██▍ | 48/195 [00:10<00:24, 5.90it/s]
234
  26%|██▌ | 50/195 [00:10<00:22, 6.44it/s]
235
 
236
+
237
  26%|██▌ | 50/195 [00:10<00:22, 6.44it/s]
238
  26%|██▌ | 51/195 [00:10<00:29, 4.80it/s]
239
 
240
+
241
  26%|██▌ | 51/195 [00:10<00:29, 4.80it/s]
242
 
243
+
244
  26%|██▌ | 51/195 [00:10<00:29, 4.80it/s]
245
 
246
+
247
  26%|██▌ | 51/195 [00:10<00:29, 4.80it/s]
248
  28%|██▊ | 54/195 [00:11<00:23, 5.89it/s]
249
 
250
+
251
  28%|██▊ | 54/195 [00:11<00:23, 5.89it/s]
252
 
253
+
254
  28%|██▊ | 54/195 [00:11<00:23, 5.89it/s]
255
  29%|██▊ | 56/195 [00:11<00:21, 6.44it/s]
256
 
257
+
258
  29%|██▊ | 56/195 [00:11<00:21, 6.44it/s]
259
  29%|██▉ | 57/195 [00:11<00:28, 4.81it/s]
260
 
261
+
262
  29%|██▉ | 57/195 [00:11<00:28, 4.81it/s]
263
 
264
+
265
  29%|██▉ | 57/195 [00:11<00:28, 4.81it/s]
266
 
267
+
268
  29%|██▉ | 57/195 [00:11<00:28, 4.81it/s]
269
  31%|███ | 60/195 [00:12<00:22, 5.89it/s]
270
 
271
+
272
  31%|███ | 60/195 [00:12<00:22, 5.89it/s]
273
 
274
+
275
  31%|███ | 60/195 [00:12<00:22, 5.89it/s]
276
  32%|███▏ | 62/195 [00:12<00:20, 6.38it/s]
277
 
278
+
279
  32%|███▏ | 62/195 [00:12<00:20, 6.38it/s]
280
  32%|███▏ | 63/195 [00:12<00:27, 4.74it/s]
281
 
282
+
283
  32%|███▏ | 63/195 [00:12<00:27, 4.74it/s]
284
 
285
+
286
  32%|███▏ | 63/195 [00:12<00:27, 4.74it/s]
287
 
288
+
289
  32%|███▏ | 63/195 [00:12<00:27, 4.74it/s]
290
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
291
 
292
+
293
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
294
 
295
+
296
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
297
 
298
+
299
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
300
 
301
+
302
  34%|███▍ | 66/195 [00:13<00:22, 5.84it/s]
303
  35%|███▍ | 68/195 [00:14<00:42, 3.02it/s]
304
 
305
+
306
  35%|███▍ | 68/195 [00:14<00:42, 3.02it/s]
307
 
308
+
309
  35%|███▍ | 68/195 [00:14<00:42, 3.02it/s]
310
  36%|███▌ | 70/195 [00:14<00:33, 3.71it/s]
311
 
312
+
313
  36%|███▌ | 70/195 [00:14<00:33, 3.71it/s]
314
  36%|███▋ | 71/195 [00:15<00:37, 3.30it/s]
315
 
316
+
317
  36%|███▋ | 71/195 [00:15<00:37, 3.30it/s]
318
 
319
+
320
  36%|███▋ | 71/195 [00:15<00:37, 3.30it/s]
321
 
322
+
323
  36%|███▋ | 71/195 [00:15<00:37, 3.30it/s]
324
  38%|███▊ | 74/195 [00:15<00:26, 4.51it/s]
325
 
326
+
327
  38%|███▊ | 74/195 [00:15<00:26, 4.51it/s]
328
 
329
+
330
  38%|███▊ | 74/195 [00:15<00:26, 4.51it/s]
331
  39%|███▉ | 76/195 [00:15<00:22, 5.23it/s]
332
 
333
+
334
  39%|███▉ | 76/195 [00:15<00:22, 5.23it/s]
335
  39%|███▉ | 77/195 [00:16<00:28, 4.16it/s]
336
 
337
+
338
  39%|███▉ | 77/195 [00:16<00:28, 4.16it/s]
339
 
340
+
341
  39%|███▉ | 77/195 [00:16<00:28, 4.16it/s]
342
 
343
+
344
  39%|███▉ | 77/195 [00:16<00:28, 4.16it/s]
345
  41%|████ | 80/195 [00:16<00:21, 5.31it/s]
346
 
347
+
348
  41%|████ | 80/195 [00:16<00:21, 5.31it/s]
349
 
350
+
351
  41%|████ | 80/195 [00:16<00:21, 5.31it/s]
352
  42%|████▏ | 82/195 [00:17<00:19, 5.92it/s]
353
 
354
+
355
  42%|████▏ | 82/195 [00:17<00:19, 5.92it/s]
356
  43%|████▎ | 83/195 [00:17<00:24, 4.50it/s]
357
 
358
+
359
  43%|████▎ | 83/195 [00:17<00:24, 4.50it/s]
360
 
361
+
362
  43%|████▎ | 83/195 [00:17<00:24, 4.50it/s]
363
 
364
+
365
  43%|████▎ | 83/195 [00:17<00:24, 4.50it/s]
366
  44%|████▍ | 86/195 [00:17<00:19, 5.62it/s]
367
 
368
+
369
  44%|████▍ | 86/195 [00:17<00:19, 5.62it/s]
370
 
371
+
372
  44%|████▍ | 86/195 [00:17<00:19, 5.62it/s]
373
  45%|████▌ | 88/195 [00:18<00:17, 6.25it/s]
374
 
375
+
376
  45%|████▌ | 88/195 [00:18<00:17, 6.25it/s]
377
  46%|████▌ | 89/195 [00:18<00:22, 4.73it/s]
378
 
379
+
380
  46%|████▌ | 89/195 [00:18<00:22, 4.73it/s]
381
 
382
+
383
  46%|████▌ | 89/195 [00:18<00:22, 4.73it/s]
384
 
385
+
386
  46%|████▌ | 89/195 [00:18<00:22, 4.73it/s]
387
  47%|████▋ | 92/195 [00:18<00:17, 5.90it/s]
388
 
389
+
390
  47%|████▋ | 92/195 [00:18<00:17, 5.90it/s]
391
 
392
+
393
  47%|████▋ | 92/195 [00:18<00:17, 5.90it/s]
394
  48%|████▊ | 94/195 [00:19<00:15, 6.49it/s]
395
 
396
+
397
  48%|████▊ | 94/195 [00:19<00:15, 6.49it/s]
398
  49%|████▊ | 95/195 [00:19<00:20, 4.85it/s]
399
 
400
+
401
  49%|████▊ | 95/195 [00:19<00:20, 4.85it/s]
402
 
403
+
404
  49%|████▊ | 95/195 [00:19<00:20, 4.85it/s]
405
 
406
+
407
  49%|████▊ | 95/195 [00:19<00:20, 4.85it/s]
408
  50%|█████ | 98/195 [00:19<00:16, 6.01it/s]
409
 
410
+
411
  50%|█████ | 98/195 [00:19<00:16, 6.01it/s]
412
 
413
+
414
  50%|█████ | 98/195 [00:19<00:16, 6.01it/s]
415
  51%|█████▏ | 100/195 [00:20<00:14, 6.57it/s]
416
 
417
+
418
  51%|█████▏ | 100/195 [00:20<00:14, 6.57it/s]
419
  52%|█████▏ | 101/195 [00:20<00:19, 4.88it/s]
420
 
421
+
422
  52%|█████▏ | 101/195 [00:20<00:19, 4.88it/s]
423
 
424
+
425
  52%|█████▏ | 101/195 [00:20<00:19, 4.88it/s]
426
 
427
+
428
  52%|█████▏ | 101/195 [00:20<00:19, 4.88it/s]
429
  53%|█████▎ | 104/195 [00:20<00:15, 6.04it/s]
430
 
431
+
432
  53%|█████▎ | 104/195 [00:20<00:15, 6.04it/s]
433
 
434
+
435
  53%|█████▎ | 104/195 [00:20<00:15, 6.04it/s]
436
  54%|█████▍ | 106/195 [00:21<00:13, 6.61it/s]
437
 
438
+
439
  54%|█████▍ | 106/195 [00:21<00:13, 6.61it/s]
440
  55%|█████▍ | 107/195 [00:21<00:17, 4.90it/s]
441
 
442
+
443
  55%|█████▍ | 107/195 [00:21<00:17, 4.90it/s]
444
 
445
+
446
  55%|█████▍ | 107/195 [00:21<00:17, 4.90it/s]
447
 
448
+
449
  55%|█████▍ | 107/195 [00:21<00:17, 4.90it/s]
450
  56%|█████▋ | 110/195 [00:21<00:14, 6.03it/s]
451
 
452
+
453
  56%|█████▋ | 110/195 [00:21<00:14, 6.03it/s]
454
 
455
+
456
  56%|█████▋ | 110/195 [00:21<00:14, 6.03it/s]
457
  57%|█████▋ | 112/195 [00:22<00:12, 6.54it/s]
458
 
459
+
460
  57%|█████▋ | 112/195 [00:22<00:12, 6.54it/s]
461
  58%|█████▊ | 113/195 [00:22<00:17, 4.79it/s]
462
 
463
+
464
  58%|█████▊ | 113/195 [00:22<00:17, 4.79it/s]
465
 
466
+
467
  58%|█████▊ | 113/195 [00:22<00:17, 4.79it/s]
468
 
469
+
470
  58%|█████▊ | 113/195 [00:22<00:17, 4.79it/s]
471
  59%|█████▉ | 116/195 [00:23<00:13, 5.93it/s]
472
 
473
+
474
  59%|█████▉ | 116/195 [00:23<00:13, 5.93it/s]
475
 
476
+
477
  59%|█████▉ | 116/195 [00:23<00:13, 5.93it/s]
478
  61%|██████ | 118/195 [00:23<00:11, 6.51it/s]
479
 
480
+
481
  61%|██████ | 118/195 [00:23<00:11, 6.51it/s]
482
  61%|██████ | 119/195 [00:23<00:15, 4.86it/s]
483
 
484
+
485
  61%|██████ | 119/195 [00:23<00:15, 4.86it/s]
486
 
487
+
488
  61%|██████ | 119/195 [00:23<00:15, 4.86it/s]
489
 
490
+
491
  61%|██████ | 119/195 [00:23<00:15, 4.86it/s]
492
  63%|██████▎ | 122/195 [00:24<00:12, 6.02it/s]
493
 
494
+
495
  63%|██████▎ | 122/195 [00:24<00:12, 6.02it/s]
496
 
497
+
498
  63%|██████▎ | 122/195 [00:24<00:12, 6.02it/s]
499
  64%|██████▎ | 124/195 [00:24<00:10, 6.59it/s]
500
 
501
+
502
  64%|██████▎ | 124/195 [00:24<00:10, 6.59it/s]
503
  64%|██████▍ | 125/195 [00:24<00:14, 4.89it/s]
504
 
505
+
506
  64%|██████▍ | 125/195 [00:24<00:14, 4.89it/s]
507
 
508
+
509
  64%|██████▍ | 125/195 [00:24<00:14, 4.89it/s]
510
 
511
+
512
  64%|██████▍ | 125/195 [00:24<00:14, 4.89it/s]
513
  66%|██████▌ | 128/195 [00:25<00:11, 6.05it/s]
514
 
515
+
516
  66%|██████▌ | 128/195 [00:25<00:11, 6.05it/s]
517
 
518
+
519
  66%|██████▌ | 128/195 [00:25<00:11, 6.05it/s]
520
  67%|██████▋ | 130/195 [00:25<00:09, 6.61it/s]
521
 
522
+
523
  67%|██████▋ | 130/195 [00:25<00:09, 6.61it/s]
524
  67%|██████▋ | 131/195 [00:25<00:13, 4.90it/s]
525
 
526
+
527
  67%|██████▋ | 131/195 [00:25<00:13, 4.90it/s]
528
 
529
+
530
  67%|██████▋ | 131/195 [00:25<00:13, 4.90it/s]
531
 
532
+
533
  67%|██████▋ | 131/195 [00:25<00:13, 4.90it/s]
534
  69%|██████▊ | 134/195 [00:26<00:10, 6.06it/s]
535
 
536
+
537
  69%|██████▊ | 134/195 [00:26<00:10, 6.06it/s]
538
 
539
+
540
  69%|██████▊ | 134/195 [00:26<00:10, 6.06it/s]
541
  70%|██████▉ | 136/195 [00:26<00:08, 6.63it/s]
542
 
543
+
544
  70%|██████▉ | 136/195 [00:26<00:08, 6.63it/s]
545
  70%|███████ | 137/195 [00:26<00:11, 4.91it/s]
546
 
547
+
548
  70%|███████ | 137/195 [00:26<00:11, 4.91it/s]
549
 
550
+
551
  70%|███████ | 137/195 [00:26<00:11, 4.91it/s]
552
 
553
+
554
  70%|███████ | 137/195 [00:26<00:11, 4.91it/s]
555
  72%|███████▏ | 140/195 [00:27<00:09, 6.05it/s]
556
 
557
+
558
  72%|███████▏ | 140/195 [00:27<00:09, 6.05it/s]
559
 
560
+
561
  72%|███████▏ | 140/195 [00:27<00:09, 6.05it/s]
562
  73%|███████▎ | 142/195 [00:27<00:08, 6.60it/s]
563
 
564
+
565
  73%|███████▎ | 142/195 [00:27<00:08, 6.60it/s]
566
  73%|███████▎ | 143/195 [00:27<00:10, 4.88it/s]
567
 
568
+
569
  73%|███████▎ | 143/195 [00:27<00:10, 4.88it/s]
570
 
571
+
572
  73%|███████▎ | 143/195 [00:27<00:10, 4.88it/s]
573
 
574
+
575
  73%|███████▎ | 143/195 [00:27<00:10, 4.88it/s]
576
  75%|███████▍ | 146/195 [00:28<00:08, 6.03it/s]
577
 
578
+
579
  75%|███████▍ | 146/195 [00:28<00:08, 6.03it/s]
580
 
581
+
582
  75%|███████▍ | 146/195 [00:28<00:08, 6.03it/s]
583
  76%|███████▌ | 148/195 [00:28<00:07, 6.58it/s]
584
 
585
+
586
  76%|███████▌ | 148/195 [00:28<00:07, 6.58it/s]
587
  76%|███████▋ | 149/195 [00:28<00:09, 4.85it/s]
588
 
589
+
590
  76%|███████▋ | 149/195 [00:28<00:09, 4.85it/s]
591
 
592
+
593
  76%|███████▋ | 149/195 [00:28<00:09, 4.85it/s]
594
 
595
+
596
  76%|███████▋ | 149/195 [00:28<00:09, 4.85it/s]
597
  78%|███████▊ | 152/195 [00:29<00:07, 6.00it/s]
598
 
599
+
600
  78%|███████▊ | 152/195 [00:29<00:07, 6.00it/s]
601
 
602
+
603
  78%|███████▊ | 152/195 [00:29<00:07, 6.00it/s]
604
 
605
+
606
  78%|███████▊ | 152/195 [00:29<00:07, 6.00it/s]
607
  79%|███████▉ | 155/195 [00:29<00:05, 6.97it/s]
608
 
609
+
610
  79%|███████▉ | 155/195 [00:29<00:05, 6.97it/s]
611
  80%|████████ | 156/195 [00:30<00:07, 5.22it/s]
612
 
613
+
614
  80%|████████ | 156/195 [00:30<00:07, 5.22it/s]
615
 
616
+
617
  80%|████████ | 156/195 [00:30<00:07, 5.22it/s]
618
 
619
+
620
  80%|████████ | 156/195 [00:30<00:07, 5.22it/s]
621
  82%|████████▏ | 159/195 [00:30<00:05, 6.24it/s]
622
 
623
+
624
  82%|████████▏ | 159/195 [00:30<00:05, 6.24it/s]
625
 
626
+
627
  82%|████████▏ | 159/195 [00:30<00:05, 6.24it/s]
628
  83%|████████▎ | 161/195 [00:30<00:05, 6.75it/s]
629
 
630
+
631
  83%|████████▎ | 161/195 [00:30<00:05, 6.75it/s]
632
  83%|████████▎ | 162/195 [00:31<00:06, 5.02it/s]
633
 
634
+
635
  83%|████████▎ | 162/195 [00:31<00:06, 5.02it/s]
636
 
637
+
638
  83%|████████▎ | 162/195 [00:31<00:06, 5.02it/s]
639
 
640
+
641
  83%|████████▎ | 162/195 [00:31<00:06, 5.02it/s]
642
  85%|████████▍ | 165/195 [00:31<00:04, 6.13it/s]
643
 
644
+
645
  85%|████████▍ | 165/195 [00:31<00:04, 6.13it/s]
646
 
647
+
648
  85%|████████▍ | 165/195 [00:31<00:04, 6.13it/s]
649
  86%|████████▌ | 167/195 [00:31<00:04, 6.67it/s]
650
 
651
+
652
  86%|████████▌ | 167/195 [00:31<00:04, 6.67it/s]
653
  86%|████████▌ | 168/195 [00:32<00:05, 4.95it/s]
654
 
655
+
656
  86%|████████▌ | 168/195 [00:32<00:05, 4.95it/s]
657
 
658
+
659
  86%|████████▌ | 168/195 [00:32<00:05, 4.95it/s]
660
 
661
+
662
  86%|████████▌ | 168/195 [00:32<00:05, 4.95it/s]
663
  88%|████████▊ | 171/195 [00:32<00:03, 6.09it/s]
664
 
665
+
666
  88%|████████▊ | 171/195 [00:32<00:03, 6.09it/s]
667
 
668
+
669
  88%|████████▊ | 171/195 [00:32<00:03, 6.09it/s]
670
  89%|████████▊ | 173/195 [00:32<00:03, 6.64it/s]
671
 
672
+
673
  89%|████████▊ | 173/195 [00:32<00:03, 6.64it/s]
674
  89%|████████▉ | 174/195 [00:33<00:04, 4.92it/s]
675
 
676
+
677
  89%|████████▉ | 174/195 [00:33<00:04, 4.92it/s]
678
 
679
+
680
  89%|████████▉ | 174/195 [00:33<00:04, 4.92it/s]
681
 
682
+
683
  89%|████████▉ | 174/195 [00:33<00:04, 4.92it/s]
684
  91%|█████████ | 177/195 [00:33<00:02, 6.07it/s]
685
 
686
+
687
  91%|█████████ | 177/195 [00:33<00:02, 6.07it/s]
688
 
689
+
690
  91%|█████████ | 177/195 [00:33<00:02, 6.07it/s]
691
  92%|█████████▏| 179/195 [00:33<00:02, 6.63it/s]
692
 
693
+
694
  92%|█████████▏| 179/195 [00:33<00:02, 6.63it/s]
695
  92%|█████████▏| 180/195 [00:34<00:03, 4.91it/s]
696
 
697
+
698
  92%|█████████▏| 180/195 [00:34<00:03, 4.91it/s]
699
 
700
+
701
  92%|█████████▏| 180/195 [00:34<00:03, 4.91it/s]
702
 
703
+
704
  92%|█████████▏| 180/195 [00:34<00:03, 4.91it/s]
705
  94%|█████████▍| 183/195 [00:34<00:01, 6.07it/s]
706
 
707
+
708
  94%|█████████▍| 183/195 [00:34<00:01, 6.07it/s]
709
 
710
+
711
  94%|█████████▍| 183/195 [00:34<00:01, 6.07it/s]
712
  95%|█████████▍| 185/195 [00:34<00:01, 6.63it/s]
713
 
714
+
715
  95%|█████████▍| 185/195 [00:34<00:01, 6.63it/s]
716
  95%|█████████▌| 186/195 [00:35<00:01, 4.92it/s]
717
 
718
+
719
  95%|█████████▌| 186/195 [00:35<00:01, 4.92it/s]
720
 
721
+
722
  95%|█████████▌| 186/195 [00:35<00:01, 4.92it/s]
723
 
724
+
725
  95%|█████████▌| 186/195 [00:35<00:01, 4.92it/s]
726
  97%|█████████▋| 189/195 [00:35<00:00, 6.07it/s]
727
 
728
+
729
  97%|█████████▋| 189/195 [00:35<00:00, 6.07it/s]
730
 
731
+
732
  97%|█████████▋| 189/195 [00:35<00:00, 6.07it/s]
733
  98%|█████████▊| 191/195 [00:35<00:00, 6.64it/s]
734
 
735
+
736
  98%|█████████▊| 191/195 [00:35<00:00, 6.64it/s]
737
  98%|█████████▊| 192/195 [00:36<00:00, 4.92it/s]
738
 
739
+
740
  98%|█████████▊| 192/195 [00:36<00:00, 4.92it/s]
741
 
742
+
743
  98%|█████████▊| 192/195 [00:36<00:00, 4.92it/s]
744
 
745
+
746
  98%|█████████▊| 192/195 [00:36<00:00, 4.92it/s]
747
+ [2024-05-08 13:44:14] INFO huggingface_loader.py:196: Unloading HF weight file: /tmp/tmpom_oz7t5/repo/model-00001-of-00002.safetensors
748
+ [2024-05-08 13:44:14] INFO stats.py:76: Time usage: HF loading: 1.466 sec; Pre-quantization mapping: 1.680 sec; Quantization: 0.000 sec
749
+ [2024-05-08 13:44:14] INFO stats.py:90: RAM usage: Peak RAM: 9.262 GB. Total bytes loaded from disk: 14.235 GB
750
+ [2024-05-08 13:44:14] INFO convert_weight.py:155: Parameter size after quantization: 14.235 GB
751
+ [2024-05-08 13:44:14] INFO convert_weight.py:160: Total parameters: 3,821,079,552
752
+ [2024-05-08 13:44:14] INFO convert_weight.py:161: Bits per parameter: 32.000
753
+ [2024-05-08 13:44:14] INFO convert_weight.py:166: Saved to directory: /tmp/tmpbu0nfi81
754
+
755
+ All finished, 130 total shards committed, record saved to /tmp/tmpbu0nfi81/ndarray-cache.json
756
+ Also saved a bf16 record to /tmp/tmpbu0nfi81/ndarray-cache-b16.json
mlc-chat-config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "phi3",
3
+ "quantization": "q0f32",
4
+ "model_config": {
5
+ "model_type": "phi3",
6
+ "hidden_size": 3072,
7
+ "vocab_size": 32064,
8
+ "num_hidden_layers": 32,
9
+ "num_attention_heads": 32,
10
+ "intermediate_size": 8192,
11
+ "rms_norm_eps": 1e-05,
12
+ "num_key_value_heads": 32,
13
+ "position_embedding_base": 10000.0,
14
+ "context_window_size": 131072,
15
+ "prefill_chunk_size": 2048,
16
+ "head_dim": 96,
17
+ "tensor_parallel_shards": 1,
18
+ "max_batch_size": 80
19
+ },
20
+ "vocab_size": 32064,
21
+ "context_window_size": 131072,
22
+ "sliding_window_size": -1,
23
+ "prefill_chunk_size": 2048,
24
+ "attention_sink_size": -1,
25
+ "tensor_parallel_shards": 1,
26
+ "mean_gen_len": 128,
27
+ "max_gen_len": 512,
28
+ "shift_fill_factor": 0.3,
29
+ "temperature": 0.7,
30
+ "presence_penalty": 0.0,
31
+ "frequency_penalty": 0.0,
32
+ "repetition_penalty": 1.0,
33
+ "top_p": 0.95,
34
+ "conv_template": {
35
+ "name": "phi-3",
36
+ "system_template": "<|system|>\n{system_message}",
37
+ "system_message": "You are a helpful digital assistant. Please provide safe, ethical and accurate information to the user.",
38
+ "system_prefix_token_ids": [
39
+ 1
40
+ ],
41
+ "add_role_after_system_message": true,
42
+ "roles": {
43
+ "user": "<|user|>",
44
+ "assistant": "<|assistant|>"
45
+ },
46
+ "role_templates": {
47
+ "user": "{user_message}",
48
+ "assistant": "{assistant_message}",
49
+ "tool": "{tool_message}"
50
+ },
51
+ "messages": [],
52
+ "seps": [
53
+ "<|end|>\n"
54
+ ],
55
+ "role_content_sep": "\n",
56
+ "role_empty_sep": "\n",
57
+ "stop_str": [
58
+ "<|endoftext|>"
59
+ ],
60
+ "stop_token_ids": [
61
+ 32000,
62
+ 32001,
63
+ 32007
64
+ ],
65
+ "function_string": "",
66
+ "use_function_calling": false
67
+ },
68
+ "pad_token_id": 32000,
69
+ "bos_token_id": 1,
70
+ "eos_token_id": [
71
+ 32000,
72
+ 32001,
73
+ 32007
74
+ ],
75
+ "tokenizer_files": [
76
+ "tokenizer.model",
77
+ "tokenizer.json",
78
+ "added_tokens.json",
79
+ "tokenizer_config.json"
80
+ ],
81
+ "token_table_postproc_method": "byte_fallback",
82
+ "version": "0.1.0"
83
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:369e6479cbd0e85f4adf9dbd67636386f6b90893c9c5123c40161521518a2fa9
3
+ size 197001216
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:578ab6b7d6995b49291f4839dcd937c888b9c683bdca14b91c62592629634137
3
+ size 50331648
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5739d64c685f6fb3372701400d4834a1a1f517a4f81681f9fac0e495b65f181
3
+ size 56623104
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23784b6276d8b0a0017460757e601dd8bd97698b61dd3e95e45324a9c585ba71
3
+ size 18874368
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a30f025d5e0ec7fbbbf832af148e0697cb3a4216e3dd6f4e1ec757a6b3c92bb
3
+ size 50331648
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec95af4556a3f142f2044c508296727c347cffdf8b68ba1ebd8f0e6ac82a9842
3
+ size 100663296
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4ee8dbcf88d2907736f4b6577a596fd220e1397e83843b37eeb8dcf240a0fc3
3
+ size 18874368
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a4c795f42cd3474c443fc88ffc9bf7c0f9fed37e53684a7e18bedb0bb66b08d
3
+ size 56623104
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20a9444ffb50b0d432ebd182457e071c97f061dafe1ff4ebe7751d1a2cd68dd3
3
+ size 50331648
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:225baa887fa999546952fee1a992c55835a30b4aa0a4f3fc714e5805eafda856
3
+ size 100663296
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2dbd10126377521d32ddb484372030892e3a8bb33034d97d9830595a65bb732
3
+ size 18874368
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c637da00c8856bb5582ff2d4b5096dfbcc0de4d48c017260a9e643450ca68958
3
+ size 56623104
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6021d9f4a542555b74bf80ab5a589a8770d2116ff1844d7b5f63e4d2048d8e75
3
+ size 50331648
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bafbb60145a31c43f2ce7d9dcc78407c79ace0b6f490643f8c36091a0d7b5c43
3
+ size 50331648
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36d82dbb1a6e00bce71e532cecc58a47d3c49169493a3289ec5fcee6d60946c0
3
+ size 100663296
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bc8b14dc4df304b2189a17c4e47b8cdd534e0acb1ec4929a6a692e75e506b69
3
+ size 18874368
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b55107f28d4d1a0c09c3cb28e914cbfcd65a7708015aec624da3d486452ba5fc
3
+ size 56623104
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:699492fb0cff81bc5c007863c69eedf1be3fe31186c606836a36e2e6250b10b1
3
+ size 50331648
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a90a6949ee1dd8189e9ddb1008f0e44d0970d189e3618f11eb67dcb1ed8ec9c
3
+ size 100663296
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:184d082a86250e4226d980a8e59ac6c0c7bb4f3db16d84a64f70f501aba7ce4f
3
+ size 18874368
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9950a231856e4b416f7d7152ca38581363ebdac23a39404f7270dd21fd362e3
3
+ size 56623104
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a5ebfa765717a992be6254113d2751c14dbd25a0a91ad588fb147189cb76bda
3
+ size 50331648
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:206e6479e9bcb52fd843d010e6599fb5cb6c3e67f3ff61af73e61e5ebf3bd121
3
+ size 100663296
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e2642dd319c6f01577013ae7b6dd4321f418c78e90342798f143598d38de1b1
3
+ size 18874368
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:823816e41f84e9a67b90cd20a96c63ede16094456cca28eaf2ce87af52937368
3
+ size 100663296
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9061d71341f302e32b0f4f1827683b1f3d33d3d7451e58117c17d1ca1ee52e31
3
+ size 56623104
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d2a90ccc503f1cd61f688b21a79e124a139e95add977f5cf9f705a51017d8b8
3
+ size 50331648
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcbaa7e45069319220f6d923a8f682f5dc31168cdc289e693ac74d3a650ac67c
3
+ size 100663296
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbd9b49091e07d5cd91cbd053197ee9e220e24367d2576ef25ffec8ac95f4b21
3
+ size 18874368
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee1b09c97a4ab78b2f52cebac8223a312fa7ebe0fc49d257cb9d2a2cdb3070f7
3
+ size 56623104
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f5f5e7ec83acb261c27cdd32468e2215464a4ac56b2ac2cc5c3dcf9958f6da9
3
+ size 50331648
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b80a43959420fb0d4f5bb4925a94d3547175a26e89262699f36ec4237ffe55ab
3
+ size 100663296
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21bb1e6eb074a791bffc85d8e22f8df0adcd77439a407ca1b624e3492e06fea1
3
+ size 18874368
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf4be9f0ed4ad8c5dde04e72da06d5fdba3883094ca0c9bc64849ce473d2048f
3
+ size 56623104
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b331d8030ad05b1a895107f55a21ad407bf43dc506f9e26c23f0ff556af9f54c
3
+ size 19273728
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:998600ff2c000d5d0e85856ae063ea46a7215f5109548978465b3700e4269a37
3
+ size 18874368
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:597acd9d2339ff81bed53629ac699718b0743ba65b6fd11050d08484eeb16176
3
+ size 56623104
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8cff80ebe058849beac249fd8fe6b719010c23c387cf98a7f803c6375523aef
3
+ size 50331648
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cfd14bdabaf1e7685def5a8566b66b3fe2c5f7f9b60d42c49c48c9c7ed7f174
3
+ size 100663296
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2831f366fd5633235db341940ad43f34b0a277f35ebb7d42f3c39a71f2ab7bb6
3
+ size 18874368
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e686f5a26aaa885a6918f2a616e0eb7e8bfd12656b38b5d35189541dbc8e09f2
3
+ size 56623104
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ced1d5b3f0bdb6e3150e5251699d9074945d236d37c75033ccbbb5dca5f8012f
3
+ size 50331648
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b86950eb9d8961253692f3310da8a114ab54dedbd2c456fb13027593655c84e
3
+ size 100663296
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:035180a81e2320076d40b9a2c2d6c1cbebd0c9e9e7bf2a7ea824c2949248c953
3
+ size 100663296
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:153292ba056306567067131f224860d0a7e78f0034fdb2c45013bda2f505a817
3
+ size 18874368