MedAliBH committed on
Commit
1eddb89
·
1 Parent(s): f4ece99

Upload intent classifier lstm

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ model/model_weights filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ model/logs/*
2
+ model/training_checkpoints/*
3
+ *.csv
4
+ *.npy
5
+ *.parquet
description.json ADDED
@@ -0,0 +1,893 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "command": "/usr/local/bin/ludwig experiment --config /src/intent-classifier-lstm.yaml --dataset /data/data.json --output_directory /results",
3
+ "compute": {
4
+ "num_nodes": 1
5
+ },
6
+ "config": {
7
+ "backend": null,
8
+ "combiner": {
9
+ "activation": "relu",
10
+ "bias_initializer": "zeros",
11
+ "dropout": 0.0,
12
+ "fc_layers": null,
13
+ "flatten_inputs": false,
14
+ "norm": null,
15
+ "norm_params": null,
16
+ "num_fc_layers": 0,
17
+ "output_size": 256,
18
+ "residual": false,
19
+ "type": "concat",
20
+ "use_bias": true,
21
+ "weights_initializer": "xavier_uniform"
22
+ },
23
+ "defaults": {
24
+ "audio": {
25
+ "encoder": {
26
+ "activation": "relu",
27
+ "bias_initializer": "zeros",
28
+ "conv_layers": null,
29
+ "dropout": 0.0,
30
+ "embedding_size": 256,
31
+ "embeddings_on_cpu": false,
32
+ "embeddings_trainable": true,
33
+ "fc_layers": null,
34
+ "filter_size": 3,
35
+ "max_sequence_length": null,
36
+ "norm": null,
37
+ "norm_params": null,
38
+ "num_conv_layers": null,
39
+ "num_fc_layers": null,
40
+ "num_filters": 256,
41
+ "output_size": 256,
42
+ "pool_function": "max",
43
+ "pool_size": null,
44
+ "pretrained_embeddings": null,
45
+ "reduce_output": "sum",
46
+ "representation": "dense",
47
+ "should_embed": true,
48
+ "skip": false,
49
+ "type": "parallel_cnn",
50
+ "use_bias": true,
51
+ "vocab": null,
52
+ "weights_initializer": "xavier_uniform"
53
+ },
54
+ "preprocessing": {
55
+ "audio_file_length_limit_in_s": 7.5,
56
+ "computed_fill_value": null,
57
+ "fill_value": null,
58
+ "in_memory": true,
59
+ "missing_value_strategy": "bfill",
60
+ "norm": null,
61
+ "num_fft_points": null,
62
+ "num_filter_bands": 80,
63
+ "padding_value": 0.0,
64
+ "type": "fbank",
65
+ "window_length_in_s": 0.04,
66
+ "window_shift_in_s": 0.02,
67
+ "window_type": "hamming"
68
+ }
69
+ },
70
+ "bag": {
71
+ "encoder": {
72
+ "activation": "relu",
73
+ "bias_initializer": "zeros",
74
+ "dropout": 0.0,
75
+ "embedding_size": 50,
76
+ "embeddings_on_cpu": false,
77
+ "embeddings_trainable": true,
78
+ "fc_layers": null,
79
+ "force_embedding_size": false,
80
+ "norm": null,
81
+ "norm_params": null,
82
+ "num_fc_layers": 0,
83
+ "output_size": 10,
84
+ "pretrained_embeddings": null,
85
+ "representation": "dense",
86
+ "skip": false,
87
+ "type": "embed",
88
+ "use_bias": true,
89
+ "vocab": null,
90
+ "weights_initializer": "xavier_uniform"
91
+ },
92
+ "preprocessing": {
93
+ "computed_fill_value": "<UNK>",
94
+ "fill_value": "<UNK>",
95
+ "lowercase": false,
96
+ "missing_value_strategy": "fill_with_const",
97
+ "most_common": 10000,
98
+ "tokenizer": "space"
99
+ }
100
+ },
101
+ "binary": {
102
+ "decoder": {
103
+ "bias_initializer": "zeros",
104
+ "fc_activation": "relu",
105
+ "fc_bias_initializer": "zeros",
106
+ "fc_dropout": 0.0,
107
+ "fc_layers": null,
108
+ "fc_norm": null,
109
+ "fc_norm_params": null,
110
+ "fc_output_size": 256,
111
+ "fc_use_bias": true,
112
+ "fc_weights_initializer": "xavier_uniform",
113
+ "input_size": null,
114
+ "num_fc_layers": 0,
115
+ "type": "regressor",
116
+ "use_bias": true,
117
+ "weights_initializer": "xavier_uniform"
118
+ },
119
+ "encoder": {
120
+ "skip": false,
121
+ "type": "passthrough"
122
+ },
123
+ "loss": {
124
+ "confidence_penalty": 0,
125
+ "positive_class_weight": null,
126
+ "robust_lambda": 0,
127
+ "type": "binary_weighted_cross_entropy",
128
+ "weight": 1.0
129
+ },
130
+ "preprocessing": {
131
+ "computed_fill_value": null,
132
+ "fallback_true_label": null,
133
+ "fill_value": null,
134
+ "missing_value_strategy": "fill_with_false"
135
+ }
136
+ },
137
+ "category": {
138
+ "decoder": {
139
+ "bias_initializer": "zeros",
140
+ "fc_activation": "relu",
141
+ "fc_bias_initializer": "zeros",
142
+ "fc_dropout": 0.0,
143
+ "fc_layers": null,
144
+ "fc_norm": null,
145
+ "fc_norm_params": null,
146
+ "fc_output_size": 256,
147
+ "fc_use_bias": true,
148
+ "fc_weights_initializer": "xavier_uniform",
149
+ "input_size": null,
150
+ "num_classes": null,
151
+ "num_fc_layers": 0,
152
+ "type": "classifier",
153
+ "use_bias": true,
154
+ "weights_initializer": "xavier_uniform"
155
+ },
156
+ "encoder": {
157
+ "dropout": 0.0,
158
+ "embedding_initializer": null,
159
+ "embedding_size": 50,
160
+ "embeddings_on_cpu": false,
161
+ "embeddings_trainable": true,
162
+ "pretrained_embeddings": null,
163
+ "skip": false,
164
+ "type": "dense",
165
+ "vocab": null
166
+ },
167
+ "loss": {
168
+ "class_similarities": null,
169
+ "class_similarities_temperature": 0,
170
+ "class_weights": null,
171
+ "confidence_penalty": 0,
172
+ "robust_lambda": 0,
173
+ "type": "softmax_cross_entropy",
174
+ "weight": 1.0
175
+ },
176
+ "preprocessing": {
177
+ "cache_encoder_embeddings": false,
178
+ "computed_fill_value": "<UNK>",
179
+ "fill_value": "<UNK>",
180
+ "lowercase": false,
181
+ "missing_value_strategy": "fill_with_const",
182
+ "most_common": 10000
183
+ }
184
+ },
185
+ "date": {
186
+ "encoder": {
187
+ "activation": "relu",
188
+ "bias_initializer": "zeros",
189
+ "dropout": 0.0,
190
+ "embedding_size": 10,
191
+ "embeddings_on_cpu": false,
192
+ "fc_layers": null,
193
+ "norm": null,
194
+ "norm_params": null,
195
+ "num_fc_layers": 0,
196
+ "output_size": 10,
197
+ "skip": false,
198
+ "type": "embed",
199
+ "use_bias": true,
200
+ "weights_initializer": "xavier_uniform"
201
+ },
202
+ "preprocessing": {
203
+ "computed_fill_value": "",
204
+ "datetime_format": null,
205
+ "fill_value": "",
206
+ "missing_value_strategy": "fill_with_const"
207
+ }
208
+ },
209
+ "h3": {
210
+ "encoder": {
211
+ "activation": "relu",
212
+ "bias_initializer": "zeros",
213
+ "dropout": 0.0,
214
+ "embedding_size": 10,
215
+ "embeddings_on_cpu": false,
216
+ "fc_layers": null,
217
+ "norm": null,
218
+ "norm_params": null,
219
+ "num_fc_layers": 0,
220
+ "output_size": 10,
221
+ "reduce_output": "sum",
222
+ "skip": false,
223
+ "type": "embed",
224
+ "use_bias": true,
225
+ "weights_initializer": "xavier_uniform"
226
+ },
227
+ "preprocessing": {
228
+ "computed_fill_value": 576495936675512319,
229
+ "fill_value": 576495936675512319,
230
+ "missing_value_strategy": "fill_with_const"
231
+ }
232
+ },
233
+ "image": {
234
+ "augmentation": [],
235
+ "decoder": {
236
+ "conv_norm": "batch",
237
+ "fc_activation": "relu",
238
+ "fc_bias_initializer": "zeros",
239
+ "fc_dropout": 0.0,
240
+ "fc_layers": null,
241
+ "fc_norm": null,
242
+ "fc_norm_params": null,
243
+ "fc_output_size": 256,
244
+ "fc_use_bias": true,
245
+ "fc_weights_initializer": "xavier_uniform",
246
+ "height": null,
247
+ "input_size": 1024,
248
+ "num_channels": null,
249
+ "num_classes": null,
250
+ "num_fc_layers": 0,
251
+ "type": "unet",
252
+ "width": null
253
+ },
254
+ "encoder": {
255
+ "conv_activation": "relu",
256
+ "conv_dropout": 0.0,
257
+ "conv_layers": null,
258
+ "conv_norm": null,
259
+ "conv_norm_params": null,
260
+ "conv_use_bias": true,
261
+ "dilation": 1,
262
+ "fc_activation": "relu",
263
+ "fc_bias_initializer": "zeros",
264
+ "fc_dropout": 0.0,
265
+ "fc_layers": null,
266
+ "fc_norm": null,
267
+ "fc_norm_params": null,
268
+ "fc_use_bias": true,
269
+ "fc_weights_initializer": "xavier_uniform",
270
+ "groups": 1,
271
+ "height": null,
272
+ "kernel_size": 3,
273
+ "num_channels": null,
274
+ "num_conv_layers": null,
275
+ "num_fc_layers": 1,
276
+ "out_channels": 32,
277
+ "output_size": 128,
278
+ "padding": "valid",
279
+ "padding_mode": "zeros",
280
+ "pool_dilation": 1,
281
+ "pool_function": "max",
282
+ "pool_kernel_size": 2,
283
+ "pool_padding": 0,
284
+ "pool_stride": null,
285
+ "skip": false,
286
+ "stride": 1,
287
+ "type": "stacked_cnn",
288
+ "width": null
289
+ },
290
+ "loss": {
291
+ "class_similarities": null,
292
+ "class_similarities_temperature": 0,
293
+ "class_weights": null,
294
+ "confidence_penalty": 0,
295
+ "robust_lambda": 0,
296
+ "type": "softmax_cross_entropy",
297
+ "weight": 1.0
298
+ },
299
+ "preprocessing": {
300
+ "computed_fill_value": null,
301
+ "fill_value": null,
302
+ "height": null,
303
+ "in_memory": true,
304
+ "infer_image_dimensions": true,
305
+ "infer_image_max_height": 256,
306
+ "infer_image_max_width": 256,
307
+ "infer_image_num_channels": true,
308
+ "infer_image_num_classes": false,
309
+ "infer_image_sample_size": 100,
310
+ "missing_value_strategy": "bfill",
311
+ "num_channels": null,
312
+ "num_classes": null,
313
+ "num_processes": 1,
314
+ "requires_equal_dimensions": false,
315
+ "resize_method": "interpolate",
316
+ "standardize_image": null,
317
+ "width": null
318
+ }
319
+ },
320
+ "number": {
321
+ "decoder": {
322
+ "bias_initializer": "zeros",
323
+ "fc_activation": "relu",
324
+ "fc_bias_initializer": "zeros",
325
+ "fc_dropout": 0.0,
326
+ "fc_layers": null,
327
+ "fc_norm": null,
328
+ "fc_norm_params": null,
329
+ "fc_output_size": 256,
330
+ "fc_use_bias": true,
331
+ "fc_weights_initializer": "xavier_uniform",
332
+ "input_size": null,
333
+ "num_fc_layers": 0,
334
+ "type": "regressor",
335
+ "use_bias": true,
336
+ "weights_initializer": "xavier_uniform"
337
+ },
338
+ "encoder": {
339
+ "skip": false,
340
+ "type": "passthrough"
341
+ },
342
+ "loss": {
343
+ "type": "mean_squared_error",
344
+ "weight": 1.0
345
+ },
346
+ "preprocessing": {
347
+ "computed_fill_value": 0.0,
348
+ "computed_outlier_fill_value": 0.0,
349
+ "fill_value": 0.0,
350
+ "missing_value_strategy": "fill_with_const",
351
+ "normalization": "zscore",
352
+ "outlier_strategy": null,
353
+ "outlier_threshold": 3.0
354
+ }
355
+ },
356
+ "sequence": {
357
+ "decoder": {
358
+ "cell_type": "gru",
359
+ "fc_activation": "relu",
360
+ "fc_bias_initializer": "zeros",
361
+ "fc_dropout": 0.0,
362
+ "fc_layers": null,
363
+ "fc_norm": null,
364
+ "fc_norm_params": null,
365
+ "fc_output_size": 256,
366
+ "fc_use_bias": true,
367
+ "fc_weights_initializer": "xavier_uniform",
368
+ "input_size": 256,
369
+ "max_sequence_length": null,
370
+ "num_fc_layers": 0,
371
+ "num_layers": 1,
372
+ "reduce_input": "sum",
373
+ "type": "generator",
374
+ "vocab_size": null
375
+ },
376
+ "encoder": {
377
+ "dropout": 0.0,
378
+ "embedding_size": 256,
379
+ "embeddings_on_cpu": false,
380
+ "embeddings_trainable": true,
381
+ "max_sequence_length": null,
382
+ "pretrained_embeddings": null,
383
+ "reduce_output": "sum",
384
+ "representation": "dense",
385
+ "skip": false,
386
+ "type": "embed",
387
+ "vocab": null,
388
+ "weights_initializer": "uniform"
389
+ },
390
+ "loss": {
391
+ "class_similarities": null,
392
+ "class_similarities_temperature": 0,
393
+ "class_weights": null,
394
+ "confidence_penalty": 0,
395
+ "robust_lambda": 0,
396
+ "type": "sequence_softmax_cross_entropy",
397
+ "unique": false,
398
+ "weight": 1.0
399
+ },
400
+ "preprocessing": {
401
+ "cache_encoder_embeddings": false,
402
+ "computed_fill_value": "<UNK>",
403
+ "fill_value": "<UNK>",
404
+ "lowercase": false,
405
+ "max_sequence_length": 256,
406
+ "missing_value_strategy": "fill_with_const",
407
+ "most_common": 20000,
408
+ "ngram_size": 2,
409
+ "padding": "right",
410
+ "padding_symbol": "<PAD>",
411
+ "sequence_length": null,
412
+ "tokenizer": "space",
413
+ "unknown_symbol": "<UNK>",
414
+ "vocab_file": null
415
+ }
416
+ },
417
+ "set": {
418
+ "decoder": {
419
+ "bias_initializer": "zeros",
420
+ "fc_activation": "relu",
421
+ "fc_bias_initializer": "zeros",
422
+ "fc_dropout": 0.0,
423
+ "fc_layers": null,
424
+ "fc_norm": null,
425
+ "fc_norm_params": null,
426
+ "fc_output_size": 256,
427
+ "fc_use_bias": true,
428
+ "fc_weights_initializer": "xavier_uniform",
429
+ "input_size": null,
430
+ "num_classes": null,
431
+ "num_fc_layers": 0,
432
+ "type": "classifier",
433
+ "use_bias": true,
434
+ "weights_initializer": "xavier_uniform"
435
+ },
436
+ "encoder": {
437
+ "activation": "relu",
438
+ "bias_initializer": "zeros",
439
+ "dropout": 0.0,
440
+ "embedding_size": 50,
441
+ "embeddings_on_cpu": false,
442
+ "embeddings_trainable": true,
443
+ "fc_layers": null,
444
+ "norm": null,
445
+ "norm_params": null,
446
+ "num_fc_layers": 0,
447
+ "output_size": 10,
448
+ "pretrained_embeddings": null,
449
+ "representation": "dense",
450
+ "skip": false,
451
+ "type": "embed",
452
+ "use_bias": true,
453
+ "vocab": null,
454
+ "weights_initializer": "xavier_uniform"
455
+ },
456
+ "loss": {
457
+ "class_weights": null,
458
+ "type": "sigmoid_cross_entropy",
459
+ "weight": 1.0
460
+ },
461
+ "preprocessing": {
462
+ "computed_fill_value": "<UNK>",
463
+ "fill_value": "<UNK>",
464
+ "lowercase": false,
465
+ "missing_value_strategy": "fill_with_const",
466
+ "most_common": 10000,
467
+ "tokenizer": "space"
468
+ }
469
+ },
470
+ "text": {
471
+ "decoder": {
472
+ "cell_type": "gru",
473
+ "fc_activation": "relu",
474
+ "fc_bias_initializer": "zeros",
475
+ "fc_dropout": 0.0,
476
+ "fc_layers": null,
477
+ "fc_norm": null,
478
+ "fc_norm_params": null,
479
+ "fc_output_size": 256,
480
+ "fc_use_bias": true,
481
+ "fc_weights_initializer": "xavier_uniform",
482
+ "input_size": 256,
483
+ "max_sequence_length": null,
484
+ "num_fc_layers": 0,
485
+ "num_layers": 1,
486
+ "reduce_input": "sum",
487
+ "type": "generator",
488
+ "vocab_size": null
489
+ },
490
+ "encoder": {
491
+ "activation": "relu",
492
+ "bias_initializer": "zeros",
493
+ "conv_layers": null,
494
+ "dropout": 0.0,
495
+ "embedding_size": 256,
496
+ "embeddings_on_cpu": false,
497
+ "embeddings_trainable": true,
498
+ "fc_layers": null,
499
+ "filter_size": 3,
500
+ "max_sequence_length": null,
501
+ "norm": null,
502
+ "norm_params": null,
503
+ "num_conv_layers": null,
504
+ "num_fc_layers": null,
505
+ "num_filters": 256,
506
+ "output_size": 256,
507
+ "pool_function": "max",
508
+ "pool_size": null,
509
+ "pretrained_embeddings": null,
510
+ "reduce_output": "sum",
511
+ "representation": "dense",
512
+ "should_embed": true,
513
+ "skip": false,
514
+ "type": "parallel_cnn",
515
+ "use_bias": true,
516
+ "vocab": null,
517
+ "weights_initializer": "xavier_uniform"
518
+ },
519
+ "loss": {
520
+ "class_similarities": null,
521
+ "class_similarities_temperature": 0,
522
+ "class_weights": null,
523
+ "confidence_penalty": 0,
524
+ "robust_lambda": 0,
525
+ "type": "sequence_softmax_cross_entropy",
526
+ "unique": false,
527
+ "weight": 1.0
528
+ },
529
+ "preprocessing": {
530
+ "cache_encoder_embeddings": false,
531
+ "compute_idf": false,
532
+ "computed_fill_value": "<UNK>",
533
+ "fill_value": "<UNK>",
534
+ "lowercase": false,
535
+ "max_sequence_length": 256,
536
+ "missing_value_strategy": "fill_with_const",
537
+ "most_common": 20000,
538
+ "ngram_size": 2,
539
+ "padding": "right",
540
+ "padding_symbol": "<PAD>",
541
+ "pretrained_model_name_or_path": null,
542
+ "prompt": {
543
+ "retrieval": {
544
+ "index_name": null,
545
+ "k": 0,
546
+ "model_name": null,
547
+ "type": null
548
+ },
549
+ "task": null,
550
+ "template": null
551
+ },
552
+ "sequence_length": null,
553
+ "tokenizer": "space_punct",
554
+ "unknown_symbol": "<UNK>",
555
+ "vocab_file": null
556
+ }
557
+ },
558
+ "timeseries": {
559
+ "decoder": {
560
+ "activation": null,
561
+ "bias_initializer": "zeros",
562
+ "clip": null,
563
+ "fc_activation": "relu",
564
+ "fc_bias_initializer": "zeros",
565
+ "fc_dropout": 0.0,
566
+ "fc_layers": null,
567
+ "fc_norm": null,
568
+ "fc_norm_params": null,
569
+ "fc_output_size": 256,
570
+ "fc_use_bias": true,
571
+ "fc_weights_initializer": "xavier_uniform",
572
+ "input_size": null,
573
+ "multiplier": 1.0,
574
+ "num_fc_layers": 0,
575
+ "output_size": null,
576
+ "type": "projector",
577
+ "use_bias": true,
578
+ "weights_initializer": "xavier_uniform"
579
+ },
580
+ "encoder": {
581
+ "activation": "relu",
582
+ "bias_initializer": "zeros",
583
+ "conv_layers": null,
584
+ "dropout": 0.0,
585
+ "embedding_size": 256,
586
+ "embeddings_on_cpu": false,
587
+ "embeddings_trainable": true,
588
+ "fc_layers": null,
589
+ "filter_size": 3,
590
+ "max_sequence_length": null,
591
+ "norm": null,
592
+ "norm_params": null,
593
+ "num_conv_layers": null,
594
+ "num_fc_layers": null,
595
+ "num_filters": 256,
596
+ "output_size": 256,
597
+ "pool_function": "max",
598
+ "pool_size": null,
599
+ "pretrained_embeddings": null,
600
+ "reduce_output": "sum",
601
+ "representation": "dense",
602
+ "should_embed": true,
603
+ "skip": false,
604
+ "type": "parallel_cnn",
605
+ "use_bias": true,
606
+ "vocab": null,
607
+ "weights_initializer": "xavier_uniform"
608
+ },
609
+ "loss": {
610
+ "delta": 1.0,
611
+ "type": "huber",
612
+ "weight": 1.0
613
+ },
614
+ "preprocessing": {
615
+ "computed_fill_value": "",
616
+ "fill_value": "",
617
+ "missing_value_strategy": "fill_with_const",
618
+ "padding": "right",
619
+ "padding_value": 0.0,
620
+ "timeseries_length_limit": 256,
621
+ "tokenizer": "space",
622
+ "window_size": 0
623
+ }
624
+ },
625
+ "vector": {
626
+ "decoder": {
627
+ "activation": null,
628
+ "bias_initializer": "zeros",
629
+ "clip": null,
630
+ "fc_activation": "relu",
631
+ "fc_bias_initializer": "zeros",
632
+ "fc_dropout": 0.0,
633
+ "fc_layers": null,
634
+ "fc_norm": null,
635
+ "fc_norm_params": null,
636
+ "fc_output_size": 256,
637
+ "fc_use_bias": true,
638
+ "fc_weights_initializer": "xavier_uniform",
639
+ "input_size": null,
640
+ "multiplier": 1.0,
641
+ "num_fc_layers": 0,
642
+ "output_size": null,
643
+ "type": "projector",
644
+ "use_bias": true,
645
+ "weights_initializer": "xavier_uniform"
646
+ },
647
+ "encoder": {
648
+ "activation": "relu",
649
+ "bias_initializer": "zeros",
650
+ "dropout": 0.0,
651
+ "fc_layers": null,
652
+ "input_size": null,
653
+ "norm": null,
654
+ "norm_params": null,
655
+ "num_layers": 1,
656
+ "output_size": 256,
657
+ "skip": false,
658
+ "type": "dense",
659
+ "use_bias": true,
660
+ "weights_initializer": "xavier_uniform"
661
+ },
662
+ "loss": {
663
+ "type": "mean_squared_error",
664
+ "weight": 1.0
665
+ },
666
+ "preprocessing": {
667
+ "computed_fill_value": "",
668
+ "fill_value": "",
669
+ "missing_value_strategy": "fill_with_const",
670
+ "vector_size": null
671
+ }
672
+ }
673
+ },
674
+ "hyperopt": null,
675
+ "input_features": [
676
+ {
677
+ "active": true,
678
+ "column": "text",
679
+ "encoder": {
680
+ "activation": "tanh",
681
+ "bias_initializer": "zeros",
682
+ "bidirectional": true,
683
+ "cell_type": "lstm",
684
+ "conv_activation": "relu",
685
+ "conv_dropout": 0.0,
686
+ "conv_layers": null,
687
+ "dilation_rate": 1,
688
+ "dropout": 0.2,
689
+ "embedding_size": 256,
690
+ "embeddings_on_cpu": false,
691
+ "embeddings_trainable": true,
692
+ "fc_activation": "relu",
693
+ "fc_dropout": 0.0,
694
+ "fc_layers": null,
695
+ "filter_size": 5,
696
+ "max_sequence_length": null,
697
+ "norm": null,
698
+ "norm_params": null,
699
+ "num_conv_layers": null,
700
+ "num_fc_layers": 0,
701
+ "num_filters": 256,
702
+ "num_rec_layers": 1,
703
+ "output_size": 256,
704
+ "padding": "same",
705
+ "pool_function": "max",
706
+ "pool_padding": "same",
707
+ "pool_size": null,
708
+ "pool_strides": null,
709
+ "pretrained_embeddings": null,
710
+ "recurrent_activation": "sigmoid",
711
+ "recurrent_dropout": 0.0,
712
+ "recurrent_initializer": "orthogonal",
713
+ "reduce_output": null,
714
+ "representation": "dense",
715
+ "should_embed": true,
716
+ "skip": false,
717
+ "state_size": 256,
718
+ "strides": 1,
719
+ "type": "cnnrnn",
720
+ "unit_forget_bias": true,
721
+ "use_bias": true,
722
+ "vocab": null,
723
+ "weights_initializer": "xavier_uniform"
724
+ },
725
+ "name": "text",
726
+ "preprocessing": {
727
+ "cache_encoder_embeddings": false,
728
+ "computed_fill_value": "<UNK>",
729
+ "fill_value": "<UNK>",
730
+ "lowercase": true,
731
+ "max_sequence_length": 256,
732
+ "missing_value_strategy": "fill_with_const",
733
+ "most_common": 20000,
734
+ "ngram_size": 3,
735
+ "padding": "right",
736
+ "padding_symbol": "<PAD>",
737
+ "sequence_length": null,
738
+ "tokenizer": "ngram",
739
+ "unknown_symbol": "<UNK>",
740
+ "vocab_file": null
741
+ },
742
+ "proc_column": "text_llKKzv",
743
+ "tied": null,
744
+ "type": "sequence"
745
+ }
746
+ ],
747
+ "ludwig_version": "0.10.2.dev",
748
+ "model_type": "ecd",
749
+ "output_features": [
750
+ {
751
+ "active": true,
752
+ "calibration": false,
753
+ "column": "intent",
754
+ "decoder": {
755
+ "bias_initializer": "zeros",
756
+ "fc_activation": "relu",
757
+ "fc_bias_initializer": "zeros",
758
+ "fc_dropout": 0.2,
759
+ "fc_layers": null,
760
+ "fc_norm": null,
761
+ "fc_norm_params": null,
762
+ "fc_output_size": 256,
763
+ "fc_use_bias": true,
764
+ "fc_weights_initializer": "xavier_uniform",
765
+ "input_size": null,
766
+ "num_classes": null,
767
+ "num_fc_layers": 0,
768
+ "type": "classifier",
769
+ "use_bias": true,
770
+ "weights_initializer": "xavier_uniform"
771
+ },
772
+ "default_validation_metric": "accuracy",
773
+ "dependencies": [],
774
+ "input_size": null,
775
+ "loss": {
776
+ "class_similarities": null,
777
+ "class_similarities_temperature": 0,
778
+ "class_weights": null,
779
+ "confidence_penalty": 0,
780
+ "robust_lambda": 0,
781
+ "type": "softmax_cross_entropy",
782
+ "weight": 1.0
783
+ },
784
+ "name": "intent",
785
+ "num_classes": null,
786
+ "preprocessing": {
787
+ "cache_encoder_embeddings": false,
788
+ "computed_fill_value": "<UNK>",
789
+ "fill_value": "<UNK>",
790
+ "lowercase": false,
791
+ "missing_value_strategy": "drop_row",
792
+ "most_common": 10000
793
+ },
794
+ "proc_column": "intent_YwJjWN",
795
+ "reduce_dependencies": "sum",
796
+ "reduce_input": "sum",
797
+ "top_k": 3,
798
+ "type": "category"
799
+ }
800
+ ],
801
+ "preprocessing": {
802
+ "global_max_sequence_length": null,
803
+ "oversample_minority": null,
804
+ "sample_ratio": 1.0,
805
+ "sample_size": null,
806
+ "split": {
807
+ "column": "intent",
808
+ "probabilities": [
809
+ 0.85,
810
+ 0.1,
811
+ 0.05
812
+ ],
813
+ "type": "stratify"
814
+ },
815
+ "undersample_majority": null
816
+ },
817
+ "trainer": {
818
+ "batch_size": "auto",
819
+ "bucketing_field": null,
820
+ "checkpoints_per_epoch": 0,
821
+ "compile": false,
822
+ "early_stop": 0,
823
+ "effective_batch_size": "auto",
824
+ "enable_gradient_checkpointing": false,
825
+ "enable_profiling": false,
826
+ "epochs": 10,
827
+ "eval_batch_size": null,
828
+ "eval_steps": null,
829
+ "evaluate_training_set": false,
830
+ "gradient_accumulation_steps": "auto",
831
+ "gradient_clipping": {
832
+ "clipglobalnorm": 0.5,
833
+ "clipnorm": null,
834
+ "clipvalue": null
835
+ },
836
+ "increase_batch_size_eval_metric": "loss",
837
+ "increase_batch_size_eval_split": "training",
838
+ "increase_batch_size_on_plateau": 0,
839
+ "increase_batch_size_on_plateau_patience": 5,
840
+ "increase_batch_size_on_plateau_rate": 2.0,
841
+ "learning_rate": 0.001,
842
+ "learning_rate_scaling": "linear",
843
+ "learning_rate_scheduler": {
844
+ "decay": "exponential",
845
+ "decay_rate": 0.96,
846
+ "decay_steps": 10000,
847
+ "eta_min": 0,
848
+ "reduce_eval_metric": "loss",
849
+ "reduce_eval_split": "training",
850
+ "reduce_on_plateau": 0,
851
+ "reduce_on_plateau_patience": 10,
852
+ "reduce_on_plateau_rate": 0.1,
853
+ "staircase": false,
854
+ "t_0": null,
855
+ "t_mult": 1,
856
+ "warmup_evaluations": 0,
857
+ "warmup_fraction": 0.0
858
+ },
859
+ "max_batch_size": 1099511627776,
860
+ "optimizer": {
861
+ "amsgrad": false,
862
+ "betas": [
863
+ 0.9,
864
+ 0.999
865
+ ],
866
+ "eps": 1e-08,
867
+ "type": "adam",
868
+ "weight_decay": 0.0
869
+ },
870
+ "profiler": {
871
+ "active": 3,
872
+ "repeat": 5,
873
+ "skip_first": 0,
874
+ "wait": 1,
875
+ "warmup": 1
876
+ },
877
+ "regularization_lambda": 0.0,
878
+ "regularization_type": "l2",
879
+ "should_shuffle": true,
880
+ "skip_all_evaluation": false,
881
+ "steps_per_checkpoint": 0,
882
+ "train_steps": null,
883
+ "use_mixed_precision": false,
884
+ "validation_field": "intent",
885
+ "validation_metric": "accuracy"
886
+ }
887
+ },
888
+ "data_format": "json",
889
+ "dataset": "/data/data.json",
890
+ "ludwig_version": "0.10.2.dev",
891
+ "random_seed": 42,
892
+ "torch_version": "2.0.0+cpu"
893
+ }
model/model_hyperparameters.json ADDED
The diff for this file is too large to render. See raw diff
 
model/model_weights ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d2b767c5b8249f486b98d595f49fa1a25d818953dfc434d73c31f53c34acba9
3
+ size 24754846
model/training_progress.json ADDED
@@ -0,0 +1,2045 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "batch_size": 128,
3
+ "best_eval_metric_checkpoint_number": 18,
4
+ "best_eval_metric_epoch": 10,
5
+ "best_eval_metric_steps": 470,
6
+ "best_eval_metric_value": 0.6166250705718994,
7
+ "best_eval_test_metrics": {
8
+ "combined": {
9
+ "loss": 3.0807435512542725
10
+ },
11
+ "intent": {
12
+ "accuracy": 0.5496426820755005,
13
+ "accuracy_micro": 0.5959885120391846,
14
+ "hits_at_k": 0.6660665273666382,
15
+ "loss": 3.0807435512542725,
16
+ "roc_auc": 0.9340102672576904
17
+ }
18
+ },
19
+ "best_eval_train_metrics": {
20
+ "combined": {
21
+ "loss": 0.15086334943771362
22
+ },
23
+ "intent": {
24
+ "accuracy": 0.9410130977630615,
25
+ "accuracy_micro": 0.9574396014213562,
26
+ "hits_at_k": 0.9925163984298706,
27
+ "loss": 0.15086334943771362,
28
+ "roc_auc": 0.9996311664581299
29
+ }
30
+ },
31
+ "best_eval_validation_metrics": {
32
+ "combined": {
33
+ "loss": 2.5151546001434326
34
+ },
35
+ "intent": {
36
+ "accuracy": 0.6166250705718994,
37
+ "accuracy_micro": 0.63271164894104,
38
+ "hits_at_k": 0.7617202997207642,
39
+ "loss": 2.5151546001434326,
40
+ "roc_auc": 0.9704092144966125
41
+ }
42
+ },
43
+ "best_increase_batch_size_eval_metric": Infinity,
44
+ "checkpoint_number": 20,
45
+ "checkpoint_to_epoch": {
46
+ "1": 1,
47
+ "10": 5,
48
+ "11": 6,
49
+ "12": 6,
50
+ "13": 7,
51
+ "14": 7,
52
+ "15": 8,
53
+ "16": 8,
54
+ "17": 9,
55
+ "18": 9,
56
+ "19": 10,
57
+ "2": 1,
58
+ "20": 10,
59
+ "3": 2,
60
+ "4": 2,
61
+ "5": 3,
62
+ "6": 3,
63
+ "7": 4,
64
+ "8": 4,
65
+ "9": 5
66
+ },
67
+ "checkpoint_to_step": {
68
+ "1": 47,
69
+ "10": 235,
70
+ "11": 282,
71
+ "12": 282,
72
+ "13": 329,
73
+ "14": 329,
74
+ "15": 376,
75
+ "16": 376,
76
+ "17": 423,
77
+ "18": 423,
78
+ "19": 470,
79
+ "2": 47,
80
+ "20": 470,
81
+ "3": 94,
82
+ "4": 94,
83
+ "5": 141,
84
+ "6": 141,
85
+ "7": 188,
86
+ "8": 188,
87
+ "9": 235
88
+ },
89
+ "cumulative_checkpoint_token_usage": {
90
+ "1": 1521697,
91
+ "10": 7608485,
92
+ "11": 9130182,
93
+ "12": 9130182,
94
+ "13": 10651879,
95
+ "14": 10651879,
96
+ "15": 12173576,
97
+ "16": 12173576,
98
+ "17": 13695273,
99
+ "18": 13695273,
100
+ "19": 15216970,
101
+ "2": 1521697,
102
+ "20": 15216970,
103
+ "3": 3043394,
104
+ "4": 3043394,
105
+ "5": 4565091,
106
+ "6": 4565091,
107
+ "7": 6086788,
108
+ "8": 6086788,
109
+ "9": 7608485
110
+ },
111
+ "cumulative_step_token_usage": {
112
+ "0": 32896,
113
+ "1": 65792,
114
+ "10": 361856,
115
+ "100": 3273666,
116
+ "101": 3306562,
117
+ "102": 3339458,
118
+ "103": 3372354,
119
+ "104": 3405250,
120
+ "105": 3438146,
121
+ "106": 3471042,
122
+ "107": 3503938,
123
+ "108": 3536834,
124
+ "109": 3569730,
125
+ "11": 394752,
126
+ "110": 3602626,
127
+ "111": 3635522,
128
+ "112": 3668418,
129
+ "113": 3701314,
130
+ "114": 3734210,
131
+ "115": 3767106,
132
+ "116": 3800002,
133
+ "117": 3832898,
134
+ "118": 3865794,
135
+ "119": 3898690,
136
+ "12": 427648,
137
+ "120": 3931586,
138
+ "121": 3964482,
139
+ "122": 3997378,
140
+ "123": 4030274,
141
+ "124": 4063170,
142
+ "125": 4096066,
143
+ "126": 4128962,
144
+ "127": 4161858,
145
+ "128": 4194754,
146
+ "129": 4227650,
147
+ "13": 460544,
148
+ "130": 4260546,
149
+ "131": 4293442,
150
+ "132": 4326338,
151
+ "133": 4359234,
152
+ "134": 4392130,
153
+ "135": 4425026,
154
+ "136": 4457922,
155
+ "137": 4490818,
156
+ "138": 4523714,
157
+ "139": 4556610,
158
+ "14": 493440,
159
+ "140": 4565091,
160
+ "141": 4597987,
161
+ "142": 4630883,
162
+ "143": 4663779,
163
+ "144": 4696675,
164
+ "145": 4729571,
165
+ "146": 4762467,
166
+ "147": 4795363,
167
+ "148": 4828259,
168
+ "149": 4861155,
169
+ "15": 526336,
170
+ "150": 4894051,
171
+ "151": 4926947,
172
+ "152": 4959843,
173
+ "153": 4992739,
174
+ "154": 5025635,
175
+ "155": 5058531,
176
+ "156": 5091427,
177
+ "157": 5124323,
178
+ "158": 5157219,
179
+ "159": 5190115,
180
+ "16": 559232,
181
+ "160": 5223011,
182
+ "161": 5255907,
183
+ "162": 5288803,
184
+ "163": 5321699,
185
+ "164": 5354595,
186
+ "165": 5387491,
187
+ "166": 5420387,
188
+ "167": 5453283,
189
+ "168": 5486179,
190
+ "169": 5519075,
191
+ "17": 592128,
192
+ "170": 5551971,
193
+ "171": 5584867,
194
+ "172": 5617763,
195
+ "173": 5650659,
196
+ "174": 5683555,
197
+ "175": 5716451,
198
+ "176": 5749347,
199
+ "177": 5782243,
200
+ "178": 5815139,
201
+ "179": 5848035,
202
+ "18": 625024,
203
+ "180": 5880931,
204
+ "181": 5913827,
205
+ "182": 5946723,
206
+ "183": 5979619,
207
+ "184": 6012515,
208
+ "185": 6045411,
209
+ "186": 6078307,
210
+ "187": 6086788,
211
+ "188": 6119684,
212
+ "189": 6152580,
213
+ "19": 657920,
214
+ "190": 6185476,
215
+ "191": 6218372,
216
+ "192": 6251268,
217
+ "193": 6284164,
218
+ "194": 6317060,
219
+ "195": 6349956,
220
+ "196": 6382852,
221
+ "197": 6415748,
222
+ "198": 6448644,
223
+ "199": 6481540,
224
+ "2": 98688,
225
+ "20": 690816,
226
+ "200": 6514436,
227
+ "201": 6547332,
228
+ "202": 6580228,
229
+ "203": 6613124,
230
+ "204": 6646020,
231
+ "205": 6678916,
232
+ "206": 6711812,
233
+ "207": 6744708,
234
+ "208": 6777604,
235
+ "209": 6810500,
236
+ "21": 723712,
237
+ "210": 6843396,
238
+ "211": 6876292,
239
+ "212": 6909188,
240
+ "213": 6942084,
241
+ "214": 6974980,
242
+ "215": 7007876,
243
+ "216": 7040772,
244
+ "217": 7073668,
245
+ "218": 7106564,
246
+ "219": 7139460,
247
+ "22": 756608,
248
+ "220": 7172356,
249
+ "221": 7205252,
250
+ "222": 7238148,
251
+ "223": 7271044,
252
+ "224": 7303940,
253
+ "225": 7336836,
254
+ "226": 7369732,
255
+ "227": 7402628,
256
+ "228": 7435524,
257
+ "229": 7468420,
258
+ "23": 789504,
259
+ "230": 7501316,
260
+ "231": 7534212,
261
+ "232": 7567108,
262
+ "233": 7600004,
263
+ "234": 7608485,
264
+ "235": 7641381,
265
+ "236": 7674277,
266
+ "237": 7707173,
267
+ "238": 7740069,
268
+ "239": 7772965,
269
+ "24": 822400,
270
+ "240": 7805861,
271
+ "241": 7838757,
272
+ "242": 7871653,
273
+ "243": 7904549,
274
+ "244": 7937445,
275
+ "245": 7970341,
276
+ "246": 8003237,
277
+ "247": 8036133,
278
+ "248": 8069029,
279
+ "249": 8101925,
280
+ "25": 855296,
281
+ "250": 8134821,
282
+ "251": 8167717,
283
+ "252": 8200613,
284
+ "253": 8233509,
285
+ "254": 8266405,
286
+ "255": 8299301,
287
+ "256": 8332197,
288
+ "257": 8365093,
289
+ "258": 8397989,
290
+ "259": 8430885,
291
+ "26": 888192,
292
+ "260": 8463781,
293
+ "261": 8496677,
294
+ "262": 8529573,
295
+ "263": 8562469,
296
+ "264": 8595365,
297
+ "265": 8628261,
298
+ "266": 8661157,
299
+ "267": 8694053,
300
+ "268": 8726949,
301
+ "269": 8759845,
302
+ "27": 921088,
303
+ "270": 8792741,
304
+ "271": 8825637,
305
+ "272": 8858533,
306
+ "273": 8891429,
307
+ "274": 8924325,
308
+ "275": 8957221,
309
+ "276": 8990117,
310
+ "277": 9023013,
311
+ "278": 9055909,
312
+ "279": 9088805,
313
+ "28": 953984,
314
+ "280": 9121701,
315
+ "281": 9130182,
316
+ "282": 9163078,
317
+ "283": 9195974,
318
+ "284": 9228870,
319
+ "285": 9261766,
320
+ "286": 9294662,
321
+ "287": 9327558,
322
+ "288": 9360454,
323
+ "289": 9393350,
324
+ "29": 986880,
325
+ "290": 9426246,
326
+ "291": 9459142,
327
+ "292": 9492038,
328
+ "293": 9524934,
329
+ "294": 9557830,
330
+ "295": 9590726,
331
+ "296": 9623622,
332
+ "297": 9656518,
333
+ "298": 9689414,
334
+ "299": 9722310,
335
+ "3": 131584,
336
+ "30": 1019776,
337
+ "300": 9755206,
338
+ "301": 9788102,
339
+ "302": 9820998,
340
+ "303": 9853894,
341
+ "304": 9886790,
342
+ "305": 9919686,
343
+ "306": 9952582,
344
+ "307": 9985478,
345
+ "308": 10018374,
346
+ "309": 10051270,
347
+ "31": 1052672,
348
+ "310": 10084166,
349
+ "311": 10117062,
350
+ "312": 10149958,
351
+ "313": 10182854,
352
+ "314": 10215750,
353
+ "315": 10248646,
354
+ "316": 10281542,
355
+ "317": 10314438,
356
+ "318": 10347334,
357
+ "319": 10380230,
358
+ "32": 1085568,
359
+ "320": 10413126,
360
+ "321": 10446022,
361
+ "322": 10478918,
362
+ "323": 10511814,
363
+ "324": 10544710,
364
+ "325": 10577606,
365
+ "326": 10610502,
366
+ "327": 10643398,
367
+ "328": 10651879,
368
+ "329": 10684775,
369
+ "33": 1118464,
370
+ "330": 10717671,
371
+ "331": 10750567,
372
+ "332": 10783463,
373
+ "333": 10816359,
374
+ "334": 10849255,
375
+ "335": 10882151,
376
+ "336": 10915047,
377
+ "337": 10947943,
378
+ "338": 10980839,
379
+ "339": 11013735,
380
+ "34": 1151360,
381
+ "340": 11046631,
382
+ "341": 11079527,
383
+ "342": 11112423,
384
+ "343": 11145319,
385
+ "344": 11178215,
386
+ "345": 11211111,
387
+ "346": 11244007,
388
+ "347": 11276903,
389
+ "348": 11309799,
390
+ "349": 11342695,
391
+ "35": 1184256,
392
+ "350": 11375591,
393
+ "351": 11408487,
394
+ "352": 11441383,
395
+ "353": 11474279,
396
+ "354": 11507175,
397
+ "355": 11540071,
398
+ "356": 11572967,
399
+ "357": 11605863,
400
+ "358": 11638759,
401
+ "359": 11671655,
402
+ "36": 1217152,
403
+ "360": 11704551,
404
+ "361": 11737447,
405
+ "362": 11770343,
406
+ "363": 11803239,
407
+ "364": 11836135,
408
+ "365": 11869031,
409
+ "366": 11901927,
410
+ "367": 11934823,
411
+ "368": 11967719,
412
+ "369": 12000615,
413
+ "37": 1250048,
414
+ "370": 12033511,
415
+ "371": 12066407,
416
+ "372": 12099303,
417
+ "373": 12132199,
418
+ "374": 12165095,
419
+ "375": 12173576,
420
+ "376": 12206472,
421
+ "377": 12239368,
422
+ "378": 12272264,
423
+ "379": 12305160,
424
+ "38": 1282944,
425
+ "380": 12338056,
426
+ "381": 12370952,
427
+ "382": 12403848,
428
+ "383": 12436744,
429
+ "384": 12469640,
430
+ "385": 12502536,
431
+ "386": 12535432,
432
+ "387": 12568328,
433
+ "388": 12601224,
434
+ "389": 12634120,
435
+ "39": 1315840,
436
+ "390": 12667016,
437
+ "391": 12699912,
438
+ "392": 12732808,
439
+ "393": 12765704,
440
+ "394": 12798600,
441
+ "395": 12831496,
442
+ "396": 12864392,
443
+ "397": 12897288,
444
+ "398": 12930184,
445
+ "399": 12963080,
446
+ "4": 164480,
447
+ "40": 1348736,
448
+ "400": 12995976,
449
+ "401": 13028872,
450
+ "402": 13061768,
451
+ "403": 13094664,
452
+ "404": 13127560,
453
+ "405": 13160456,
454
+ "406": 13193352,
455
+ "407": 13226248,
456
+ "408": 13259144,
457
+ "409": 13292040,
458
+ "41": 1381632,
459
+ "410": 13324936,
460
+ "411": 13357832,
461
+ "412": 13390728,
462
+ "413": 13423624,
463
+ "414": 13456520,
464
+ "415": 13489416,
465
+ "416": 13522312,
466
+ "417": 13555208,
467
+ "418": 13588104,
468
+ "419": 13621000,
469
+ "42": 1414528,
470
+ "420": 13653896,
471
+ "421": 13686792,
472
+ "422": 13695273,
473
+ "423": 13728169,
474
+ "424": 13761065,
475
+ "425": 13793961,
476
+ "426": 13826857,
477
+ "427": 13859753,
478
+ "428": 13892649,
479
+ "429": 13925545,
480
+ "43": 1447424,
481
+ "430": 13958441,
482
+ "431": 13991337,
483
+ "432": 14024233,
484
+ "433": 14057129,
485
+ "434": 14090025,
486
+ "435": 14122921,
487
+ "436": 14155817,
488
+ "437": 14188713,
489
+ "438": 14221609,
490
+ "439": 14254505,
491
+ "44": 1480320,
492
+ "440": 14287401,
493
+ "441": 14320297,
494
+ "442": 14353193,
495
+ "443": 14386089,
496
+ "444": 14418985,
497
+ "445": 14451881,
498
+ "446": 14484777,
499
+ "447": 14517673,
500
+ "448": 14550569,
501
+ "449": 14583465,
502
+ "45": 1513216,
503
+ "450": 14616361,
504
+ "451": 14649257,
505
+ "452": 14682153,
506
+ "453": 14715049,
507
+ "454": 14747945,
508
+ "455": 14780841,
509
+ "456": 14813737,
510
+ "457": 14846633,
511
+ "458": 14879529,
512
+ "459": 14912425,
513
+ "46": 1521697,
514
+ "460": 14945321,
515
+ "461": 14978217,
516
+ "462": 15011113,
517
+ "463": 15044009,
518
+ "464": 15076905,
519
+ "465": 15109801,
520
+ "466": 15142697,
521
+ "467": 15175593,
522
+ "468": 15208489,
523
+ "469": 15216970,
524
+ "47": 1554593,
525
+ "48": 1587489,
526
+ "49": 1620385,
527
+ "5": 197376,
528
+ "50": 1653281,
529
+ "51": 1686177,
530
+ "52": 1719073,
531
+ "53": 1751969,
532
+ "54": 1784865,
533
+ "55": 1817761,
534
+ "56": 1850657,
535
+ "57": 1883553,
536
+ "58": 1916449,
537
+ "59": 1949345,
538
+ "6": 230272,
539
+ "60": 1982241,
540
+ "61": 2015137,
541
+ "62": 2048033,
542
+ "63": 2080929,
543
+ "64": 2113825,
544
+ "65": 2146721,
545
+ "66": 2179617,
546
+ "67": 2212513,
547
+ "68": 2245409,
548
+ "69": 2278305,
549
+ "7": 263168,
550
+ "70": 2311201,
551
+ "71": 2344097,
552
+ "72": 2376993,
553
+ "73": 2409889,
554
+ "74": 2442785,
555
+ "75": 2475681,
556
+ "76": 2508577,
557
+ "77": 2541473,
558
+ "78": 2574369,
559
+ "79": 2607265,
560
+ "8": 296064,
561
+ "80": 2640161,
562
+ "81": 2673057,
563
+ "82": 2705953,
564
+ "83": 2738849,
565
+ "84": 2771745,
566
+ "85": 2804641,
567
+ "86": 2837537,
568
+ "87": 2870433,
569
+ "88": 2903329,
570
+ "89": 2936225,
571
+ "9": 328960,
572
+ "90": 2969121,
573
+ "91": 3002017,
574
+ "92": 3034913,
575
+ "93": 3043394,
576
+ "94": 3076290,
577
+ "95": 3109186,
578
+ "96": 3142082,
579
+ "97": 3174978,
580
+ "98": 3207874,
581
+ "99": 3240770
582
+ },
583
+ "epoch": 10,
584
+ "incremental_checkpoint_token_usage": {
585
+ "1": 1521697,
586
+ "10": 0,
587
+ "11": 1521697,
588
+ "12": 0,
589
+ "13": 1521697,
590
+ "14": 0,
591
+ "15": 1521697,
592
+ "16": 0,
593
+ "17": 1521697,
594
+ "18": 0,
595
+ "19": 1521697,
596
+ "2": 0,
597
+ "20": 0,
598
+ "3": 1521697,
599
+ "4": 0,
600
+ "5": 1521697,
601
+ "6": 0,
602
+ "7": 1521697,
603
+ "8": 0,
604
+ "9": 1521697
605
+ },
606
+ "incremental_step_token_usage": {
607
+ "0": 32896,
608
+ "1": 32896,
609
+ "10": 32896,
610
+ "100": 32896,
611
+ "101": 32896,
612
+ "102": 32896,
613
+ "103": 32896,
614
+ "104": 32896,
615
+ "105": 32896,
616
+ "106": 32896,
617
+ "107": 32896,
618
+ "108": 32896,
619
+ "109": 32896,
620
+ "11": 32896,
621
+ "110": 32896,
622
+ "111": 32896,
623
+ "112": 32896,
624
+ "113": 32896,
625
+ "114": 32896,
626
+ "115": 32896,
627
+ "116": 32896,
628
+ "117": 32896,
629
+ "118": 32896,
630
+ "119": 32896,
631
+ "12": 32896,
632
+ "120": 32896,
633
+ "121": 32896,
634
+ "122": 32896,
635
+ "123": 32896,
636
+ "124": 32896,
637
+ "125": 32896,
638
+ "126": 32896,
639
+ "127": 32896,
640
+ "128": 32896,
641
+ "129": 32896,
642
+ "13": 32896,
643
+ "130": 32896,
644
+ "131": 32896,
645
+ "132": 32896,
646
+ "133": 32896,
647
+ "134": 32896,
648
+ "135": 32896,
649
+ "136": 32896,
650
+ "137": 32896,
651
+ "138": 32896,
652
+ "139": 32896,
653
+ "14": 32896,
654
+ "140": 8481,
655
+ "141": 32896,
656
+ "142": 32896,
657
+ "143": 32896,
658
+ "144": 32896,
659
+ "145": 32896,
660
+ "146": 32896,
661
+ "147": 32896,
662
+ "148": 32896,
663
+ "149": 32896,
664
+ "15": 32896,
665
+ "150": 32896,
666
+ "151": 32896,
667
+ "152": 32896,
668
+ "153": 32896,
669
+ "154": 32896,
670
+ "155": 32896,
671
+ "156": 32896,
672
+ "157": 32896,
673
+ "158": 32896,
674
+ "159": 32896,
675
+ "16": 32896,
676
+ "160": 32896,
677
+ "161": 32896,
678
+ "162": 32896,
679
+ "163": 32896,
680
+ "164": 32896,
681
+ "165": 32896,
682
+ "166": 32896,
683
+ "167": 32896,
684
+ "168": 32896,
685
+ "169": 32896,
686
+ "17": 32896,
687
+ "170": 32896,
688
+ "171": 32896,
689
+ "172": 32896,
690
+ "173": 32896,
691
+ "174": 32896,
692
+ "175": 32896,
693
+ "176": 32896,
694
+ "177": 32896,
695
+ "178": 32896,
696
+ "179": 32896,
697
+ "18": 32896,
698
+ "180": 32896,
699
+ "181": 32896,
700
+ "182": 32896,
701
+ "183": 32896,
702
+ "184": 32896,
703
+ "185": 32896,
704
+ "186": 32896,
705
+ "187": 8481,
706
+ "188": 32896,
707
+ "189": 32896,
708
+ "19": 32896,
709
+ "190": 32896,
710
+ "191": 32896,
711
+ "192": 32896,
712
+ "193": 32896,
713
+ "194": 32896,
714
+ "195": 32896,
715
+ "196": 32896,
716
+ "197": 32896,
717
+ "198": 32896,
718
+ "199": 32896,
719
+ "2": 32896,
720
+ "20": 32896,
721
+ "200": 32896,
722
+ "201": 32896,
723
+ "202": 32896,
724
+ "203": 32896,
725
+ "204": 32896,
726
+ "205": 32896,
727
+ "206": 32896,
728
+ "207": 32896,
729
+ "208": 32896,
730
+ "209": 32896,
731
+ "21": 32896,
732
+ "210": 32896,
733
+ "211": 32896,
734
+ "212": 32896,
735
+ "213": 32896,
736
+ "214": 32896,
737
+ "215": 32896,
738
+ "216": 32896,
739
+ "217": 32896,
740
+ "218": 32896,
741
+ "219": 32896,
742
+ "22": 32896,
743
+ "220": 32896,
744
+ "221": 32896,
745
+ "222": 32896,
746
+ "223": 32896,
747
+ "224": 32896,
748
+ "225": 32896,
749
+ "226": 32896,
750
+ "227": 32896,
751
+ "228": 32896,
752
+ "229": 32896,
753
+ "23": 32896,
754
+ "230": 32896,
755
+ "231": 32896,
756
+ "232": 32896,
757
+ "233": 32896,
758
+ "234": 8481,
759
+ "235": 32896,
760
+ "236": 32896,
761
+ "237": 32896,
762
+ "238": 32896,
763
+ "239": 32896,
764
+ "24": 32896,
765
+ "240": 32896,
766
+ "241": 32896,
767
+ "242": 32896,
768
+ "243": 32896,
769
+ "244": 32896,
770
+ "245": 32896,
771
+ "246": 32896,
772
+ "247": 32896,
773
+ "248": 32896,
774
+ "249": 32896,
775
+ "25": 32896,
776
+ "250": 32896,
777
+ "251": 32896,
778
+ "252": 32896,
779
+ "253": 32896,
780
+ "254": 32896,
781
+ "255": 32896,
782
+ "256": 32896,
783
+ "257": 32896,
784
+ "258": 32896,
785
+ "259": 32896,
786
+ "26": 32896,
787
+ "260": 32896,
788
+ "261": 32896,
789
+ "262": 32896,
790
+ "263": 32896,
791
+ "264": 32896,
792
+ "265": 32896,
793
+ "266": 32896,
794
+ "267": 32896,
795
+ "268": 32896,
796
+ "269": 32896,
797
+ "27": 32896,
798
+ "270": 32896,
799
+ "271": 32896,
800
+ "272": 32896,
801
+ "273": 32896,
802
+ "274": 32896,
803
+ "275": 32896,
804
+ "276": 32896,
805
+ "277": 32896,
806
+ "278": 32896,
807
+ "279": 32896,
808
+ "28": 32896,
809
+ "280": 32896,
810
+ "281": 8481,
811
+ "282": 32896,
812
+ "283": 32896,
813
+ "284": 32896,
814
+ "285": 32896,
815
+ "286": 32896,
816
+ "287": 32896,
817
+ "288": 32896,
818
+ "289": 32896,
819
+ "29": 32896,
820
+ "290": 32896,
821
+ "291": 32896,
822
+ "292": 32896,
823
+ "293": 32896,
824
+ "294": 32896,
825
+ "295": 32896,
826
+ "296": 32896,
827
+ "297": 32896,
828
+ "298": 32896,
829
+ "299": 32896,
830
+ "3": 32896,
831
+ "30": 32896,
832
+ "300": 32896,
833
+ "301": 32896,
834
+ "302": 32896,
835
+ "303": 32896,
836
+ "304": 32896,
837
+ "305": 32896,
838
+ "306": 32896,
839
+ "307": 32896,
840
+ "308": 32896,
841
+ "309": 32896,
842
+ "31": 32896,
843
+ "310": 32896,
844
+ "311": 32896,
845
+ "312": 32896,
846
+ "313": 32896,
847
+ "314": 32896,
848
+ "315": 32896,
849
+ "316": 32896,
850
+ "317": 32896,
851
+ "318": 32896,
852
+ "319": 32896,
853
+ "32": 32896,
854
+ "320": 32896,
855
+ "321": 32896,
856
+ "322": 32896,
857
+ "323": 32896,
858
+ "324": 32896,
859
+ "325": 32896,
860
+ "326": 32896,
861
+ "327": 32896,
862
+ "328": 8481,
863
+ "329": 32896,
864
+ "33": 32896,
865
+ "330": 32896,
866
+ "331": 32896,
867
+ "332": 32896,
868
+ "333": 32896,
869
+ "334": 32896,
870
+ "335": 32896,
871
+ "336": 32896,
872
+ "337": 32896,
873
+ "338": 32896,
874
+ "339": 32896,
875
+ "34": 32896,
876
+ "340": 32896,
877
+ "341": 32896,
878
+ "342": 32896,
879
+ "343": 32896,
880
+ "344": 32896,
881
+ "345": 32896,
882
+ "346": 32896,
883
+ "347": 32896,
884
+ "348": 32896,
885
+ "349": 32896,
886
+ "35": 32896,
887
+ "350": 32896,
888
+ "351": 32896,
889
+ "352": 32896,
890
+ "353": 32896,
891
+ "354": 32896,
892
+ "355": 32896,
893
+ "356": 32896,
894
+ "357": 32896,
895
+ "358": 32896,
896
+ "359": 32896,
897
+ "36": 32896,
898
+ "360": 32896,
899
+ "361": 32896,
900
+ "362": 32896,
901
+ "363": 32896,
902
+ "364": 32896,
903
+ "365": 32896,
904
+ "366": 32896,
905
+ "367": 32896,
906
+ "368": 32896,
907
+ "369": 32896,
908
+ "37": 32896,
909
+ "370": 32896,
910
+ "371": 32896,
911
+ "372": 32896,
912
+ "373": 32896,
913
+ "374": 32896,
914
+ "375": 8481,
915
+ "376": 32896,
916
+ "377": 32896,
917
+ "378": 32896,
918
+ "379": 32896,
919
+ "38": 32896,
920
+ "380": 32896,
921
+ "381": 32896,
922
+ "382": 32896,
923
+ "383": 32896,
924
+ "384": 32896,
925
+ "385": 32896,
926
+ "386": 32896,
927
+ "387": 32896,
928
+ "388": 32896,
929
+ "389": 32896,
930
+ "39": 32896,
931
+ "390": 32896,
932
+ "391": 32896,
933
+ "392": 32896,
934
+ "393": 32896,
935
+ "394": 32896,
936
+ "395": 32896,
937
+ "396": 32896,
938
+ "397": 32896,
939
+ "398": 32896,
940
+ "399": 32896,
941
+ "4": 32896,
942
+ "40": 32896,
943
+ "400": 32896,
944
+ "401": 32896,
945
+ "402": 32896,
946
+ "403": 32896,
947
+ "404": 32896,
948
+ "405": 32896,
949
+ "406": 32896,
950
+ "407": 32896,
951
+ "408": 32896,
952
+ "409": 32896,
953
+ "41": 32896,
954
+ "410": 32896,
955
+ "411": 32896,
956
+ "412": 32896,
957
+ "413": 32896,
958
+ "414": 32896,
959
+ "415": 32896,
960
+ "416": 32896,
961
+ "417": 32896,
962
+ "418": 32896,
963
+ "419": 32896,
964
+ "42": 32896,
965
+ "420": 32896,
966
+ "421": 32896,
967
+ "422": 8481,
968
+ "423": 32896,
969
+ "424": 32896,
970
+ "425": 32896,
971
+ "426": 32896,
972
+ "427": 32896,
973
+ "428": 32896,
974
+ "429": 32896,
975
+ "43": 32896,
976
+ "430": 32896,
977
+ "431": 32896,
978
+ "432": 32896,
979
+ "433": 32896,
980
+ "434": 32896,
981
+ "435": 32896,
982
+ "436": 32896,
983
+ "437": 32896,
984
+ "438": 32896,
985
+ "439": 32896,
986
+ "44": 32896,
987
+ "440": 32896,
988
+ "441": 32896,
989
+ "442": 32896,
990
+ "443": 32896,
991
+ "444": 32896,
992
+ "445": 32896,
993
+ "446": 32896,
994
+ "447": 32896,
995
+ "448": 32896,
996
+ "449": 32896,
997
+ "45": 32896,
998
+ "450": 32896,
999
+ "451": 32896,
1000
+ "452": 32896,
1001
+ "453": 32896,
1002
+ "454": 32896,
1003
+ "455": 32896,
1004
+ "456": 32896,
1005
+ "457": 32896,
1006
+ "458": 32896,
1007
+ "459": 32896,
1008
+ "46": 8481,
1009
+ "460": 32896,
1010
+ "461": 32896,
1011
+ "462": 32896,
1012
+ "463": 32896,
1013
+ "464": 32896,
1014
+ "465": 32896,
1015
+ "466": 32896,
1016
+ "467": 32896,
1017
+ "468": 32896,
1018
+ "469": 8481,
1019
+ "47": 32896,
1020
+ "48": 32896,
1021
+ "49": 32896,
1022
+ "5": 32896,
1023
+ "50": 32896,
1024
+ "51": 32896,
1025
+ "52": 32896,
1026
+ "53": 32896,
1027
+ "54": 32896,
1028
+ "55": 32896,
1029
+ "56": 32896,
1030
+ "57": 32896,
1031
+ "58": 32896,
1032
+ "59": 32896,
1033
+ "6": 32896,
1034
+ "60": 32896,
1035
+ "61": 32896,
1036
+ "62": 32896,
1037
+ "63": 32896,
1038
+ "64": 32896,
1039
+ "65": 32896,
1040
+ "66": 32896,
1041
+ "67": 32896,
1042
+ "68": 32896,
1043
+ "69": 32896,
1044
+ "7": 32896,
1045
+ "70": 32896,
1046
+ "71": 32896,
1047
+ "72": 32896,
1048
+ "73": 32896,
1049
+ "74": 32896,
1050
+ "75": 32896,
1051
+ "76": 32896,
1052
+ "77": 32896,
1053
+ "78": 32896,
1054
+ "79": 32896,
1055
+ "8": 32896,
1056
+ "80": 32896,
1057
+ "81": 32896,
1058
+ "82": 32896,
1059
+ "83": 32896,
1060
+ "84": 32896,
1061
+ "85": 32896,
1062
+ "86": 32896,
1063
+ "87": 32896,
1064
+ "88": 32896,
1065
+ "89": 32896,
1066
+ "9": 32896,
1067
+ "90": 32896,
1068
+ "91": 32896,
1069
+ "92": 32896,
1070
+ "93": 8481,
1071
+ "94": 32896,
1072
+ "95": 32896,
1073
+ "96": 32896,
1074
+ "97": 32896,
1075
+ "98": 32896,
1076
+ "99": 32896
1077
+ },
1078
+ "last_improvement_steps": 0,
1079
+ "last_increase_batch_size": 0,
1080
+ "last_increase_batch_size_eval_metric_improvement": 0,
1081
+ "last_increase_batch_size_steps": 0,
1082
+ "last_learning_rate_reduction": 0,
1083
+ "last_learning_rate_reduction_steps": 0,
1084
+ "learning_rate": 0.0009581637888400619,
1085
+ "llm_eval_examples": {},
1086
+ "num_increases_batch_size": 0,
1087
+ "num_reductions_learning_rate": 0,
1088
+ "steps": 470,
1089
+ "test_metrics": {
1090
+ "combined": {
1091
+ "loss": [
1092
+ [
1093
+ 1,
1094
+ 47,
1095
+ 4.140954494476318
1096
+ ],
1097
+ [
1098
+ 2,
1099
+ 94,
1100
+ 3.6341311931610107
1101
+ ],
1102
+ [
1103
+ 3,
1104
+ 141,
1105
+ 2.973945379257202
1106
+ ],
1107
+ [
1108
+ 4,
1109
+ 188,
1110
+ 2.604846239089966
1111
+ ],
1112
+ [
1113
+ 5,
1114
+ 235,
1115
+ 2.477090835571289
1116
+ ],
1117
+ [
1118
+ 6,
1119
+ 282,
1120
+ 2.765279769897461
1121
+ ],
1122
+ [
1123
+ 7,
1124
+ 329,
1125
+ 2.932941436767578
1126
+ ],
1127
+ [
1128
+ 8,
1129
+ 376,
1130
+ 2.916217565536499
1131
+ ],
1132
+ [
1133
+ 9,
1134
+ 423,
1135
+ 3.01550555229187
1136
+ ],
1137
+ [
1138
+ 10,
1139
+ 470,
1140
+ 3.0807435512542725
1141
+ ]
1142
+ ]
1143
+ },
1144
+ "intent": {
1145
+ "accuracy": [
1146
+ [
1147
+ 1,
1148
+ 47,
1149
+ 0.02062796801328659
1150
+ ],
1151
+ [
1152
+ 2,
1153
+ 94,
1154
+ 0.03668239712715149
1155
+ ],
1156
+ [
1157
+ 3,
1158
+ 141,
1159
+ 0.12673470377922058
1160
+ ],
1161
+ [
1162
+ 4,
1163
+ 188,
1164
+ 0.2651279866695404
1165
+ ],
1166
+ [
1167
+ 5,
1168
+ 235,
1169
+ 0.3786191940307617
1170
+ ],
1171
+ [
1172
+ 6,
1173
+ 282,
1174
+ 0.41484618186950684
1175
+ ],
1176
+ [
1177
+ 7,
1178
+ 329,
1179
+ 0.48310428857803345
1180
+ ],
1181
+ [
1182
+ 8,
1183
+ 376,
1184
+ 0.49936506152153015
1185
+ ],
1186
+ [
1187
+ 9,
1188
+ 423,
1189
+ 0.5275611281394958
1190
+ ],
1191
+ [
1192
+ 10,
1193
+ 470,
1194
+ 0.5496426820755005
1195
+ ]
1196
+ ],
1197
+ "accuracy_micro": [
1198
+ [
1199
+ 1,
1200
+ 47,
1201
+ 0.05730659142136574
1202
+ ],
1203
+ [
1204
+ 2,
1205
+ 94,
1206
+ 0.10028653591871262
1207
+ ],
1208
+ [
1209
+ 3,
1210
+ 141,
1211
+ 0.266475647687912
1212
+ ],
1213
+ [
1214
+ 4,
1215
+ 188,
1216
+ 0.3982807993888855
1217
+ ],
1218
+ [
1219
+ 5,
1220
+ 235,
1221
+ 0.4871060252189636
1222
+ ],
1223
+ [
1224
+ 6,
1225
+ 282,
1226
+ 0.4871060252189636
1227
+ ],
1228
+ [
1229
+ 7,
1230
+ 329,
1231
+ 0.5587392449378967
1232
+ ],
1233
+ [
1234
+ 8,
1235
+ 376,
1236
+ 0.5415472984313965
1237
+ ],
1238
+ [
1239
+ 9,
1240
+ 423,
1241
+ 0.5759312510490417
1242
+ ],
1243
+ [
1244
+ 10,
1245
+ 470,
1246
+ 0.5959885120391846
1247
+ ]
1248
+ ],
1249
+ "hits_at_k": [
1250
+ [
1251
+ 1,
1252
+ 47,
1253
+ 0.052861444652080536
1254
+ ],
1255
+ [
1256
+ 2,
1257
+ 94,
1258
+ 0.11137306690216064
1259
+ ],
1260
+ [
1261
+ 3,
1262
+ 141,
1263
+ 0.25743797421455383
1264
+ ],
1265
+ [
1266
+ 4,
1267
+ 188,
1268
+ 0.4437764883041382
1269
+ ],
1270
+ [
1271
+ 5,
1272
+ 235,
1273
+ 0.5734579563140869
1274
+ ],
1275
+ [
1276
+ 6,
1277
+ 282,
1278
+ 0.6254034638404846
1279
+ ],
1280
+ [
1281
+ 7,
1282
+ 329,
1283
+ 0.6468311548233032
1284
+ ],
1285
+ [
1286
+ 8,
1287
+ 376,
1288
+ 0.6431319713592529
1289
+ ],
1290
+ [
1291
+ 9,
1292
+ 423,
1293
+ 0.6786106824874878
1294
+ ],
1295
+ [
1296
+ 10,
1297
+ 470,
1298
+ 0.6660665273666382
1299
+ ]
1300
+ ],
1301
+ "loss": [
1302
+ [
1303
+ 1,
1304
+ 47,
1305
+ 4.140954494476318
1306
+ ],
1307
+ [
1308
+ 2,
1309
+ 94,
1310
+ 3.6341311931610107
1311
+ ],
1312
+ [
1313
+ 3,
1314
+ 141,
1315
+ 2.973945379257202
1316
+ ],
1317
+ [
1318
+ 4,
1319
+ 188,
1320
+ 2.604846239089966
1321
+ ],
1322
+ [
1323
+ 5,
1324
+ 235,
1325
+ 2.477090835571289
1326
+ ],
1327
+ [
1328
+ 6,
1329
+ 282,
1330
+ 2.765279769897461
1331
+ ],
1332
+ [
1333
+ 7,
1334
+ 329,
1335
+ 2.932941436767578
1336
+ ],
1337
+ [
1338
+ 8,
1339
+ 376,
1340
+ 2.916217565536499
1341
+ ],
1342
+ [
1343
+ 9,
1344
+ 423,
1345
+ 3.01550555229187
1346
+ ],
1347
+ [
1348
+ 10,
1349
+ 470,
1350
+ 3.0807435512542725
1351
+ ]
1352
+ ],
1353
+ "roc_auc": [
1354
+ [
1355
+ 1,
1356
+ 47,
1357
+ 0.6999472975730896
1358
+ ],
1359
+ [
1360
+ 2,
1361
+ 94,
1362
+ 0.8169810771942139
1363
+ ],
1364
+ [
1365
+ 3,
1366
+ 141,
1367
+ 0.8789530992507935
1368
+ ],
1369
+ [
1370
+ 4,
1371
+ 188,
1372
+ 0.9105718731880188
1373
+ ],
1374
+ [
1375
+ 5,
1376
+ 235,
1377
+ 0.9285396337509155
1378
+ ],
1379
+ [
1380
+ 6,
1381
+ 282,
1382
+ 0.932953953742981
1383
+ ],
1384
+ [
1385
+ 7,
1386
+ 329,
1387
+ 0.9334519505500793
1388
+ ],
1389
+ [
1390
+ 8,
1391
+ 376,
1392
+ 0.9398418664932251
1393
+ ],
1394
+ [
1395
+ 9,
1396
+ 423,
1397
+ 0.9440649747848511
1398
+ ],
1399
+ [
1400
+ 10,
1401
+ 470,
1402
+ 0.9340102672576904
1403
+ ]
1404
+ ]
1405
+ }
1406
+ },
1407
+ "total_tokens_used": 15216970,
1408
+ "train_metrics": {
1409
+ "combined": {
1410
+ "loss": [
1411
+ [
1412
+ 1,
1413
+ 47,
1414
+ 4.941826820373535
1415
+ ],
1416
+ [
1417
+ 2,
1418
+ 94,
1419
+ 3.8220131397247314
1420
+ ],
1421
+ [
1422
+ 3,
1423
+ 141,
1424
+ 2.966855049133301
1425
+ ],
1426
+ [
1427
+ 4,
1428
+ 188,
1429
+ 1.9691708087921143
1430
+ ],
1431
+ [
1432
+ 5,
1433
+ 235,
1434
+ 1.1989307403564453
1435
+ ],
1436
+ [
1437
+ 6,
1438
+ 282,
1439
+ 0.7208091020584106
1440
+ ],
1441
+ [
1442
+ 7,
1443
+ 329,
1444
+ 0.41259047389030457
1445
+ ],
1446
+ [
1447
+ 8,
1448
+ 376,
1449
+ 0.2844356894493103
1450
+ ],
1451
+ [
1452
+ 9,
1453
+ 423,
1454
+ 0.20260311663150787
1455
+ ],
1456
+ [
1457
+ 10,
1458
+ 470,
1459
+ 0.15086334943771362
1460
+ ]
1461
+ ]
1462
+ },
1463
+ "intent": {
1464
+ "accuracy": [
1465
+ [
1466
+ 1,
1467
+ 47,
1468
+ 0.014659089967608452
1469
+ ],
1470
+ [
1471
+ 2,
1472
+ 94,
1473
+ 0.03883907198905945
1474
+ ],
1475
+ [
1476
+ 3,
1477
+ 141,
1478
+ 0.10787460207939148
1479
+ ],
1480
+ [
1481
+ 4,
1482
+ 188,
1483
+ 0.25457778573036194
1484
+ ],
1485
+ [
1486
+ 5,
1487
+ 235,
1488
+ 0.4590109586715698
1489
+ ],
1490
+ [
1491
+ 6,
1492
+ 282,
1493
+ 0.653484046459198
1494
+ ],
1495
+ [
1496
+ 7,
1497
+ 329,
1498
+ 0.8075626492500305
1499
+ ],
1500
+ [
1501
+ 8,
1502
+ 376,
1503
+ 0.8613330721855164
1504
+ ],
1505
+ [
1506
+ 9,
1507
+ 423,
1508
+ 0.9029062986373901
1509
+ ],
1510
+ [
1511
+ 10,
1512
+ 470,
1513
+ 0.9410130977630615
1514
+ ]
1515
+ ],
1516
+ "accuracy_micro": [
1517
+ [
1518
+ 1,
1519
+ 47,
1520
+ 0.035635873675346375
1521
+ ],
1522
+ [
1523
+ 2,
1524
+ 94,
1525
+ 0.09812531620264053
1526
+ ],
1527
+ [
1528
+ 3,
1529
+ 141,
1530
+ 0.23492653667926788
1531
+ ],
1532
+ [
1533
+ 4,
1534
+ 188,
1535
+ 0.4457017481327057
1536
+ ],
1537
+ [
1538
+ 5,
1539
+ 235,
1540
+ 0.6433035135269165
1541
+ ],
1542
+ [
1543
+ 6,
1544
+ 282,
1545
+ 0.7851714491844177
1546
+ ],
1547
+ [
1548
+ 7,
1549
+ 329,
1550
+ 0.8792433738708496
1551
+ ],
1552
+ [
1553
+ 8,
1554
+ 376,
1555
+ 0.9142037034034729
1556
+ ],
1557
+ [
1558
+ 9,
1559
+ 423,
1560
+ 0.9376794695854187
1561
+ ],
1562
+ [
1563
+ 10,
1564
+ 470,
1565
+ 0.9574396014213562
1566
+ ]
1567
+ ],
1568
+ "hits_at_k": [
1569
+ [
1570
+ 1,
1571
+ 47,
1572
+ 0.03866136819124222
1573
+ ],
1574
+ [
1575
+ 2,
1576
+ 94,
1577
+ 0.09584441781044006
1578
+ ],
1579
+ [
1580
+ 3,
1581
+ 141,
1582
+ 0.2281757891178131
1583
+ ],
1584
+ [
1585
+ 4,
1586
+ 188,
1587
+ 0.46207964420318604
1588
+ ],
1589
+ [
1590
+ 5,
1591
+ 235,
1592
+ 0.700287401676178
1593
+ ],
1594
+ [
1595
+ 6,
1596
+ 282,
1597
+ 0.876828670501709
1598
+ ],
1599
+ [
1600
+ 7,
1601
+ 329,
1602
+ 0.9502895474433899
1603
+ ],
1604
+ [
1605
+ 8,
1606
+ 376,
1607
+ 0.9748519659042358
1608
+ ],
1609
+ [
1610
+ 9,
1611
+ 423,
1612
+ 0.985029935836792
1613
+ ],
1614
+ [
1615
+ 10,
1616
+ 470,
1617
+ 0.9925163984298706
1618
+ ]
1619
+ ],
1620
+ "loss": [
1621
+ [
1622
+ 1,
1623
+ 47,
1624
+ 4.941826820373535
1625
+ ],
1626
+ [
1627
+ 2,
1628
+ 94,
1629
+ 3.8220131397247314
1630
+ ],
1631
+ [
1632
+ 3,
1633
+ 141,
1634
+ 2.966855049133301
1635
+ ],
1636
+ [
1637
+ 4,
1638
+ 188,
1639
+ 1.9691708087921143
1640
+ ],
1641
+ [
1642
+ 5,
1643
+ 235,
1644
+ 1.1989307403564453
1645
+ ],
1646
+ [
1647
+ 6,
1648
+ 282,
1649
+ 0.7208091020584106
1650
+ ],
1651
+ [
1652
+ 7,
1653
+ 329,
1654
+ 0.41259047389030457
1655
+ ],
1656
+ [
1657
+ 8,
1658
+ 376,
1659
+ 0.2844356894493103
1660
+ ],
1661
+ [
1662
+ 9,
1663
+ 423,
1664
+ 0.20260311663150787
1665
+ ],
1666
+ [
1667
+ 10,
1668
+ 470,
1669
+ 0.15086334943771362
1670
+ ]
1671
+ ],
1672
+ "roc_auc": [
1673
+ [
1674
+ 1,
1675
+ 47,
1676
+ 0.5121718645095825
1677
+ ],
1678
+ [
1679
+ 2,
1680
+ 94,
1681
+ 0.7023259997367859
1682
+ ],
1683
+ [
1684
+ 3,
1685
+ 141,
1686
+ 0.8708662986755371
1687
+ ],
1688
+ [
1689
+ 4,
1690
+ 188,
1691
+ 0.9513766765594482
1692
+ ],
1693
+ [
1694
+ 5,
1695
+ 235,
1696
+ 0.98272705078125
1697
+ ],
1698
+ [
1699
+ 6,
1700
+ 282,
1701
+ 0.9933627843856812
1702
+ ],
1703
+ [
1704
+ 7,
1705
+ 329,
1706
+ 0.997870147228241
1707
+ ],
1708
+ [
1709
+ 8,
1710
+ 376,
1711
+ 0.9987038969993591
1712
+ ],
1713
+ [
1714
+ 9,
1715
+ 423,
1716
+ 0.999286949634552
1717
+ ],
1718
+ [
1719
+ 10,
1720
+ 470,
1721
+ 0.9996311664581299
1722
+ ]
1723
+ ]
1724
+ }
1725
+ },
1726
+ "tune_checkpoint_num": 0,
1727
+ "validation_metrics": {
1728
+ "combined": {
1729
+ "loss": [
1730
+ [
1731
+ 1,
1732
+ 47,
1733
+ 4.075289249420166
1734
+ ],
1735
+ [
1736
+ 2,
1737
+ 94,
1738
+ 3.5391108989715576
1739
+ ],
1740
+ [
1741
+ 3,
1742
+ 141,
1743
+ 2.817091703414917
1744
+ ],
1745
+ [
1746
+ 4,
1747
+ 188,
1748
+ 2.289855718612671
1749
+ ],
1750
+ [
1751
+ 5,
1752
+ 235,
1753
+ 2.167616605758667
1754
+ ],
1755
+ [
1756
+ 6,
1757
+ 282,
1758
+ 2.3362152576446533
1759
+ ],
1760
+ [
1761
+ 7,
1762
+ 329,
1763
+ 2.3229939937591553
1764
+ ],
1765
+ [
1766
+ 8,
1767
+ 376,
1768
+ 2.545104742050171
1769
+ ],
1770
+ [
1771
+ 9,
1772
+ 423,
1773
+ 2.641582489013672
1774
+ ],
1775
+ [
1776
+ 10,
1777
+ 470,
1778
+ 2.5151546001434326
1779
+ ]
1780
+ ]
1781
+ },
1782
+ "intent": {
1783
+ "accuracy": [
1784
+ [
1785
+ 1,
1786
+ 47,
1787
+ 0.02408008836209774
1788
+ ],
1789
+ [
1790
+ 2,
1791
+ 94,
1792
+ 0.039156392216682434
1793
+ ],
1794
+ [
1795
+ 3,
1796
+ 141,
1797
+ 0.13850188255310059
1798
+ ],
1799
+ [
1800
+ 4,
1801
+ 188,
1802
+ 0.262044221162796
1803
+ ],
1804
+ [
1805
+ 5,
1806
+ 235,
1807
+ 0.4144769310951233
1808
+ ],
1809
+ [
1810
+ 6,
1811
+ 282,
1812
+ 0.4744482636451721
1813
+ ],
1814
+ [
1815
+ 7,
1816
+ 329,
1817
+ 0.5366732478141785
1818
+ ],
1819
+ [
1820
+ 8,
1821
+ 376,
1822
+ 0.546140730381012
1823
+ ],
1824
+ [
1825
+ 9,
1826
+ 423,
1827
+ 0.5821728706359863
1828
+ ],
1829
+ [
1830
+ 10,
1831
+ 470,
1832
+ 0.6166250705718994
1833
+ ]
1834
+ ],
1835
+ "accuracy_micro": [
1836
+ [
1837
+ 1,
1838
+ 47,
1839
+ 0.06743185222148895
1840
+ ],
1841
+ [
1842
+ 2,
1843
+ 94,
1844
+ 0.09899569302797318
1845
+ ],
1846
+ [
1847
+ 3,
1848
+ 141,
1849
+ 0.28263989090919495
1850
+ ],
1851
+ [
1852
+ 4,
1853
+ 188,
1854
+ 0.4189383089542389
1855
+ ],
1856
+ [
1857
+ 5,
1858
+ 235,
1859
+ 0.515064537525177
1860
+ ],
1861
+ [
1862
+ 6,
1863
+ 282,
1864
+ 0.5451936721801758
1865
+ ],
1866
+ [
1867
+ 7,
1868
+ 329,
1869
+ 0.6011477708816528
1870
+ ],
1871
+ [
1872
+ 8,
1873
+ 376,
1874
+ 0.5810617208480835
1875
+ ],
1876
+ [
1877
+ 9,
1878
+ 423,
1879
+ 0.5968436002731323
1880
+ ],
1881
+ [
1882
+ 10,
1883
+ 470,
1884
+ 0.63271164894104
1885
+ ]
1886
+ ],
1887
+ "hits_at_k": [
1888
+ [
1889
+ 1,
1890
+ 47,
1891
+ 0.0595182403922081
1892
+ ],
1893
+ [
1894
+ 2,
1895
+ 94,
1896
+ 0.12082408368587494
1897
+ ],
1898
+ [
1899
+ 3,
1900
+ 141,
1901
+ 0.28157058358192444
1902
+ ],
1903
+ [
1904
+ 4,
1905
+ 188,
1906
+ 0.4951961934566498
1907
+ ],
1908
+ [
1909
+ 5,
1910
+ 235,
1911
+ 0.60570228099823
1912
+ ],
1913
+ [
1914
+ 6,
1915
+ 282,
1916
+ 0.6759977340698242
1917
+ ],
1918
+ [
1919
+ 7,
1920
+ 329,
1921
+ 0.7160040140151978
1922
+ ],
1923
+ [
1924
+ 8,
1925
+ 376,
1926
+ 0.7496565580368042
1927
+ ],
1928
+ [
1929
+ 9,
1930
+ 423,
1931
+ 0.7678131461143494
1932
+ ],
1933
+ [
1934
+ 10,
1935
+ 470,
1936
+ 0.7617202997207642
1937
+ ]
1938
+ ],
1939
+ "loss": [
1940
+ [
1941
+ 1,
1942
+ 47,
1943
+ 4.075289249420166
1944
+ ],
1945
+ [
1946
+ 2,
1947
+ 94,
1948
+ 3.5391108989715576
1949
+ ],
1950
+ [
1951
+ 3,
1952
+ 141,
1953
+ 2.817091703414917
1954
+ ],
1955
+ [
1956
+ 4,
1957
+ 188,
1958
+ 2.289855718612671
1959
+ ],
1960
+ [
1961
+ 5,
1962
+ 235,
1963
+ 2.167616605758667
1964
+ ],
1965
+ [
1966
+ 6,
1967
+ 282,
1968
+ 2.3362152576446533
1969
+ ],
1970
+ [
1971
+ 7,
1972
+ 329,
1973
+ 2.3229939937591553
1974
+ ],
1975
+ [
1976
+ 8,
1977
+ 376,
1978
+ 2.545104742050171
1979
+ ],
1980
+ [
1981
+ 9,
1982
+ 423,
1983
+ 2.641582489013672
1984
+ ],
1985
+ [
1986
+ 10,
1987
+ 470,
1988
+ 2.5151546001434326
1989
+ ]
1990
+ ],
1991
+ "roc_auc": [
1992
+ [
1993
+ 1,
1994
+ 47,
1995
+ 0.7134010791778564
1996
+ ],
1997
+ [
1998
+ 2,
1999
+ 94,
2000
+ 0.8469101190567017
2001
+ ],
2002
+ [
2003
+ 3,
2004
+ 141,
2005
+ 0.9105364680290222
2006
+ ],
2007
+ [
2008
+ 4,
2009
+ 188,
2010
+ 0.9462321400642395
2011
+ ],
2012
+ [
2013
+ 5,
2014
+ 235,
2015
+ 0.955407440662384
2016
+ ],
2017
+ [
2018
+ 6,
2019
+ 282,
2020
+ 0.9614531993865967
2021
+ ],
2022
+ [
2023
+ 7,
2024
+ 329,
2025
+ 0.9639908075332642
2026
+ ],
2027
+ [
2028
+ 8,
2029
+ 376,
2030
+ 0.9642417430877686
2031
+ ],
2032
+ [
2033
+ 9,
2034
+ 423,
2035
+ 0.9641472697257996
2036
+ ],
2037
+ [
2038
+ 10,
2039
+ 470,
2040
+ 0.9704092144966125
2041
+ ]
2042
+ ]
2043
+ }
2044
+ }
2045
+ }
model/training_set_metadata.json ADDED
The diff for this file is too large to render. See raw diff
 
training_statistics.json ADDED
@@ -0,0 +1,240 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "evaluation_frequency": {
3
+ "frequency": 1,
4
+ "period": "epoch"
5
+ },
6
+ "test": {
7
+ "combined": {
8
+ "loss": [
9
+ 4.140954494476318,
10
+ 3.6341311931610107,
11
+ 2.973945379257202,
12
+ 2.604846239089966,
13
+ 2.477090835571289,
14
+ 2.765279769897461,
15
+ 2.932941436767578,
16
+ 2.916217565536499,
17
+ 3.01550555229187,
18
+ 3.0807435512542725
19
+ ]
20
+ },
21
+ "intent": {
22
+ "accuracy": [
23
+ 0.02062796801328659,
24
+ 0.03668239712715149,
25
+ 0.12673470377922058,
26
+ 0.2651279866695404,
27
+ 0.3786191940307617,
28
+ 0.41484618186950684,
29
+ 0.48310428857803345,
30
+ 0.49936506152153015,
31
+ 0.5275611281394958,
32
+ 0.5496426820755005
33
+ ],
34
+ "accuracy_micro": [
35
+ 0.05730659142136574,
36
+ 0.10028653591871262,
37
+ 0.266475647687912,
38
+ 0.3982807993888855,
39
+ 0.4871060252189636,
40
+ 0.4871060252189636,
41
+ 0.5587392449378967,
42
+ 0.5415472984313965,
43
+ 0.5759312510490417,
44
+ 0.5959885120391846
45
+ ],
46
+ "hits_at_k": [
47
+ 0.052861444652080536,
48
+ 0.11137306690216064,
49
+ 0.25743797421455383,
50
+ 0.4437764883041382,
51
+ 0.5734579563140869,
52
+ 0.6254034638404846,
53
+ 0.6468311548233032,
54
+ 0.6431319713592529,
55
+ 0.6786106824874878,
56
+ 0.6660665273666382
57
+ ],
58
+ "loss": [
59
+ 4.140954494476318,
60
+ 3.6341311931610107,
61
+ 2.973945379257202,
62
+ 2.604846239089966,
63
+ 2.477090835571289,
64
+ 2.765279769897461,
65
+ 2.932941436767578,
66
+ 2.916217565536499,
67
+ 3.01550555229187,
68
+ 3.0807435512542725
69
+ ],
70
+ "roc_auc": [
71
+ 0.6999472975730896,
72
+ 0.8169810771942139,
73
+ 0.8789530992507935,
74
+ 0.9105718731880188,
75
+ 0.9285396337509155,
76
+ 0.932953953742981,
77
+ 0.9334519505500793,
78
+ 0.9398418664932251,
79
+ 0.9440649747848511,
80
+ 0.9340102672576904
81
+ ]
82
+ }
83
+ },
84
+ "training": {
85
+ "combined": {
86
+ "loss": [
87
+ 4.941826820373535,
88
+ 3.8220131397247314,
89
+ 2.966855049133301,
90
+ 1.9691708087921143,
91
+ 1.1989307403564453,
92
+ 0.7208091020584106,
93
+ 0.41259047389030457,
94
+ 0.2844356894493103,
95
+ 0.20260311663150787,
96
+ 0.15086334943771362
97
+ ]
98
+ },
99
+ "intent": {
100
+ "accuracy": [
101
+ 0.014659089967608452,
102
+ 0.03883907198905945,
103
+ 0.10787460207939148,
104
+ 0.25457778573036194,
105
+ 0.4590109586715698,
106
+ 0.653484046459198,
107
+ 0.8075626492500305,
108
+ 0.8613330721855164,
109
+ 0.9029062986373901,
110
+ 0.9410130977630615
111
+ ],
112
+ "accuracy_micro": [
113
+ 0.035635873675346375,
114
+ 0.09812531620264053,
115
+ 0.23492653667926788,
116
+ 0.4457017481327057,
117
+ 0.6433035135269165,
118
+ 0.7851714491844177,
119
+ 0.8792433738708496,
120
+ 0.9142037034034729,
121
+ 0.9376794695854187,
122
+ 0.9574396014213562
123
+ ],
124
+ "hits_at_k": [
125
+ 0.03866136819124222,
126
+ 0.09584441781044006,
127
+ 0.2281757891178131,
128
+ 0.46207964420318604,
129
+ 0.700287401676178,
130
+ 0.876828670501709,
131
+ 0.9502895474433899,
132
+ 0.9748519659042358,
133
+ 0.985029935836792,
134
+ 0.9925163984298706
135
+ ],
136
+ "loss": [
137
+ 4.941826820373535,
138
+ 3.8220131397247314,
139
+ 2.966855049133301,
140
+ 1.9691708087921143,
141
+ 1.1989307403564453,
142
+ 0.7208091020584106,
143
+ 0.41259047389030457,
144
+ 0.2844356894493103,
145
+ 0.20260311663150787,
146
+ 0.15086334943771362
147
+ ],
148
+ "roc_auc": [
149
+ 0.5121718645095825,
150
+ 0.7023259997367859,
151
+ 0.8708662986755371,
152
+ 0.9513766765594482,
153
+ 0.98272705078125,
154
+ 0.9933627843856812,
155
+ 0.997870147228241,
156
+ 0.9987038969993591,
157
+ 0.999286949634552,
158
+ 0.9996311664581299
159
+ ]
160
+ }
161
+ },
162
+ "validation": {
163
+ "combined": {
164
+ "loss": [
165
+ 4.075289249420166,
166
+ 3.5391108989715576,
167
+ 2.817091703414917,
168
+ 2.289855718612671,
169
+ 2.167616605758667,
170
+ 2.3362152576446533,
171
+ 2.3229939937591553,
172
+ 2.545104742050171,
173
+ 2.641582489013672,
174
+ 2.5151546001434326
175
+ ]
176
+ },
177
+ "intent": {
178
+ "accuracy": [
179
+ 0.02408008836209774,
180
+ 0.039156392216682434,
181
+ 0.13850188255310059,
182
+ 0.262044221162796,
183
+ 0.4144769310951233,
184
+ 0.4744482636451721,
185
+ 0.5366732478141785,
186
+ 0.546140730381012,
187
+ 0.5821728706359863,
188
+ 0.6166250705718994
189
+ ],
190
+ "accuracy_micro": [
191
+ 0.06743185222148895,
192
+ 0.09899569302797318,
193
+ 0.28263989090919495,
194
+ 0.4189383089542389,
195
+ 0.515064537525177,
196
+ 0.5451936721801758,
197
+ 0.6011477708816528,
198
+ 0.5810617208480835,
199
+ 0.5968436002731323,
200
+ 0.63271164894104
201
+ ],
202
+ "hits_at_k": [
203
+ 0.0595182403922081,
204
+ 0.12082408368587494,
205
+ 0.28157058358192444,
206
+ 0.4951961934566498,
207
+ 0.60570228099823,
208
+ 0.6759977340698242,
209
+ 0.7160040140151978,
210
+ 0.7496565580368042,
211
+ 0.7678131461143494,
212
+ 0.7617202997207642
213
+ ],
214
+ "loss": [
215
+ 4.075289249420166,
216
+ 3.5391108989715576,
217
+ 2.817091703414917,
218
+ 2.289855718612671,
219
+ 2.167616605758667,
220
+ 2.3362152576446533,
221
+ 2.3229939937591553,
222
+ 2.545104742050171,
223
+ 2.641582489013672,
224
+ 2.5151546001434326
225
+ ],
226
+ "roc_auc": [
227
+ 0.7134010791778564,
228
+ 0.8469101190567017,
229
+ 0.9105364680290222,
230
+ 0.9462321400642395,
231
+ 0.955407440662384,
232
+ 0.9614531993865967,
233
+ 0.9639908075332642,
234
+ 0.9642417430877686,
235
+ 0.9641472697257996,
236
+ 0.9704092144966125
237
+ ]
238
+ }
239
+ }
240
+ }