End of training
Browse files
all_results.json
CHANGED
@@ -1,12 +1,12 @@
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
"eval_loss": 0.27755075693130493,
|
4 |
-
"eval_runtime":
|
5 |
"eval_samples_per_second": 0.418,
|
6 |
"eval_steps_per_second": 0.07,
|
7 |
"eval_wer": 12.51522533495737,
|
8 |
-
"train_loss": 0.
|
9 |
-
"train_runtime":
|
10 |
-
"train_samples_per_second":
|
11 |
-
"train_steps_per_second":
|
12 |
}
|
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
"eval_loss": 0.27755075693130493,
|
4 |
+
"eval_runtime": 385.5995,
|
5 |
"eval_samples_per_second": 0.418,
|
6 |
"eval_steps_per_second": 0.07,
|
7 |
"eval_wer": 12.51522533495737,
|
8 |
+
"train_loss": 0.00010507909137471822,
|
9 |
+
"train_runtime": 167.7323,
|
10 |
+
"train_samples_per_second": 357.713,
|
11 |
+
"train_steps_per_second": 29.809
|
12 |
}
|
eval_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
"eval_loss": 0.27755075693130493,
|
4 |
-
"eval_runtime":
|
5 |
"eval_samples_per_second": 0.418,
|
6 |
"eval_steps_per_second": 0.07,
|
7 |
"eval_wer": 12.51522533495737
|
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
"eval_loss": 0.27755075693130493,
|
4 |
+
"eval_runtime": 385.5995,
|
5 |
"eval_samples_per_second": 0.418,
|
6 |
"eval_steps_per_second": 0.07,
|
7 |
"eval_wer": 12.51522533495737
|
runs/Dec10_21-10-13_dante/events.out.tfevents.1670703878.dante.3904631.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fd8ce3059c2b75f54be418a4e22c49836ae752e23b2eb07db72e304fbd3626e
|
3 |
+
size 358
|
train_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
-
"train_loss": 0.
|
4 |
-
"train_runtime":
|
5 |
-
"train_samples_per_second":
|
6 |
-
"train_steps_per_second":
|
7 |
}
|
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
+
"train_loss": 0.00010507909137471822,
|
4 |
+
"train_runtime": 167.7323,
|
5 |
+
"train_samples_per_second": 357.713,
|
6 |
+
"train_steps_per_second": 29.809
|
7 |
}
|
trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": 12.51522533495737,
|
3 |
"best_model_checkpoint": "./checkpoint-5000",
|
4 |
-
"epoch": 1.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -1254,17 +1254,17 @@
|
|
1254 |
},
|
1255 |
{
|
1256 |
"epoch": 1.0,
|
1257 |
-
"step":
|
1258 |
-
"total_flos": 1.
|
1259 |
-
"train_loss": 0.
|
1260 |
-
"train_runtime":
|
1261 |
-
"train_samples_per_second":
|
1262 |
-
"train_steps_per_second":
|
1263 |
}
|
1264 |
],
|
1265 |
"max_steps": 5000,
|
1266 |
"num_train_epochs": 9223372036854775807,
|
1267 |
-
"total_flos": 1.
|
1268 |
"trial_name": null,
|
1269 |
"trial_params": null
|
1270 |
}
|
|
|
1 |
{
|
2 |
"best_metric": 12.51522533495737,
|
3 |
"best_model_checkpoint": "./checkpoint-5000",
|
4 |
+
"epoch": 1.0002,
|
5 |
+
"global_step": 5001,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
1254 |
},
|
1255 |
{
|
1256 |
"epoch": 1.0,
|
1257 |
+
"step": 5001,
|
1258 |
+
"total_flos": 1.2741573362483357e+20,
|
1259 |
+
"train_loss": 0.00010507909137471822,
|
1260 |
+
"train_runtime": 167.7323,
|
1261 |
+
"train_samples_per_second": 357.713,
|
1262 |
+
"train_steps_per_second": 29.809
|
1263 |
}
|
1264 |
],
|
1265 |
"max_steps": 5000,
|
1266 |
"num_train_epochs": 9223372036854775807,
|
1267 |
+
"total_flos": 1.2741573362483357e+20,
|
1268 |
"trial_name": null,
|
1269 |
"trial_params": null
|
1270 |
}
|