Training in progress, step 36000
Browse files
all_results.json
CHANGED
@@ -5,8 +5,8 @@
|
|
5 |
"eval_samples_per_second": 0.81,
|
6 |
"eval_steps_per_second": 0.203,
|
7 |
"eval_wer": 29.205723913714138,
|
8 |
-
"train_loss":
|
9 |
-
"train_runtime":
|
10 |
-
"train_samples_per_second":
|
11 |
-
"train_steps_per_second":
|
12 |
}
|
|
|
5 |
"eval_samples_per_second": 0.81,
|
6 |
"eval_steps_per_second": 0.203,
|
7 |
"eval_wer": 29.205723913714138,
|
8 |
+
"train_loss": 1.5390448555129346e-05,
|
9 |
+
"train_runtime": 6.8399,
|
10 |
+
"train_samples_per_second": 40936.549,
|
11 |
+
"train_steps_per_second": 5117.069
|
12 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4936567968
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2793cdc0144994fe021fe306cd3dab078f8e2a27184dc7a8734c2650705c9db5
|
3 |
size 4936567968
|
runs/Feb04_08-43-21_ip-10-0-3-5.eu-west-1.compute.internal/events.out.tfevents.1707036244.ip-10-0-3-5.eu-west-1.compute.internal.10679.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11a6a682062abf19d149cbf3e928b6f72a7b99231e75383176c59544e5e7a8a9
|
3 |
+
size 11942
|
train_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 0.18,
|
3 |
-
"train_loss":
|
4 |
-
"train_runtime":
|
5 |
-
"train_samples_per_second":
|
6 |
-
"train_steps_per_second":
|
7 |
}
|
|
|
1 |
{
|
2 |
"epoch": 0.18,
|
3 |
+
"train_loss": 1.5390448555129346e-05,
|
4 |
+
"train_runtime": 6.8399,
|
5 |
+
"train_samples_per_second": 40936.549,
|
6 |
+
"train_steps_per_second": 5117.069
|
7 |
}
|
trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 29.205723913714138,
|
3 |
"best_model_checkpoint": "./hamsa-pretrained/checkpoint-35000",
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 1000,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -8725,12 +8725,12 @@
|
|
8725 |
},
|
8726 |
{
|
8727 |
"epoch": 0.18,
|
8728 |
-
"step":
|
8729 |
-
"total_flos": 4.
|
8730 |
-
"train_loss":
|
8731 |
-
"train_runtime":
|
8732 |
-
"train_samples_per_second":
|
8733 |
-
"train_steps_per_second":
|
8734 |
}
|
8735 |
],
|
8736 |
"logging_steps": 25,
|
@@ -8738,7 +8738,7 @@
|
|
8738 |
"num_input_tokens_seen": 0,
|
8739 |
"num_train_epochs": 1,
|
8740 |
"save_steps": 1000,
|
8741 |
-
"total_flos": 4.
|
8742 |
"train_batch_size": 8,
|
8743 |
"trial_name": null,
|
8744 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 29.205723913714138,
|
3 |
"best_model_checkpoint": "./hamsa-pretrained/checkpoint-35000",
|
4 |
+
"epoch": 0.17544536787336215,
|
5 |
"eval_steps": 1000,
|
6 |
+
"global_step": 35001,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
8725 |
},
|
8726 |
{
|
8727 |
"epoch": 0.18,
|
8728 |
+
"step": 35001,
|
8729 |
+
"total_flos": 4.7538258866601984e+20,
|
8730 |
+
"train_loss": 1.5390448555129346e-05,
|
8731 |
+
"train_runtime": 6.8399,
|
8732 |
+
"train_samples_per_second": 40936.549,
|
8733 |
+
"train_steps_per_second": 5117.069
|
8734 |
}
|
8735 |
],
|
8736 |
"logging_steps": 25,
|
|
|
8738 |
"num_input_tokens_seen": 0,
|
8739 |
"num_train_epochs": 1,
|
8740 |
"save_steps": 1000,
|
8741 |
+
"total_flos": 4.7538258866601984e+20,
|
8742 |
"train_batch_size": 8,
|
8743 |
"trial_name": null,
|
8744 |
"trial_params": null
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4856
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74b9e93f07ccec52bc6245b5cb3e4e9324c69da5b5fc95cb33c1098eb297b715
|
3 |
size 4856
|