stuser2023
committed on
Commit
•
c128b2d
1
Parent(s):
2606d14
Training in progress, epoch 1
Browse files
- model.safetensors +1 -1
- run-1/checkpoint-268/config.json +1 -1
- run-1/checkpoint-268/model.safetensors +1 -1
- run-1/checkpoint-268/optimizer.pt +1 -1
- run-1/checkpoint-268/rng_state.pth +2 -2
- run-1/checkpoint-268/scheduler.pt +1 -1
- run-1/checkpoint-268/trainer_state.json +20 -8
- run-1/checkpoint-268/training_args.bin +2 -2
- runs/Sep26_13-34-33_f266a1036e13/events.out.tfevents.1727358189.f266a1036e13.258.3 +3 -0
- training_args.bin +1 -1
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267832560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca8fe9f4d3b1eda4a732430841ce9a13e294d4165cbbeecd8e420652e2ca1d59
|
3 |
size 267832560
|
run-1/checkpoint-268/config.json
CHANGED
@@ -20,6 +20,6 @@
|
|
20 |
"sinusoidal_pos_embds": false,
|
21 |
"tie_weights_": true,
|
22 |
"torch_dtype": "float32",
|
23 |
-
"transformers_version": "4.
|
24 |
"vocab_size": 30522
|
25 |
}
|
|
|
20 |
"sinusoidal_pos_embds": false,
|
21 |
"tie_weights_": true,
|
22 |
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.45.0",
|
24 |
"vocab_size": 30522
|
25 |
}
|
run-1/checkpoint-268/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267832560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca8fe9f4d3b1eda4a732430841ce9a13e294d4165cbbeecd8e420652e2ca1d59
|
3 |
size 267832560
|
run-1/checkpoint-268/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 535727290
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b516537655b6bf969c53f4695a44925a5b4bc725eee0618aaac9e3bcc64f989
|
3 |
size 535727290
|
run-1/checkpoint-268/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acf4e24f2f10c1479c3cc0c08f6c5b0ec1f4f7435d026a8a835334c7aebd88cb
|
3 |
+
size 14244
|
run-1/checkpoint-268/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64657bb9ceab0aa97e483aa39f8608b0faee3d21fe29168f23a470df6b267123
|
3 |
size 1064
|
run-1/checkpoint-268/trainer_state.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
"best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-268",
|
4 |
"epoch": 1.0,
|
5 |
"eval_steps": 500,
|
@@ -10,11 +10,11 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 1.0,
|
13 |
-
"eval_loss": 0.
|
14 |
-
"eval_matthews_correlation": 0.
|
15 |
-
"eval_runtime": 0.
|
16 |
-
"eval_samples_per_second":
|
17 |
-
"eval_steps_per_second":
|
18 |
"step": 268
|
19 |
}
|
20 |
],
|
@@ -23,13 +23,25 @@
|
|
23 |
"num_input_tokens_seen": 0,
|
24 |
"num_train_epochs": 4,
|
25 |
"save_steps": 500,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
26 |
"total_flos": 0,
|
27 |
"train_batch_size": 32,
|
28 |
"trial_name": null,
|
29 |
"trial_params": {
|
30 |
-
"learning_rate":
|
31 |
"num_train_epochs": 4,
|
32 |
"per_device_train_batch_size": 32,
|
33 |
-
"seed":
|
34 |
}
|
35 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.3637991719695883,
|
3 |
"best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-268",
|
4 |
"epoch": 1.0,
|
5 |
"eval_steps": 500,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 1.0,
|
13 |
+
"eval_loss": 0.5182795524597168,
|
14 |
+
"eval_matthews_correlation": 0.3637991719695883,
|
15 |
+
"eval_runtime": 0.8749,
|
16 |
+
"eval_samples_per_second": 1192.137,
|
17 |
+
"eval_steps_per_second": 75.437,
|
18 |
"step": 268
|
19 |
}
|
20 |
],
|
|
|
23 |
"num_input_tokens_seen": 0,
|
24 |
"num_train_epochs": 4,
|
25 |
"save_steps": 500,
|
26 |
+
"stateful_callbacks": {
|
27 |
+
"TrainerControl": {
|
28 |
+
"args": {
|
29 |
+
"should_epoch_stop": false,
|
30 |
+
"should_evaluate": false,
|
31 |
+
"should_log": false,
|
32 |
+
"should_save": true,
|
33 |
+
"should_training_stop": false
|
34 |
+
},
|
35 |
+
"attributes": {}
|
36 |
+
}
|
37 |
+
},
|
38 |
"total_flos": 0,
|
39 |
"train_batch_size": 32,
|
40 |
"trial_name": null,
|
41 |
"trial_params": {
|
42 |
+
"learning_rate": 7.650877926980232e-06,
|
43 |
"num_train_epochs": 4,
|
44 |
"per_device_train_batch_size": 32,
|
45 |
+
"seed": 28
|
46 |
}
|
47 |
}
|
run-1/checkpoint-268/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55916040b5530f85fbbef38cd42dcd18934cd6b77c8a8a1a110fdc3d400f34d0
|
3 |
+
size 5304
|
runs/Sep26_13-34-33_f266a1036e13/events.out.tfevents.1727358189.f266a1036e13.258.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebf518373c6afe38ee8e31b1e4a6d789d20ac210800b0f4d65682c148044d916
|
3 |
+
size 5841
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55916040b5530f85fbbef38cd42dcd18934cd6b77c8a8a1a110fdc3d400f34d0
|
3 |
size 5304
|