stuser2023 committed on
Commit
c128b2d
1 Parent(s): 2606d14

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ed58cfbcaae38345ff1479ed04cdec936f68a03189cbe89adafac63e2cae843
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca8fe9f4d3b1eda4a732430841ce9a13e294d4165cbbeecd8e420652e2ca1d59
3
  size 267832560
run-1/checkpoint-268/config.json CHANGED
@@ -20,6 +20,6 @@
20
  "sinusoidal_pos_embds": false,
21
  "tie_weights_": true,
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.38.2",
24
  "vocab_size": 30522
25
  }
 
20
  "sinusoidal_pos_embds": false,
21
  "tie_weights_": true,
22
  "torch_dtype": "float32",
23
+ "transformers_version": "4.45.0",
24
  "vocab_size": 30522
25
  }
run-1/checkpoint-268/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc9878783b0818c688c28abea8a5d61ace7dcab7d3f290e5b80a5cde21639f4f
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca8fe9f4d3b1eda4a732430841ce9a13e294d4165cbbeecd8e420652e2ca1d59
3
  size 267832560
run-1/checkpoint-268/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e636934686b41a0f79de6208f706315ddc2a3cfa0585cee3ba2d34a439b209db
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b516537655b6bf969c53f4695a44925a5b4bc725eee0618aaac9e3bcc64f989
3
  size 535727290
run-1/checkpoint-268/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a7df60d1f16fe9e85b40c9a61615d24bef5f0ce05b0f715ad8da2204ad48db8
3
- size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acf4e24f2f10c1479c3cc0c08f6c5b0ec1f4f7435d026a8a835334c7aebd88cb
3
+ size 14244
run-1/checkpoint-268/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:464e697567a35a41b5d63da1ecc000461d81bd321d5860f5da26db618d04341e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64657bb9ceab0aa97e483aa39f8608b0faee3d21fe29168f23a470df6b267123
3
  size 1064
run-1/checkpoint-268/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.4141806938515634,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-268",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,11 +10,11 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.5035493969917297,
14
- "eval_matthews_correlation": 0.4141806938515634,
15
- "eval_runtime": 0.7419,
16
- "eval_samples_per_second": 1405.832,
17
- "eval_steps_per_second": 88.96,
18
  "step": 268
19
  }
20
  ],
@@ -23,13 +23,25 @@
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 4,
25
  "save_steps": 500,
 
 
 
 
 
 
 
 
 
 
 
 
26
  "total_flos": 0,
27
  "train_batch_size": 32,
28
  "trial_name": null,
29
  "trial_params": {
30
- "learning_rate": 1.0221265871912396e-05,
31
  "num_train_epochs": 4,
32
  "per_device_train_batch_size": 32,
33
- "seed": 8
34
  }
35
  }
 
1
  {
2
+ "best_metric": 0.3637991719695883,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-268",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.5182795524597168,
14
+ "eval_matthews_correlation": 0.3637991719695883,
15
+ "eval_runtime": 0.8749,
16
+ "eval_samples_per_second": 1192.137,
17
+ "eval_steps_per_second": 75.437,
18
  "step": 268
19
  }
20
  ],
 
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 4,
25
  "save_steps": 500,
26
+ "stateful_callbacks": {
27
+ "TrainerControl": {
28
+ "args": {
29
+ "should_epoch_stop": false,
30
+ "should_evaluate": false,
31
+ "should_log": false,
32
+ "should_save": true,
33
+ "should_training_stop": false
34
+ },
35
+ "attributes": {}
36
+ }
37
+ },
38
  "total_flos": 0,
39
  "train_batch_size": 32,
40
  "trial_name": null,
41
  "trial_params": {
42
+ "learning_rate": 7.650877926980232e-06,
43
  "num_train_epochs": 4,
44
  "per_device_train_batch_size": 32,
45
+ "seed": 28
46
  }
47
  }
run-1/checkpoint-268/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29d6b485a188c4e5c57b6f3bb948e3315674066d3a6ec8f44d6d328263cd659b
3
- size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55916040b5530f85fbbef38cd42dcd18934cd6b77c8a8a1a110fdc3d400f34d0
3
+ size 5304
runs/Sep26_13-34-33_f266a1036e13/events.out.tfevents.1727358189.f266a1036e13.258.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebf518373c6afe38ee8e31b1e4a6d789d20ac210800b0f4d65682c148044d916
3
+ size 5841
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed124d14dc79b84cb07ed86b8da4c02956606d59537d7769f990e0b60eecf882
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55916040b5530f85fbbef38cd42dcd18934cd6b77c8a8a1a110fdc3d400f34d0
3
  size 5304