Kira-Floris commited on
Commit
5edad91
1 Parent(s): fb00fc9

Training in progress, epoch 1

Browse files
logs/events.out.tfevents.1719311480.852b1e905a9a.223.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a56ff2e601bbf098efbcd94734bc850a385b1d63aeb575838f7d4a746faa2a7
3
+ size 5428
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d47eed6b6c10b89046c5579792754bc1f6f31fc160278e47e2d473bc77094d3
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d3cdebd4645b1d3aedb598d74b637f5ed037f958b572ee80608133aee3a9976
3
  size 17549312
run-1/checkpoint-527/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb1ca79a9bf8b490a2f6783a131c6de76de46d7d9d225d392b55c2bf9992c8ad
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d3cdebd4645b1d3aedb598d74b637f5ed037f958b572ee80608133aee3a9976
3
  size 17549312
run-1/checkpoint-527/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c745062c7e1e60a2fc3d1bc56b16a62f1c67a52915e29c53ed324c2ad2e257d
3
  size 35123898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acf0b6e139990c3307f08d479d701e93926f0f09437c5b321cb9081a954e142e
3
  size 35123898
run-1/checkpoint-527/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:940589cb04f9e8ff6df41bbdafd8a68677bbf95c887b63d983f5df8e3c1182bb
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcb5b0e469d1d3eab700f24f3dfac2d47dd96a3c9a2df7246109443b6077d1bd
3
  size 1064
run-1/checkpoint-527/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.8107798165137615,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-1/checkpoint-527",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,18 +10,18 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 17.658132553100586,
14
- "learning_rate": 7.63128750557968e-05,
15
- "loss": 1.3361,
16
  "step": 527
17
  },
18
  {
19
  "epoch": 1.0,
20
- "eval_accuracy": 0.8107798165137615,
21
- "eval_loss": 1.132369041442871,
22
- "eval_runtime": 2.6024,
23
- "eval_samples_per_second": 335.073,
24
- "eval_steps_per_second": 2.69,
25
  "step": 527
26
  }
27
  ],
@@ -46,9 +46,9 @@
46
  "train_batch_size": 128,
47
  "trial_name": null,
48
  "trial_params": {
49
- "alpha": 0.5918699224275719,
50
- "learning_rate": 0.00011446931258369519,
51
  "num_train_epochs": 3,
52
- "temperature": 9
53
  }
54
  }
 
1
  {
2
+ "best_metric": 0.8268348623853211,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-1/checkpoint-527",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 20.18393898010254,
14
+ "learning_rate": 0.0004400348679504635,
15
+ "loss": 1.3749,
16
  "step": 527
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.8268348623853211,
21
+ "eval_loss": 1.6724135875701904,
22
+ "eval_runtime": 2.5582,
23
+ "eval_samples_per_second": 340.862,
24
+ "eval_steps_per_second": 2.736,
25
  "step": 527
26
  }
27
  ],
 
46
  "train_batch_size": 128,
47
  "trial_name": null,
48
  "trial_params": {
49
+ "alpha": 0.22319309854701086,
50
+ "learning_rate": 0.0006600523019256953,
51
  "num_train_epochs": 3,
52
+ "temperature": 16
53
  }
54
  }
run-1/checkpoint-527/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cdb44a8bec3049f59e3c6aa052eb44c31862f011784d5f05f8553620eb8f64a0
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee9990afd96f204321e9e33fc4071f73d76355111015fd2ec723f4a4e4849ce7
3
  size 5176
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15e7b4feae857373f91378a3d0efc15d0ec396bfba71e74c965086843aa6acf4
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee9990afd96f204321e9e33fc4071f73d76355111015fd2ec723f4a4e4849ce7
3
  size 5176