saqidr committed on
Commit
0ed4437
·
verified ·
1 Parent(s): 258b98e

Training in progress, step 500

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:554a05c79b6970f05612f20a53fb142204c7ccd5808ae60149536d4c55264da9
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9032e9a88f6f9c79f637ab75f83694a2dc476cbc777aabf84fab1ceac1c70e1f
3
  size 268290900
run-4/checkpoint-1500/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f905aa4e0351f726703bf94a11837bc1bc6a52dc919b464b433bb31ee44cf05
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:417f67bfc777c996b35c8996ff62c52ec34d71e7a766e99077134c8e94a8f85b
3
  size 268290900
run-4/checkpoint-1500/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0f2a244de8293a04ffe52e6d12be4190e593992609ab16af5335db404902310
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa48a0c978c6a7ede2f05dfd7e1a4fdfa87e493dfd4351367eab5fe63f91142a
3
  size 536643898
run-4/checkpoint-1500/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e4150b40cdd095f99e6d506db714a6c0a9a316d6b4d021acbfec8d198c96919
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c10319269a5ccb2640eed78049edda0fca1ea40d757f64b6ab5474fe9e926f9
3
  size 14244
run-4/checkpoint-1500/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71453465aad25f4c5a0a948496c64b1f74df850abda497954afe3695c00756ee
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55c8d3ce0734337fc0c187ca5543b4c70ca45d996531f199209b3a0c2a798109
3
  size 1064
run-4/checkpoint-1500/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d5d2fff8a65a6470ff21893289269130aa490c201d7c1e86a6b03304d6d7dd8
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09c1d2b3517a81c25cfd3dc4720ca0f5c5cd50449810325441209751db6b15be
3
+ size 5176
run-5/checkpoint-500/config.json CHANGED
@@ -326,6 +326,6 @@
326
  "sinusoidal_pos_embds": false,
327
  "tie_weights_": true,
328
  "torch_dtype": "float32",
329
- "transformers_version": "4.37.2",
330
  "vocab_size": 30522
331
  }
 
326
  "sinusoidal_pos_embds": false,
327
  "tie_weights_": true,
328
  "torch_dtype": "float32",
329
+ "transformers_version": "4.41.1",
330
  "vocab_size": 30522
331
  }
run-5/checkpoint-500/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c24b0a4a8801f00062afb827eb49d3d1a5b189f65890c2bf2e8b900738912d9c
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9032e9a88f6f9c79f637ab75f83694a2dc476cbc777aabf84fab1ceac1c70e1f
3
  size 268290900
run-5/checkpoint-500/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2747916ed8ac1c16a5e74b2324d8c38bfccaba7207dae222205f1e3343c41964
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4663de9ae3e603da38c925519eb450716b9756d7e66f8d52d633f08329dad88
3
  size 536643898
run-5/checkpoint-500/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8174c1d6ac2627de77161655e4e20ef37d9f2235e2e7c4adc0da0d4e0e14b6d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9fb2a0dfb1b0ccef3590fe01e9bd16b6db86f247cc9c7e77290c217a53bac20
3
  size 14244
run-5/checkpoint-500/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e1264523e958cf7990dc5f42d876cc12129475c4603804cf66868aaf25c2c24
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98041bd7cae455426e290a1a0ee683bd5dd30893f7451fec3a464ae8995b17e4
3
  size 1064
run-5/checkpoint-500/tokenizer.json CHANGED
@@ -1,11 +1,6 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 512,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
  "padding": null,
10
  "added_tokens": [
11
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
run-5/checkpoint-500/trainer_state.json CHANGED
@@ -10,31 +10,44 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.6558064516129032,
14
- "eval_loss": 0.3044227957725525,
15
- "eval_runtime": 1.3634,
16
- "eval_samples_per_second": 2273.787,
17
- "eval_steps_per_second": 47.676,
18
  "step": 318
19
  },
20
  {
21
- "epoch": 1.57,
22
- "learning_rate": 1.371069182389937e-05,
23
- "loss": 0.4709,
 
24
  "step": 500
25
  }
26
  ],
27
  "logging_steps": 500,
28
- "max_steps": 1590,
29
  "num_input_tokens_seen": 0,
30
- "num_train_epochs": 5,
31
  "save_steps": 500,
32
- "total_flos": 129219778448376.0,
 
 
 
 
 
 
 
 
 
 
 
 
33
  "train_batch_size": 48,
34
  "trial_name": null,
35
  "trial_params": {
36
- "alpha": 0.12690688175028453,
37
- "num_train_epochs": 5,
38
- "temperature": 3
39
  }
40
  }
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.584516129032258,
14
+ "eval_loss": 0.19766665995121002,
15
+ "eval_runtime": 1.3839,
16
+ "eval_samples_per_second": 2239.966,
17
+ "eval_steps_per_second": 46.967,
18
  "step": 318
19
  },
20
  {
21
+ "epoch": 1.5723270440251573,
22
+ "grad_norm": 0.5089908242225647,
23
+ "learning_rate": 1.650593990216632e-05,
24
+ "loss": 0.318,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
+ "max_steps": 2862,
30
  "num_input_tokens_seen": 0,
31
+ "num_train_epochs": 9,
32
  "save_steps": 500,
33
+ "stateful_callbacks": {
34
+ "TrainerControl": {
35
+ "args": {
36
+ "should_epoch_stop": false,
37
+ "should_evaluate": false,
38
+ "should_log": false,
39
+ "should_save": true,
40
+ "should_training_stop": false
41
+ },
42
+ "attributes": {}
43
+ }
44
+ },
45
+ "total_flos": 130072209152340.0,
46
  "train_batch_size": 48,
47
  "trial_name": null,
48
  "trial_params": {
49
+ "alpha": 0.18633073638587916,
50
+ "num_train_epochs": 9,
51
+ "temperature": 12
52
  }
53
  }
run-5/checkpoint-500/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2fa1c7452d85339003243159437eb829c186323cd1ac6c8ab11eba049b601da9
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b710d040c65b4e79eb6b061acc6db3a0384cdfac91c487c974101b5770343aa
3
+ size 5176
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09c1d2b3517a81c25cfd3dc4720ca0f5c5cd50449810325441209751db6b15be
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b710d040c65b4e79eb6b061acc6db3a0384cdfac91c487c974101b5770343aa
3
  size 5176