Lichang-Chen committed on
Commit
5aa3053
·
verified ·
1 Parent(s): 250bfae

Model save

Browse files
README.md CHANGED
@@ -3,12 +3,9 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: Qwen/Qwen2.5-14B-Instruct
5
  tags:
6
- - alignment-handbook
7
- - trl
8
- - sft
9
- - generated_from_trainer
10
  - trl
11
  - sft
 
12
  - generated_from_trainer
13
  model-index:
14
  - name: Qwen2.5-14B-Instruct-star-nl-3Rounds-iter-1
 
3
  license: apache-2.0
4
  base_model: Qwen/Qwen2.5-14B-Instruct
5
  tags:
 
 
 
 
6
  - trl
7
  - sft
8
+ - alignment-handbook
9
  - generated_from_trainer
10
  model-index:
11
  - name: Qwen2.5-14B-Instruct-star-nl-3Rounds-iter-1
all_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 4.851063829787234,
3
  "total_flos": 1.70668694534357e+17,
4
- "train_loss": 0.559986629486084,
5
- "train_runtime": 582.7329,
6
  "train_samples": 748,
7
- "train_samples_per_second": 6.418,
8
  "train_steps_per_second": 0.043
9
  }
 
1
  {
2
  "epoch": 4.851063829787234,
3
  "total_flos": 1.70668694534357e+17,
4
+ "train_loss": 0.5626590156555176,
5
+ "train_runtime": 583.7651,
6
  "train_samples": 748,
7
+ "train_samples_per_second": 6.407,
8
  "train_steps_per_second": 0.043
9
  }
config.json CHANGED
@@ -24,7 +24,7 @@
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
  "transformers_version": "4.47.1",
27
- "use_cache": true,
28
  "use_sliding_window": false,
29
  "vocab_size": 151665
30
  }
 
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
  "transformers_version": "4.47.1",
27
+ "use_cache": false,
28
  "use_sliding_window": false,
29
  "vocab_size": 151665
30
  }
model-00001-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:413386ad6d055588b7f28aa5d00caf27c8cab2cb680c415ceb0578149f5c207f
3
  size 4982125520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8f9b5f88c1f454895e784effe9555c4c158670f4a73ae5a4c19b06f1e384898
3
  size 4982125520
model-00002-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b430d2faacc0f0829c7859fd238f3ee1eeca1c8aea03acaf7e3540983c60978e
3
  size 4954847344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02e121ba84cccfb0893309ef0758528aea8ee01c8e16b6b7c880032e9e3483bd
3
  size 4954847344
model-00003-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2454ceaf7475b5330ad7395f57b3b3abbb042825805b14cce721e9609351ed8
3
  size 4954847392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac9f0ac0b86364b586ee0ba230934f5c9f9bb9c0b2db421d372660cbdb264479
3
  size 4954847392
model-00004-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:739e9308f48a30826132cdc00887b8152b183679bd4d3a7c9f03e9baf91f603d
3
  size 4954847392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c3516a4d0acf96e36897aac6f4fa094cbcb6f5d18cdd01be133e8488d8d2cc2
3
  size 4954847392
model-00005-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f42f36be99b518998681df94d7de2270d3bcf9525d3c1a1d6061a5517092463
3
  size 4954847392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb0c7b2071a3a2aff92ed9b7ed5d466b690c51e26669cdcf98042c43ba4add3f
3
  size 4954847392
model-00006-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2fc45cd8dad35a0985906c9a25441e8932f8ace0b504752081a21699d9006db2
3
  size 4730447400
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e89bae0f8f908685e0c8e831adef7608c22829ebadc5685c1650bff420cebe6
3
  size 4730447400
runs/Feb26_04-46-39_a100-80-8-zifeng-1/events.out.tfevents.1740545225.a100-80-8-zifeng-1.97947.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b35e3292972c92f61ae4e41f6fa035cce996401791fd9a4aeeb081c6749d9c20
3
+ size 7282
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 4.851063829787234,
3
  "total_flos": 1.70668694534357e+17,
4
- "train_loss": 0.559986629486084,
5
- "train_runtime": 582.7329,
6
  "train_samples": 748,
7
- "train_samples_per_second": 6.418,
8
  "train_steps_per_second": 0.043
9
  }
 
1
  {
2
  "epoch": 4.851063829787234,
3
  "total_flos": 1.70668694534357e+17,
4
+ "train_loss": 0.5626590156555176,
5
+ "train_runtime": 583.7651,
6
  "train_samples": 748,
7
+ "train_samples_per_second": 6.407,
8
  "train_steps_per_second": 0.043
9
  }
trainer_state.json CHANGED
@@ -10,53 +10,53 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.1702127659574468,
13
- "grad_norm": 1.0480686423347865,
14
  "learning_rate": 4.980286753286196e-06,
15
  "loss": 1.1367,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.851063829787234,
20
- "grad_norm": 0.7371347999735538,
21
  "learning_rate": 4.522542485937369e-06,
22
- "loss": 0.7211,
23
  "step": 5
24
  },
25
  {
26
  "epoch": 1.851063829787234,
27
- "grad_norm": 0.1221598511317441,
28
  "learning_rate": 3.272542485937369e-06,
29
- "loss": 0.5451,
30
  "step": 10
31
  },
32
  {
33
  "epoch": 2.851063829787234,
34
- "grad_norm": 0.06221615866869028,
35
  "learning_rate": 1.7274575140626318e-06,
36
- "loss": 0.4954,
37
  "step": 15
38
  },
39
  {
40
  "epoch": 3.851063829787234,
41
- "grad_norm": 0.04156397934867294,
42
  "learning_rate": 4.774575140626317e-07,
43
- "loss": 0.478,
44
  "step": 20
45
  },
46
  {
47
  "epoch": 4.851063829787234,
48
- "grad_norm": 0.036582860908155705,
49
  "learning_rate": 0.0,
50
- "loss": 0.4771,
51
  "step": 25
52
  },
53
  {
54
  "epoch": 4.851063829787234,
55
  "step": 25,
56
  "total_flos": 1.70668694534357e+17,
57
- "train_loss": 0.559986629486084,
58
- "train_runtime": 582.7329,
59
- "train_samples_per_second": 6.418,
60
  "train_steps_per_second": 0.043
61
  }
62
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.1702127659574468,
13
+ "grad_norm": 1.0480449041222901,
14
  "learning_rate": 4.980286753286196e-06,
15
  "loss": 1.1367,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.851063829787234,
20
+ "grad_norm": 0.7218518716452021,
21
  "learning_rate": 4.522542485937369e-06,
22
+ "loss": 0.7212,
23
  "step": 5
24
  },
25
  {
26
  "epoch": 1.851063829787234,
27
+ "grad_norm": 0.48974754683120497,
28
  "learning_rate": 3.272542485937369e-06,
29
+ "loss": 0.5486,
30
  "step": 10
31
  },
32
  {
33
  "epoch": 2.851063829787234,
34
+ "grad_norm": 0.05989476827451271,
35
  "learning_rate": 1.7274575140626318e-06,
36
+ "loss": 0.4988,
37
  "step": 15
38
  },
39
  {
40
  "epoch": 3.851063829787234,
41
+ "grad_norm": 0.04162142765751137,
42
  "learning_rate": 4.774575140626317e-07,
43
+ "loss": 0.4812,
44
  "step": 20
45
  },
46
  {
47
  "epoch": 4.851063829787234,
48
+ "grad_norm": 0.03625801845951793,
49
  "learning_rate": 0.0,
50
+ "loss": 0.4803,
51
  "step": 25
52
  },
53
  {
54
  "epoch": 4.851063829787234,
55
  "step": 25,
56
  "total_flos": 1.70668694534357e+17,
57
+ "train_loss": 0.5626590156555176,
58
+ "train_runtime": 583.7651,
59
+ "train_samples_per_second": 6.407,
60
  "train_steps_per_second": 0.043
61
  }
62
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b6cd22decd9ce87a02de6508d2ec702205300998b0483fdaf10bcd09a40928d
3
  size 7096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b82e3f589ead1fa3980b186350331e33ac1776d442bae40f34a7a0036f1a1f7d
3
  size 7096