Model save
Browse files- README.md +1 -4
- all_results.json +3 -3
- config.json +1 -1
- model-00001-of-00006.safetensors +1 -1
- model-00002-of-00006.safetensors +1 -1
- model-00003-of-00006.safetensors +1 -1
- model-00004-of-00006.safetensors +1 -1
- model-00005-of-00006.safetensors +1 -1
- model-00006-of-00006.safetensors +1 -1
- runs/Feb26_04-46-39_a100-80-8-zifeng-1/events.out.tfevents.1740545225.a100-80-8-zifeng-1.97947.0 +3 -0
- train_results.json +3 -3
- trainer_state.json +14 -14
- training_args.bin +1 -1
README.md
CHANGED
@@ -3,12 +3,9 @@ library_name: transformers
|
|
3 |
license: apache-2.0
|
4 |
base_model: Qwen/Qwen2.5-14B-Instruct
|
5 |
tags:
|
6 |
-
- alignment-handbook
|
7 |
-
- trl
|
8 |
-
- sft
|
9 |
-
- generated_from_trainer
|
10 |
- trl
|
11 |
- sft
|
|
|
12 |
- generated_from_trainer
|
13 |
model-index:
|
14 |
- name: Qwen2.5-14B-Instruct-star-nl-3Rounds-iter-1
|
|
|
3 |
license: apache-2.0
|
4 |
base_model: Qwen/Qwen2.5-14B-Instruct
|
5 |
tags:
|
|
|
|
|
|
|
|
|
6 |
- trl
|
7 |
- sft
|
8 |
+
- alignment-handbook
|
9 |
- generated_from_trainer
|
10 |
model-index:
|
11 |
- name: Qwen2.5-14B-Instruct-star-nl-3Rounds-iter-1
|
all_results.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"epoch": 4.851063829787234,
|
3 |
"total_flos": 1.70668694534357e+17,
|
4 |
-
"train_loss": 0.
|
5 |
-
"train_runtime":
|
6 |
"train_samples": 748,
|
7 |
-
"train_samples_per_second": 6.
|
8 |
"train_steps_per_second": 0.043
|
9 |
}
|
|
|
1 |
{
|
2 |
"epoch": 4.851063829787234,
|
3 |
"total_flos": 1.70668694534357e+17,
|
4 |
+
"train_loss": 0.5626590156555176,
|
5 |
+
"train_runtime": 583.7651,
|
6 |
"train_samples": 748,
|
7 |
+
"train_samples_per_second": 6.407,
|
8 |
"train_steps_per_second": 0.043
|
9 |
}
|
config.json
CHANGED
@@ -24,7 +24,7 @@
|
|
24 |
"tie_word_embeddings": false,
|
25 |
"torch_dtype": "bfloat16",
|
26 |
"transformers_version": "4.47.1",
|
27 |
-
"use_cache":
|
28 |
"use_sliding_window": false,
|
29 |
"vocab_size": 151665
|
30 |
}
|
|
|
24 |
"tie_word_embeddings": false,
|
25 |
"torch_dtype": "bfloat16",
|
26 |
"transformers_version": "4.47.1",
|
27 |
+
"use_cache": false,
|
28 |
"use_sliding_window": false,
|
29 |
"vocab_size": 151665
|
30 |
}
|
model-00001-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4982125520
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8f9b5f88c1f454895e784effe9555c4c158670f4a73ae5a4c19b06f1e384898
|
3 |
size 4982125520
|
model-00002-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02e121ba84cccfb0893309ef0758528aea8ee01c8e16b6b7c880032e9e3483bd
|
3 |
size 4954847344
|
model-00003-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac9f0ac0b86364b586ee0ba230934f5c9f9bb9c0b2db421d372660cbdb264479
|
3 |
size 4954847392
|
model-00004-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c3516a4d0acf96e36897aac6f4fa094cbcb6f5d18cdd01be133e8488d8d2cc2
|
3 |
size 4954847392
|
model-00005-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb0c7b2071a3a2aff92ed9b7ed5d466b690c51e26669cdcf98042c43ba4add3f
|
3 |
size 4954847392
|
model-00006-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4730447400
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e89bae0f8f908685e0c8e831adef7608c22829ebadc5685c1650bff420cebe6
|
3 |
size 4730447400
|
runs/Feb26_04-46-39_a100-80-8-zifeng-1/events.out.tfevents.1740545225.a100-80-8-zifeng-1.97947.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b35e3292972c92f61ae4e41f6fa035cce996401791fd9a4aeeb081c6749d9c20
|
3 |
+
size 7282
|
train_results.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"epoch": 4.851063829787234,
|
3 |
"total_flos": 1.70668694534357e+17,
|
4 |
-
"train_loss": 0.
|
5 |
-
"train_runtime":
|
6 |
"train_samples": 748,
|
7 |
-
"train_samples_per_second": 6.
|
8 |
"train_steps_per_second": 0.043
|
9 |
}
|
|
|
1 |
{
|
2 |
"epoch": 4.851063829787234,
|
3 |
"total_flos": 1.70668694534357e+17,
|
4 |
+
"train_loss": 0.5626590156555176,
|
5 |
+
"train_runtime": 583.7651,
|
6 |
"train_samples": 748,
|
7 |
+
"train_samples_per_second": 6.407,
|
8 |
"train_steps_per_second": 0.043
|
9 |
}
|
trainer_state.json
CHANGED
@@ -10,53 +10,53 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.1702127659574468,
|
13 |
-
"grad_norm": 1.
|
14 |
"learning_rate": 4.980286753286196e-06,
|
15 |
"loss": 1.1367,
|
16 |
"step": 1
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.851063829787234,
|
20 |
-
"grad_norm": 0.
|
21 |
"learning_rate": 4.522542485937369e-06,
|
22 |
-
"loss": 0.
|
23 |
"step": 5
|
24 |
},
|
25 |
{
|
26 |
"epoch": 1.851063829787234,
|
27 |
-
"grad_norm": 0.
|
28 |
"learning_rate": 3.272542485937369e-06,
|
29 |
-
"loss": 0.
|
30 |
"step": 10
|
31 |
},
|
32 |
{
|
33 |
"epoch": 2.851063829787234,
|
34 |
-
"grad_norm": 0.
|
35 |
"learning_rate": 1.7274575140626318e-06,
|
36 |
-
"loss": 0.
|
37 |
"step": 15
|
38 |
},
|
39 |
{
|
40 |
"epoch": 3.851063829787234,
|
41 |
-
"grad_norm": 0.
|
42 |
"learning_rate": 4.774575140626317e-07,
|
43 |
-
"loss": 0.
|
44 |
"step": 20
|
45 |
},
|
46 |
{
|
47 |
"epoch": 4.851063829787234,
|
48 |
-
"grad_norm": 0.
|
49 |
"learning_rate": 0.0,
|
50 |
-
"loss": 0.
|
51 |
"step": 25
|
52 |
},
|
53 |
{
|
54 |
"epoch": 4.851063829787234,
|
55 |
"step": 25,
|
56 |
"total_flos": 1.70668694534357e+17,
|
57 |
-
"train_loss": 0.
|
58 |
-
"train_runtime":
|
59 |
-
"train_samples_per_second": 6.
|
60 |
"train_steps_per_second": 0.043
|
61 |
}
|
62 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.1702127659574468,
|
13 |
+
"grad_norm": 1.0480449041222901,
|
14 |
"learning_rate": 4.980286753286196e-06,
|
15 |
"loss": 1.1367,
|
16 |
"step": 1
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.851063829787234,
|
20 |
+
"grad_norm": 0.7218518716452021,
|
21 |
"learning_rate": 4.522542485937369e-06,
|
22 |
+
"loss": 0.7212,
|
23 |
"step": 5
|
24 |
},
|
25 |
{
|
26 |
"epoch": 1.851063829787234,
|
27 |
+
"grad_norm": 0.48974754683120497,
|
28 |
"learning_rate": 3.272542485937369e-06,
|
29 |
+
"loss": 0.5486,
|
30 |
"step": 10
|
31 |
},
|
32 |
{
|
33 |
"epoch": 2.851063829787234,
|
34 |
+
"grad_norm": 0.05989476827451271,
|
35 |
"learning_rate": 1.7274575140626318e-06,
|
36 |
+
"loss": 0.4988,
|
37 |
"step": 15
|
38 |
},
|
39 |
{
|
40 |
"epoch": 3.851063829787234,
|
41 |
+
"grad_norm": 0.04162142765751137,
|
42 |
"learning_rate": 4.774575140626317e-07,
|
43 |
+
"loss": 0.4812,
|
44 |
"step": 20
|
45 |
},
|
46 |
{
|
47 |
"epoch": 4.851063829787234,
|
48 |
+
"grad_norm": 0.03625801845951793,
|
49 |
"learning_rate": 0.0,
|
50 |
+
"loss": 0.4803,
|
51 |
"step": 25
|
52 |
},
|
53 |
{
|
54 |
"epoch": 4.851063829787234,
|
55 |
"step": 25,
|
56 |
"total_flos": 1.70668694534357e+17,
|
57 |
+
"train_loss": 0.5626590156555176,
|
58 |
+
"train_runtime": 583.7651,
|
59 |
+
"train_samples_per_second": 6.407,
|
60 |
"train_steps_per_second": 0.043
|
61 |
}
|
62 |
],
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7096
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b82e3f589ead1fa3980b186350331e33ac1776d442bae40f34a7a0036f1a1f7d
|
3 |
size 7096
|