nblinh63 committed on
Commit
6f125ef
·
verified ·
1 Parent(s): c2b5392

End of training

Browse files
README.md CHANGED
@@ -103,7 +103,7 @@ xformers_attention: true
103
 
104
  This model is a fine-tuned version of [UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2](https://huggingface.co/UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2) on the None dataset.
105
  It achieves the following results on the evaluation set:
106
- - Loss: 0.7182
107
 
108
  ## Model description
109
 
@@ -135,7 +135,7 @@ The following hyperparameters were used during training:
135
 
136
  | Training Loss | Epoch | Step | Validation Loss |
137
  |:-------------:|:------:|:----:|:---------------:|
138
- | 0.5323 | 0.0002 | 10 | 0.7182 |
139
 
140
 
141
  ### Framework versions
 
103
 
104
  This model is a fine-tuned version of [UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2](https://huggingface.co/UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2) on the None dataset.
105
  It achieves the following results on the evaluation set:
106
+ - Loss: 0.7138
107
 
108
  ## Model description
109
 
 
135
 
136
  | Training Loss | Epoch | Step | Validation Loss |
137
  |:-------------:|:------:|:----:|:---------------:|
138
+ | 0.5258 | 0.0002 | 10 | 0.7138 |
139
 
140
 
141
  ### Framework versions
adapter_config.json CHANGED
@@ -21,11 +21,11 @@
21
  "revision": null,
22
  "target_modules": [
23
  "up_proj",
 
 
24
  "down_proj",
25
  "o_proj",
26
- "gate_proj",
27
  "k_proj",
28
- "v_proj",
29
  "q_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
21
  "revision": null,
22
  "target_modules": [
23
  "up_proj",
24
+ "v_proj",
25
+ "gate_proj",
26
  "down_proj",
27
  "o_proj",
 
28
  "k_proj",
 
29
  "q_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac50c8dc0677333db0d2d9674a7aa6e3dcf567a9d660a4af3edb6ec82085e6ce
3
  size 216284090
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7789771f9cb512c89fe0333ebf8ee7c2731c7eee526dbf9a682d9e6e8e807faa
3
  size 216284090
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c961c169dfe42e8e367c4ccef846b4a23ebffb79278121b87fb11b0d6701e6b
3
  size 216151256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d4bcc4dc11d7d8e56003e258778a55538250dda5ed8838131ec1381fb792ebc
3
  size 216151256
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34c0a4dfad0d34a995cc329aae43855a8a4c6d2ea5141723489f8a99e5e983f8
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cb5fdf2d06b318865cee65dfc8f4119cabbe3c5273190785df1942baeb4bbdb
3
  size 6776