KoichiYasuoka
committed on
Commit
·
fdfb365
1
Parent(s):
e44aa2c
model improved
Browse files
config.json
CHANGED
@@ -2,7 +2,6 @@
|
|
2 |
"architectures": [
|
3 |
"MistralForTokenClassification"
|
4 |
],
|
5 |
-
"attention_bias": false,
|
6 |
"attention_dropout": 0.0,
|
7 |
"auto_map": {
|
8 |
"AutoModelForTokenClassification": "upos.MistralForTokenClassification"
|
@@ -152,14 +151,11 @@
|
|
152 |
"X": 57
|
153 |
},
|
154 |
"max_position_embeddings": 32768,
|
155 |
-
"
|
156 |
-
"model_type": "llama",
|
157 |
"num_attention_heads": 32,
|
158 |
"num_hidden_layers": 32,
|
159 |
"num_key_value_heads": 8,
|
160 |
-
"pretraining_tp": 1,
|
161 |
"rms_norm_eps": 1e-05,
|
162 |
-
"rope_scaling": null,
|
163 |
"rope_theta": 10000.0,
|
164 |
"sliding_window": 4096,
|
165 |
"tie_word_embeddings": false,
|
|
|
2 |
"architectures": [
|
3 |
"MistralForTokenClassification"
|
4 |
],
|
|
|
5 |
"attention_dropout": 0.0,
|
6 |
"auto_map": {
|
7 |
"AutoModelForTokenClassification": "upos.MistralForTokenClassification"
|
|
|
151 |
"X": 57
|
152 |
},
|
153 |
"max_position_embeddings": 32768,
|
154 |
+
"model_type": "mistral",
|
|
|
155 |
"num_attention_heads": 32,
|
156 |
"num_hidden_layers": 32,
|
157 |
"num_key_value_heads": 8,
|
|
|
158 |
"rms_norm_eps": 1e-05,
|
|
|
159 |
"rope_theta": 10000.0,
|
160 |
"sliding_window": 4096,
|
161 |
"tie_word_embeddings": false,
|
pytorch_model-00001-of-00006.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4913773120
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9390f326afba489dfb25938fe3e8f2f8d1d7227d1eb8b33d92a24069dced0b6f
|
3 |
size 4913773120
|
pytorch_model-00002-of-00006.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999825256
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:138623c84c3e5d85b51ae8017f08b39958a38f3dfb3978e16dc8d50d87209476
|
3 |
size 4999825256
|
pytorch_model-00003-of-00006.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999825316
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:708976207133843ca3ae6c243cca9d5f54e8e089c695dcd910234e78149fb472
|
3 |
size 4999825316
|
pytorch_model-00004-of-00006.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4832018324
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50c0d1273e3cc6e45ccdc865e3d78bac97353b6181bb640a6664f5e831f80d8c
|
3 |
size 4832018324
|
pytorch_model-00005-of-00006.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999825320
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b0c0e4fdb9b4893ca0ab5ff41d3cff0162f54a20823b13369720e68308fca53
|
3 |
size 4999825320
|
pytorch_model-00006-of-00006.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3960601264
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:076923a6b328a83f9c8030cfa6fbd91d8f30d9f6a9fedda4ba069152e0f16a81
|
3 |
size 3960601264
|