Training in progress, epoch 1

- model.safetensors +1 -1
- special_tokens_map.json +35 -5
- tokenizer_config.json +2 -2
- training_args.bin +1 -1
- vocab.txt +63 -63
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:65166500b7570db3dcfc88aa524185976006495bf5022e94d8c625a32dd10b52
 size 439790024
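Both model.safetensors and training_args.bin are stored through Git LFS, so the diffs here only touch the three-line pointer file: the sha256 oid changes with every new set of weights while the pointer format stays fixed. A minimal sketch of reading such a pointer follows; read_lfs_pointer is a hypothetical helper, not part of git or transformers.

# Minimal sketch: parse a Git LFS pointer file like the one diffed above.
from pathlib import Path

def read_lfs_pointer(path: str) -> dict:
    """Split each 'key value' line of an LFS pointer into a dict."""
    fields = {}
    for line in Path(path).read_text().splitlines():
        key, _, value = line.partition(" ")
        fields[key] = value
    return fields

ptr = read_lfs_pointer("model.safetensors")
print(ptr["oid"])   # sha256:65166500b7570db3dcfc88aa524185976006495bf5022e94d8c625a32dd10b52
print(ptr["size"])  # 439790024 (~440 MB of weights kept in LFS storage)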
special_tokens_map.json
CHANGED
@@ -1,7 +1,37 @@
 {
-  "cls_token": "[CLS]",
-  "mask_token": "[MASK]",
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "unk_token": "[UNK]"
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
 }
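The change above replaces each bare special-token string with a full AddedToken-style record, making the lstrip/rstrip/normalized/single_word behavior explicit instead of left to defaults. A minimal sketch of how the saved map surfaces after loading; "./checkpoint" is a placeholder path, not part of this repo.

# Minimal sketch: load the tokenizer from this checkpoint directory and
# inspect the special tokens defined in special_tokens_map.json.
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("./checkpoint")  # placeholder path
print(tok.cls_token, tok.sep_token, tok.pad_token)   # [CLS] [SEP] [PAD]
print(tok.special_tokens_map)                        # role -> token string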
tokenizer_config.json
CHANGED
@@ -46,11 +46,11 @@
   "do_basic_tokenize": true,
   "do_lower_case": false,
   "mask_token": "[MASK]",
-  "model_max_length":
+  "model_max_length": 512,
   "never_split": null,
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
-  "strip_accents":
+  "strip_accents": false,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
   "unk_token": "[UNK]"
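Two values are now pinned: model_max_length becomes 512, BERT's usual positional limit, and strip_accents becomes false, which matters for a cased vocabulary that keeps accented characters distinct (see the Á/É/Í/Ó/Ú entries added to vocab.txt below). A minimal sketch of the effect on truncation, again with a placeholder path:

# Minimal sketch: with model_max_length = 512, truncation now has a
# concrete upper bound. "./checkpoint" is a placeholder path.
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("./checkpoint")
enc = tok("palabra " * 1000, truncation=True)
print(tok.model_max_length)   # 512
print(len(enc["input_ids"]))  # at most 512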
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:16e9276b4277f952eb2837dbd135ea42fc6615b865442e8c8ec1bf00f6101c18
 size 4984
vocab.txt
CHANGED
@@ -939,69 +939,69 @@
 [unused932]
 [unused933]
 [unused934]
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-[
-[
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+##|
+|
+##}
+}
+##{
+{
+##_
+_
+##+
++
+##*
+*
+##&
+&
+##$
+$
+##]
+]
+##[
+[
+##=
+=
+##>
+>
+##<
+<
+##@
+@
+##\
+\
+##/
+/
+##%
+%
+##;
+;
+##7
+7
+##w
+ñ
+##k
+k
+##Z
+Z
+##X
+X
+##W
+##Ñ
+Ñ
+##K
+K
+##J
+J
+##Ú
+Ú
+##Ó
+Ó
+##Í
+Í
+##É
+É
+##Á
+Á
 w
 W
 ##de
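In a WordPiece vocab.txt, a token's id is its zero-based line number, and the ## prefix marks a piece that may only continue a word, so the replacements above re-assign ids 941-1003 from unused slots to punctuation, digits, and cased/accented characters plus their ## variants. A minimal sketch of reading the vocabulary directly:

# Minimal sketch: build the token -> id map straight from vocab.txt;
# the id of a token is just its zero-based line number.
with open("vocab.txt", encoding="utf-8") as f:
    vocab = {line.rstrip("\n"): i for i, line in enumerate(f)}

print(vocab["[unused934]"])  # 940, i.e. line 941 in the diff above
print("##de" in vocab)       # True; "##de" only attaches word-internally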