asquevedos committed on
Commit
cc629bf
·
verified ·
1 Parent(s): 5d6b5c4

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e7fe573beeb54eecdee0ac28d30341a82c03d93867a8b2f63ce5bfb20e334fa
3
  size 439790024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65166500b7570db3dcfc88aa524185976006495bf5022e94d8c625a32dd10b52
3
  size 439790024
special_tokens_map.json CHANGED
@@ -1,7 +1,37 @@
1
  {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
 
1
  {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
  }
tokenizer_config.json CHANGED
@@ -46,11 +46,11 @@
46
  "do_basic_tokenize": true,
47
  "do_lower_case": false,
48
  "mask_token": "[MASK]",
49
- "model_max_length": 1000000000000000019884624838656,
50
  "never_split": null,
51
  "pad_token": "[PAD]",
52
  "sep_token": "[SEP]",
53
- "strip_accents": null,
54
  "tokenize_chinese_chars": true,
55
  "tokenizer_class": "BertTokenizer",
56
  "unk_token": "[UNK]"
 
46
  "do_basic_tokenize": true,
47
  "do_lower_case": false,
48
  "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
  "never_split": null,
51
  "pad_token": "[PAD]",
52
  "sep_token": "[SEP]",
53
+ "strip_accents": false,
54
  "tokenize_chinese_chars": true,
55
  "tokenizer_class": "BertTokenizer",
56
  "unk_token": "[UNK]"
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2236158fa6e2c71392fc91511517f280b8c284bd525c7a5f30a4b9d9f2ef853
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16e9276b4277f952eb2837dbd135ea42fc6615b865442e8c8ec1bf00f6101c18
3
  size 4984
vocab.txt CHANGED
@@ -939,69 +939,69 @@
939
  [unused932]
940
  [unused933]
941
  [unused934]
942
- [unused935]
943
- [unused936]
944
- [unused937]
945
- [unused938]
946
- [unused939]
947
- [unused940]
948
- [unused941]
949
- [unused942]
950
- [unused943]
951
- [unused944]
952
- [unused945]
953
- [unused946]
954
- [unused947]
955
- [unused948]
956
- [unused949]
957
- [unused950]
958
- [unused951]
959
- [unused952]
960
- [unused953]
961
- [unused954]
962
- [unused955]
963
- [unused956]
964
- [unused957]
965
- [unused958]
966
- [unused959]
967
- [unused960]
968
- [unused961]
969
- [unused962]
970
- [unused963]
971
- [unused964]
972
- [unused965]
973
- [unused966]
974
- [unused967]
975
- [unused968]
976
- [unused969]
977
- [unused970]
978
- [unused971]
979
- [unused972]
980
- [unused973]
981
- [unused974]
982
- [unused975]
983
- [unused976]
984
- [unused977]
985
- [unused978]
986
- [unused979]
987
- [unused980]
988
- [unused981]
989
- [unused982]
990
- [unused983]
991
- [unused984]
992
- [unused985]
993
- [unused986]
994
- [unused987]
995
- [unused988]
996
- [unused989]
997
- [unused990]
998
- [unused991]
999
- [unused992]
1000
- [unused993]
1001
- [unused994]
1002
- [unused995]
1003
- [unused996]
1004
- [unused997]
1005
  w
1006
  W
1007
  ##de
 
939
  [unused932]
940
  [unused933]
941
  [unused934]
942
+ ##|
943
+ |
944
+ ##}
945
+ }
946
+ ##{
947
+ {
948
+ ##_
949
+ _
950
+ ##+
951
+ +
952
+ ##*
953
+ *
954
+ ##&
955
+ &
956
+ ##$
957
+ $
958
+ ##]
959
+ ]
960
+ ##[
961
+ [
962
+ ##=
963
+ =
964
+ ##>
965
+ >
966
+ ##<
967
+ <
968
+ ##@
969
+ @
970
+ ##\
971
+ \
972
+ ##/
973
+ /
974
+ ##%
975
+ %
976
+ ##;
977
+ ;
978
+ ##7
979
+ 7
980
+ ##w
981
+ ñ
982
+ ##k
983
+ k
984
+ ##Z
985
+ Z
986
+ ##X
987
+ X
988
+ ##W
989
+ ##Ñ
990
+ Ñ
991
+ ##K
992
+ K
993
+ ##J
994
+ J
995
+ ##Ú
996
+ Ú
997
+ ##Ó
998
+ Ó
999
+ ##Í
1000
+ Í
1001
+ ##É
1002
+ É
1003
+ ##Á
1004
+ Á
1005
  w
1006
  W
1007
  ##de