mahrnoud committed on
Commit
017af27
·
1 Parent(s): 6825cf2

Update Tokenizer

Browse files
Files changed (2) hide show
  1. tokenizer.json +2 -2
  2. tokenizer_config.json +2 -1
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae919b28537a24ab14728cdb016a2c3b0bdda997cb9e53779b168ab5500caf89
3
- size 14975662
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:046482a5ffbb33555a23deffdafbc1c85384660eb2ca4d4bb83ed91c06d62992
3
+ size 5000773
tokenizer_config.json CHANGED
@@ -67,7 +67,8 @@
67
  },
68
  "additional_special_tokens": [
69
  "[LANG_EN]",
70
- "[LANG_AR]"
 
71
  ],
72
  "clean_up_tokenization_spaces": true,
73
  "cls_token": "[CLS]",
 
67
  },
68
  "additional_special_tokens": [
69
  "[LANG_EN]",
70
+ "[LANG_AR]",
71
+ "[LANG_AR_EG]"
72
  ],
73
  "clean_up_tokenization_spaces": true,
74
  "cls_token": "[CLS]",