ljvmiranda921 committed on
Commit
88246bc
·
1 Parent(s): 8be416f

el_cop_sigtyp_trf-0.1.0: Update SIGTYP pipeline

Browse files
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ el_cop_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
37
+ transformer/model filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - spacy
4
+ - token-classification
5
+ language:
6
+ - el
7
+ model-index:
8
+ - name: el_cop_sigtyp_trf
9
+ results:
10
+ - task:
11
+ name: TAG
12
+ type: token-classification
13
+ metrics:
14
+ - name: TAG (XPOS) Accuracy
15
+ type: accuracy
16
+ value: 0.2871376812
17
+ - task:
18
+ name: POS
19
+ type: token-classification
20
+ metrics:
21
+ - name: POS (UPOS) Accuracy
22
+ type: accuracy
23
+ value: 0.2895531401
24
+ - task:
25
+ name: MORPH
26
+ type: token-classification
27
+ metrics:
28
+ - name: Morph (UFeats) Accuracy
29
+ type: accuracy
30
+ value: 0.2904589372
31
+ - task:
32
+ name: LEMMA
33
+ type: token-classification
34
+ metrics:
35
+ - name: Lemma Accuracy
36
+ type: accuracy
37
+ value: 0.2949879227
38
+ - task:
39
+ name: UNLABELED_DEPENDENCIES
40
+ type: token-classification
41
+ metrics:
42
+ - name: Unlabeled Attachment Score (UAS)
43
+ type: f_score
44
+ value: 0.0240105541
45
+ - task:
46
+ name: LABELED_DEPENDENCIES
47
+ type: token-classification
48
+ metrics:
49
+ - name: Labeled Attachment Score (LAS)
50
+ type: f_score
51
+ value: 0.0216358839
52
+ - task:
53
+ name: SENTS
54
+ type: token-classification
55
+ metrics:
56
+ - name: Sentences F-Score
57
+ type: f_score
58
+ value: 0.9234234234
59
+ ---
60
+ | Feature | Description |
61
+ | --- | --- |
62
+ | **Name** | `el_cop_sigtyp_trf` |
63
+ | **Version** | `0.1.0` |
64
+ | **spaCy** | `>=3.6.1,<3.7.0` |
65
+ | **Default Pipeline** | `transformer`, `parser`, `trainable_lemmatizer`, `tagger`, `morphologizer` |
66
+ | **Components** | `transformer`, `parser`, `trainable_lemmatizer`, `tagger`, `morphologizer` |
67
+ | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
68
+ | **Sources** | n/a |
69
+ | **License** | n/a |
70
+ | **Author** | n/a |
71
+
72
+ ### Label Scheme
73
+
74
+ <details>
75
+
76
+ <summary>View label scheme (293 labels for 3 components)</summary>
77
+
78
+ | Component | Labels |
79
+ | --- | --- |
80
+ | **`parser`** | `ROOT`, `acl:relcl`, `advcl`, `advmod`, `appos`, `aux`, `case`, `cc`, `ccomp`, `conj`, `cop`, `csubj`, `dep`, `det`, `discourse`, `dislocated`, `fixed`, `flat`, `iobj`, `mark`, `nmod`, `nsubj`, `nummod`, `obj`, `obl`, `obl:npmod`, `parataxis`, `punct`, `vocative`, `xcomp` |
81
+ | **`tagger`** | `AAOR`, `ACAUS`, `ACOND`, `ACOND_PPERS`, `ACOND_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `ACOND_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=3\|PronType=Prs`, `ACOND_PPERS__Definite=Def\|Gender=Masc\|Number=Sing\|Person=2\|PronType=Prs`, `ACOND_PPERS__Definite=Def\|Gender=Masc\|Number=Sing\|Person=3\|PronType=Prs`, `ACOND_PPERS__Definite=Def\|Number=Plur\|Person=1\|PronType=Prs`, `ACOND_PPERS__Definite=Def\|Number=Plur\|Person=2\|PronType=Prs`, `ACOND_PPERS__Definite=Def\|Number=Plur\|Person=3\|PronType=Prs`, `ACOND_PPERS__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `ACONJ`, `ACONJ_PPERS`, `ACONJ_PPERS__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `ADV`, `ADV__Foreign=Yes`, `AFUTCONJ`, `AJUS`, `ALIM`, `ANEGAOR__Polarity=Neg`, `ANEGJUS__Polarity=Neg`, `ANEGOPT__Polarity=Neg`, `ANEGPST_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|Polarity=Neg\|PronType=Prs`, `ANEGPST__Polarity=Neg`, `ANY__Polarity=Neg`, `AOPT`, `AOPT_PPERS`, `AOPT_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `AOPT_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=3\|PronType=Prs`, `AOPT_PPERS__Definite=Def\|Gender=Masc\|Number=Sing\|Person=2\|PronType=Prs`, `AOPT_PPERS__Definite=Def\|Gender=Masc\|Number=Sing\|Person=3\|PronType=Prs`, `AOPT_PPERS__Definite=Def\|Number=Plur\|Person=2\|PronType=Prs`, `AOPT_PPERS__Definite=Def\|Number=Plur\|Person=3\|PronType=Prs`, `AOPT_PPERS__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `APREC`, `APST`, `APST_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `ART`, `ART__Definite=Def\|Gender=Fem\|Number=Sing\|PronType=Art`, `ART__Definite=Def\|Gender=Masc\|Number=Sing\|PronType=Art`, `ART__Definite=Def\|Number=Plur\|PronType=Art`, `ART__Definite=Ind\|Number=Sing\|PronType=Art`, `ART__PronType=Art`, `CCIRC`, `CCIRC_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, 
`CCIRC_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=3\|PronType=Prs`, `CFOC`, `CFOC_PPERS`, `CFOC_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `CONJ`, `CONJ__Foreign=Yes`, `CONJ__Foreign=Yes\|Polarity=Neg`, `COP__Gender=Fem\|Number=Sing`, `COP__Gender=Masc\|Number=Sing`, `COP__Number=Plur`, `CPRET`, `CPRET_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `CREL`, `CREL_PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `EXIST`, `EXIST__Foreign=Yes`, `EXIST__Polarity=Neg`, `FM`, `FM__Foreign=Yes`, `FM__Foreign=Yes\|Polarity=Neg`, `FM__Polarity=Neg`, `FUT`, `IMOD`, `IMOD_PPERO__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `IMOD__Definite=Def\|PronType=Prs\|Reflex=Yes`, `IMOD__PronType=Tot`, `N`, `NEG__Foreign=Yes\|Polarity=Neg`, `NEG__Polarity=Neg`, `NPROP`, `NPROP__Foreign=Yes`, `NUM__Foreign=Yes\|NumType=Card`, `NUM__NumType=Card`, `N_PPERO__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `N_PPERO__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `N__Foreign=Yes`, `N__PronType=Rcp`, `PDEM`, `PDEM__Definite=Def\|Foreign=Yes\|Number=Plur\|PronType=Dem`, `PDEM__Definite=Def\|Gender=Fem\|Number=Sing\|PronType=Dem`, `PDEM__Definite=Def\|Gender=Masc\|Number=Sing\|PronType=Dem`, `PDEM__Definite=Def\|Number=Plur\|PronType=Dem`, `PINT__PronType=Ind`, `PINT__PronType=Int`, `PPERI__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `PPERI__Definite=Def\|Gender=Fem\|Number=Sing\|Person=3\|PronType=Prs`, `PPERI__Definite=Def\|Gender=Masc\|Number=Sing\|Person=2\|PronType=Prs`, `PPERI__Definite=Def\|Gender=Masc\|Number=Sing\|Person=3\|PronType=Prs`, `PPERI__Definite=Def\|Number=Plur\|Person=1\|PronType=Prs`, `PPERI__Definite=Def\|Number=Plur\|Person=2\|PronType=Prs`, `PPERI__Definite=Def\|Number=Plur\|Person=3\|PronType=Prs`, `PPERI__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `PPERO`, `PPERO__Definite=Def\|Foreign=Yes\|Number=Plur\|Person=3\|PronType=Prs`, 
`PPERO__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `PPERO__Definite=Def\|Gender=Fem\|Number=Sing\|Person=3\|PronType=Prs`, `PPERO__Definite=Def\|Gender=Masc\|Number=Sing\|Person=2\|PronType=Prs`, `PPERO__Definite=Def\|Gender=Masc\|Number=Sing\|Person=3\|PronType=Prs`, `PPERO__Definite=Def\|Number=Plur\|Person=1\|PronType=Prs`, `PPERO__Definite=Def\|Number=Plur\|Person=2\|PronType=Prs`, `PPERO__Definite=Def\|Number=Plur\|Person=3\|PronType=Prs`, `PPERO__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `PPERO__Definite=Def\|Poss=Yes\|PronType=Prs`, `PPERS`, `PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, `PPERS__Definite=Def\|Gender=Fem\|Number=Sing\|Person=3\|PronType=Prs`, `PPERS__Definite=Def\|Gender=Masc\|Number=Sing\|Person=2\|PronType=Prs`, `PPERS__Definite=Def\|Gender=Masc\|Number=Sing\|Person=3\|PronType=Prs`, `PPERS__Definite=Def\|Number=Plur\|Person=1\|PronType=Prs`, `PPERS__Definite=Def\|Number=Plur\|Person=2\|PronType=Prs`, `PPERS__Definite=Def\|Number=Plur\|Person=3\|PronType=Prs`, `PPERS__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `PPOS`, `PPOS__Definite=Def\|Gender=Fem\|Gender[psor]=Fem\|Number=Sing\|Number[psor]=Sing\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Fem\|Gender[psor]=Fem\|Number=Sing\|Number[psor]=Sing\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Fem\|Gender[psor]=Masc\|Number=Sing\|Number[psor]=Sing\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Fem\|Gender[psor]=Masc\|Number=Sing\|Number[psor]=Sing\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Fem\|Number=Sing\|Number[psor]=Plur\|Person=1\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Fem\|Number=Sing\|Number[psor]=Plur\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Fem\|Number=Sing\|Number[psor]=Plur\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Fem\|Number=Sing\|Number[psor]=Sing\|Person=1\|Poss=Yes\|PronType=Prs`, 
`PPOS__Definite=Def\|Gender=Fem\|Number=Sing\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Gender[psor]=Fem\|Number=Sing\|Number[psor]=Sing\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Gender[psor]=Fem\|Number=Sing\|Number[psor]=Sing\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Gender[psor]=Masc\|Number=Sing\|Number[psor]=Sing\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Gender[psor]=Masc\|Number=Sing\|Number[psor]=Sing\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Number=Sing\|Number[psor]=Plur\|Person=1\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Number=Sing\|Number[psor]=Plur\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Number=Sing\|Number[psor]=Plur\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Number=Sing\|Number[psor]=Sing\|Person=1\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender=Masc\|Number=Sing\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender[psor]=Fem\|Number=Plur\|Number[psor]=Sing\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender[psor]=Fem\|Number=Plur\|Number[psor]=Sing\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender[psor]=Masc\|Number=Plur\|Number[psor]=Sing\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Gender[psor]=Masc\|Number=Plur\|Number[psor]=Sing\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Number=Plur\|Number[psor]=Plur\|Person=1\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Number=Plur\|Number[psor]=Plur\|Person=2\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Number=Plur\|Number[psor]=Plur\|Person=3\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Number=Plur\|Number[psor]=Sing\|Person=1\|Poss=Yes\|PronType=Prs`, `PPOS__Definite=Def\|Number=Plur\|Poss=Yes\|PronType=Prs`, `PREP`, `PREP_PPERO`, `PREP_PPERO__Definite=Def\|Gender=Fem\|Number=Sing\|Person=2\|PronType=Prs`, 
`PREP_PPERO__Definite=Def\|Number=Sing\|Person=1\|PronType=Prs`, `PREP__Foreign=Yes`, `PTC`, `PTC__Foreign=Yes`, `PTC__Polarity=Neg`, `PUNCT`, `UNKNOWN`, `UNKNOWN__Foreign=Yes`, `VBD__VerbForm=Fin`, `VIMP__Foreign=Yes\|VerbForm=Fin`, `VIMP__VerbForm=Fin`, `VSTAT__VerbForm=Fin`, `V_PPERO__VerbForm=Fin`, `V__Foreign=Yes\|VerbForm=Fin`, `V__Foreign=Yes\|VerbForm=Inf`, `V__VerbForm=Fin`, `V__VerbForm=Inf` |
82
+ | **`morphologizer`** | `POS=AUX`, `Definite=Def\|Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `POS=VERB\|VerbForm=Fin`, `POS=ADP`, `POS=PUNCT`, `Foreign=Yes\|POS=PART`, `POS=PART`, `Definite=Def\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `Foreign=Yes\|POS=NOUN`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Art`, `POS=NOUN`, `POS=CCONJ`, `POS=SCONJ`, `POS=ADV`, `POS=VERB`, `Definite=Def\|Gender=Masc\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Definite=Def\|Gender=Masc\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `POS=PRON\|PronType=Int`, `POS=AUX\|Polarity=Neg`, `Definite=Def\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Foreign=Yes\|POS=CCONJ`, `Definite=Def\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Foreign=Yes\|POS=VERB\|VerbForm=Fin`, `Foreign=Yes\|POS=PROPN`, `Definite=Def\|Gender=Fem\|Gender[psor]=Masc\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=VERB\|Polarity=Neg`, `Gender=Masc\|Number=Sing\|POS=PRON`, `Definite=Def\|Number=Plur\|Number[psor]=Plur\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=NOUN\|PronType=Rcp`, `Definite=Def\|Number=Plur\|POS=DET\|PronType=Art`, `POS=ADV\|PronType=Tot`, `Definite=Def\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Definite=Ind\|Number=Sing\|POS=DET\|PronType=Art`, `Definite=Def\|Gender=Masc\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=PROPN`, `Definite=Def\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Gender[psor]=Masc\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `POS=ADV\|Polarity=Neg`, `Definite=Def\|Number=Plur\|POS=DET\|PronType=Dem`, `POS=PRON\|PronType=Ind`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Dem`, 
`Definite=Def\|Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender[psor]=Masc\|Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Masc\|Gender[psor]=Masc\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `POS=VERB\|VerbForm=Inf`, `Definite=Def\|Gender=Masc\|Gender[psor]=Masc\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Gender[psor]=Fem\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `NumType=Card\|POS=NUM`, `Definite=Def\|Gender=Masc\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender[psor]=Masc\|Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Number=Plur\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Definite=Def\|POS=ADV\|PronType=Prs\|Reflex=Yes`, `Definite=Def\|Gender=Fem\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=AUX\|VerbForm=Fin`, `Foreign=Yes\|POS=ADV`, `Definite=Def\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `POS=DET\|PronType=Art`, `Foreign=Yes\|POS=ADP`, `Number=Plur\|POS=PRON`, `Foreign=Yes\|POS=SCONJ`, `Definite=Def\|Gender=Masc\|Number=Sing\|POS=DET\|Poss=Yes\|PronType=Prs`, `Gender=Fem\|Number=Sing\|POS=PRON`, `POS=X`, `Definite=Def\|Number=Plur\|Number[psor]=Plur\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Foreign=Yes\|POS=CCONJ\|Polarity=Neg`, `Foreign=Yes\|POS=VERB\|VerbForm=Inf`, `Definite=Def\|Gender[psor]=Fem\|Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `POS=ADJ`, `POS=DET`, `Definite=Def\|Gender=Fem\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, 
`POS=PRON`, `Foreign=Yes\|POS=ADV\|Polarity=Neg`, `Definite=Def\|Gender=Masc\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Gender[psor]=Fem\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Masc\|Gender[psor]=Fem\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `POS=PRON\|VerbForm=Fin`, `Definite=Def\|Gender=Masc\|Gender[psor]=Fem\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `Foreign=Yes\|POS=X`, `Definite=Def\|Gender=Fem\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Number=Plur\|POS=DET\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Foreign=Yes\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Definite=Def\|Gender[psor]=Fem\|Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=X\|Polarity=Neg`, `POS=ADV\|PronType=Int`, `Definite=Def\|Foreign=Yes\|Number=Plur\|POS=DET\|PronType=Dem`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=PRON\|Person=2\|Polarity=Neg\|PronType=Prs`, `Foreign=Yes\|POS=AUX`, `POS=PART\|Polarity=Neg`, `Foreign=Yes\|NumType=Card\|POS=NUM`, `Foreign=Yes\|POS=X\|Polarity=Neg`, `Foreign=Yes\|POS=SCONJ\|Polarity=Neg`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=DET\|Poss=Yes\|PronType=Prs`, `Foreign=Yes\|POS=ADJ` |
83
+
84
+ </details>
85
+
86
+ ### Accuracy
87
+
88
+ | Type | Score |
89
+ | --- | --- |
90
+ | `DEP_UAS` | 2.40 |
91
+ | `DEP_LAS` | 2.16 |
92
+ | `SENTS_P` | 89.91 |
93
+ | `SENTS_R` | 94.91 |
94
+ | `SENTS_F` | 92.34 |
95
+ | `LEMMA_ACC` | 29.50 |
96
+ | `TAG_ACC` | 28.71 |
97
+ | `POS_ACC` | 28.96 |
98
+ | `MORPH_ACC` | 29.05 |
99
+ | `TRANSFORMER_LOSS` | 50704.88 |
100
+ | `PARSER_LOSS` | 36557.89 |
101
+ | `TRAINABLE_LEMMATIZER_LOSS` | 5620.72 |
102
+ | `TAGGER_LOSS` | 5386.44 |
103
+ | `MORPHOLOGIZER_LOSS` | 4269.79 |
config.cfg ADDED
@@ -0,0 +1,211 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [paths]
2
+ train = "corpus/train/cop_train.spacy"
3
+ dev = "corpus/dev/cop_valid.spacy"
4
+ vectors = null
5
+ init_tok2vec = null
6
+
7
+ [system]
8
+ gpu_allocator = "pytorch"
9
+ seed = 42
10
+
11
+ [nlp]
12
+ lang = "el"
13
+ pipeline = ["transformer","parser","trainable_lemmatizer","tagger","morphologizer"]
14
+ batch_size = 128
15
+ disabled = []
16
+ before_creation = null
17
+ after_creation = null
18
+ after_pipeline_creation = null
19
+ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
+
21
+ [components]
22
+
23
+ [components.morphologizer]
24
+ factory = "morphologizer"
25
+ extend = false
26
+ label_smoothing = 0.0
27
+ overwrite = true
28
+ scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
29
+
30
+ [components.morphologizer.model]
31
+ @architectures = "spacy.Tagger.v2"
32
+ nO = null
33
+ normalize = false
34
+
35
+ [components.morphologizer.model.tok2vec]
36
+ @architectures = "spacy-transformers.TransformerListener.v1"
37
+ grad_factor = 1.0
38
+ pooling = {"@layers":"reduce_mean.v1"}
39
+ upstream = "*"
40
+
41
+ [components.parser]
42
+ factory = "parser"
43
+ learn_tokens = false
44
+ min_action_freq = 30
45
+ moves = null
46
+ scorer = {"@scorers":"spacy.parser_scorer.v1"}
47
+ update_with_oracle_cut_size = 100
48
+
49
+ [components.parser.model]
50
+ @architectures = "spacy.TransitionBasedParser.v2"
51
+ state_type = "parser"
52
+ extra_state_tokens = false
53
+ hidden_width = 128
54
+ maxout_pieces = 3
55
+ use_upper = false
56
+ nO = null
57
+
58
+ [components.parser.model.tok2vec]
59
+ @architectures = "spacy-transformers.TransformerListener.v1"
60
+ grad_factor = 1.0
61
+ pooling = {"@layers":"reduce_mean.v1"}
62
+ upstream = "*"
63
+
64
+ [components.tagger]
65
+ factory = "tagger"
66
+ label_smoothing = 0.0
67
+ neg_prefix = "!"
68
+ overwrite = false
69
+ scorer = {"@scorers":"spacy.tagger_scorer.v1"}
70
+
71
+ [components.tagger.model]
72
+ @architectures = "spacy.Tagger.v2"
73
+ nO = null
74
+ normalize = false
75
+
76
+ [components.tagger.model.tok2vec]
77
+ @architectures = "spacy-transformers.TransformerListener.v1"
78
+ grad_factor = 1.0
79
+ pooling = {"@layers":"reduce_mean.v1"}
80
+ upstream = "*"
81
+
82
+ [components.trainable_lemmatizer]
83
+ factory = "trainable_lemmatizer"
84
+ backoff = "orth"
85
+ min_tree_freq = 3
86
+ overwrite = false
87
+ scorer = {"@scorers":"spacy.lemmatizer_scorer.v1"}
88
+ top_k = 1
89
+
90
+ [components.trainable_lemmatizer.model]
91
+ @architectures = "spacy.Tagger.v2"
92
+ nO = null
93
+ normalize = false
94
+
95
+ [components.trainable_lemmatizer.model.tok2vec]
96
+ @architectures = "spacy-transformers.TransformerListener.v1"
97
+ grad_factor = 1.0
98
+ pooling = {"@layers":"reduce_mean.v1"}
99
+ upstream = "*"
100
+
101
+ [components.transformer]
102
+ factory = "transformer"
103
+ max_batch_items = 4096
104
+ set_extra_annotations = {"@annotation_setters":"spacy-transformers.null_annotation_setter.v1"}
105
+
106
+ [components.transformer.model]
107
+ @architectures = "spacy-transformers.TransformerModel.v3"
108
+ name = "ljvmiranda921/LiBERTus-base"
109
+ mixed_precision = false
110
+
111
+ [components.transformer.model.get_spans]
112
+ @span_getters = "spacy-transformers.strided_spans.v1"
113
+ window = 128
114
+ stride = 96
115
+
116
+ [components.transformer.model.grad_scaler_config]
117
+
118
+ [components.transformer.model.tokenizer_config]
119
+ use_fast = true
120
+
121
+ [components.transformer.model.transformer_config]
122
+
123
+ [corpora]
124
+
125
+ [corpora.dev]
126
+ @readers = "spacy.Corpus.v1"
127
+ path = ${paths.dev}
128
+ max_length = 0
129
+ gold_preproc = false
130
+ limit = 0
131
+ augmenter = null
132
+
133
+ [corpora.train]
134
+ @readers = "spacy.Corpus.v1"
135
+ path = ${paths.train}
136
+ max_length = 0
137
+ gold_preproc = false
138
+ limit = 0
139
+ augmenter = null
140
+
141
+ [training]
142
+ accumulate_gradient = 3
143
+ dev_corpus = "corpora.dev"
144
+ train_corpus = "corpora.train"
145
+ seed = ${system.seed}
146
+ gpu_allocator = ${system.gpu_allocator}
147
+ dropout = 0.1
148
+ patience = 1600
149
+ max_epochs = 0
150
+ max_steps = 20000
151
+ eval_frequency = 200
152
+ frozen_components = []
153
+ annotating_components = []
154
+ before_to_disk = null
155
+ before_update = null
156
+
157
+ [training.batcher]
158
+ @batchers = "spacy.batch_by_padded.v1"
159
+ discard_oversize = true
160
+ size = 2000
161
+ buffer = 256
162
+ get_length = null
163
+
164
+ [training.logger]
165
+ @loggers = "spacy.ConsoleLogger.v3"
166
+ console_output = true
167
+ progress_bar = "eval"
168
+ output_file = null
169
+
170
+ [training.optimizer]
171
+ @optimizers = "Adam.v1"
172
+ beta1 = 0.9
173
+ beta2 = 0.999
174
+ L2_is_weight_decay = true
175
+ L2 = 0.01
176
+ grad_clip = 1.0
177
+ use_averages = false
178
+ eps = 0.00000001
179
+
180
+ [training.optimizer.learn_rate]
181
+ @schedules = "warmup_linear.v1"
182
+ warmup_steps = 250
183
+ total_steps = 20000
184
+ initial_rate = 0.00005
185
+
186
+ [training.score_weights]
187
+ dep_uas = 0.09
188
+ dep_las = 0.09
189
+ dep_las_per_type = null
190
+ sents_p = null
191
+ sents_r = null
192
+ sents_f = 0.0
193
+ lemma_acc = 0.17
194
+ tag_acc = 0.17
195
+ pos_acc = 0.25
196
+ morph_acc = 0.25
197
+ morph_per_feat = null
198
+
199
+ [pretraining]
200
+
201
+ [initialize]
202
+ vectors = ${paths.vectors}
203
+ init_tok2vec = ${paths.init_tok2vec}
204
+ vocab_data = null
205
+ lookups = null
206
+ before_init = null
207
+ after_init = null
208
+
209
+ [initialize.components]
210
+
211
+ [initialize.tokenizer]
el_cop_sigtyp_trf-any-py3-none-any.whl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75aa38e9b0bebe78a09167c28bfea17cd6e5357ca0988572a4c48ba990398a57
3
+ size 468549780
meta.json ADDED
@@ -0,0 +1,587 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "lang":"el",
3
+ "name":"cop_sigtyp_trf",
4
+ "version":"0.1.0",
5
+ "description":"",
6
+ "author":"",
7
+ "email":"",
8
+ "url":"",
9
+ "license":"",
10
+ "spacy_version":">=3.6.1,<3.7.0",
11
+ "spacy_git_version":"458bc5f45",
12
+ "vectors":{
13
+ "width":0,
14
+ "vectors":0,
15
+ "keys":0,
16
+ "name":null
17
+ },
18
+ "labels":{
19
+ "transformer":[
20
+
21
+ ],
22
+ "parser":[
23
+ "ROOT",
24
+ "acl:relcl",
25
+ "advcl",
26
+ "advmod",
27
+ "appos",
28
+ "aux",
29
+ "case",
30
+ "cc",
31
+ "ccomp",
32
+ "conj",
33
+ "cop",
34
+ "csubj",
35
+ "dep",
36
+ "det",
37
+ "discourse",
38
+ "dislocated",
39
+ "fixed",
40
+ "flat",
41
+ "iobj",
42
+ "mark",
43
+ "nmod",
44
+ "nsubj",
45
+ "nummod",
46
+ "obj",
47
+ "obl",
48
+ "obl:npmod",
49
+ "parataxis",
50
+ "punct",
51
+ "vocative",
52
+ "xcomp"
53
+ ],
54
+ "tagger":[
55
+ "AAOR",
56
+ "ACAUS",
57
+ "ACOND",
58
+ "ACOND_PPERS",
59
+ "ACOND_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
60
+ "ACOND_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
61
+ "ACOND_PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
62
+ "ACOND_PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
63
+ "ACOND_PPERS__Definite=Def|Number=Plur|Person=1|PronType=Prs",
64
+ "ACOND_PPERS__Definite=Def|Number=Plur|Person=2|PronType=Prs",
65
+ "ACOND_PPERS__Definite=Def|Number=Plur|Person=3|PronType=Prs",
66
+ "ACOND_PPERS__Definite=Def|Number=Sing|Person=1|PronType=Prs",
67
+ "ACONJ",
68
+ "ACONJ_PPERS",
69
+ "ACONJ_PPERS__Definite=Def|Number=Sing|Person=1|PronType=Prs",
70
+ "ADV",
71
+ "ADV__Foreign=Yes",
72
+ "AFUTCONJ",
73
+ "AJUS",
74
+ "ALIM",
75
+ "ANEGAOR__Polarity=Neg",
76
+ "ANEGJUS__Polarity=Neg",
77
+ "ANEGOPT__Polarity=Neg",
78
+ "ANEGPST_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|Polarity=Neg|PronType=Prs",
79
+ "ANEGPST__Polarity=Neg",
80
+ "ANY__Polarity=Neg",
81
+ "AOPT",
82
+ "AOPT_PPERS",
83
+ "AOPT_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
84
+ "AOPT_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
85
+ "AOPT_PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
86
+ "AOPT_PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
87
+ "AOPT_PPERS__Definite=Def|Number=Plur|Person=2|PronType=Prs",
88
+ "AOPT_PPERS__Definite=Def|Number=Plur|Person=3|PronType=Prs",
89
+ "AOPT_PPERS__Definite=Def|Number=Sing|Person=1|PronType=Prs",
90
+ "APREC",
91
+ "APST",
92
+ "APST_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
93
+ "ART",
94
+ "ART__Definite=Def|Gender=Fem|Number=Sing|PronType=Art",
95
+ "ART__Definite=Def|Gender=Masc|Number=Sing|PronType=Art",
96
+ "ART__Definite=Def|Number=Plur|PronType=Art",
97
+ "ART__Definite=Ind|Number=Sing|PronType=Art",
98
+ "ART__PronType=Art",
99
+ "CCIRC",
100
+ "CCIRC_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
101
+ "CCIRC_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
102
+ "CFOC",
103
+ "CFOC_PPERS",
104
+ "CFOC_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
105
+ "CONJ",
106
+ "CONJ__Foreign=Yes",
107
+ "CONJ__Foreign=Yes|Polarity=Neg",
108
+ "COP__Gender=Fem|Number=Sing",
109
+ "COP__Gender=Masc|Number=Sing",
110
+ "COP__Number=Plur",
111
+ "CPRET",
112
+ "CPRET_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
113
+ "CREL",
114
+ "CREL_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
115
+ "EXIST",
116
+ "EXIST__Foreign=Yes",
117
+ "EXIST__Polarity=Neg",
118
+ "FM",
119
+ "FM__Foreign=Yes",
120
+ "FM__Foreign=Yes|Polarity=Neg",
121
+ "FM__Polarity=Neg",
122
+ "FUT",
123
+ "IMOD",
124
+ "IMOD_PPERO__Definite=Def|Number=Sing|Person=1|PronType=Prs",
125
+ "IMOD__Definite=Def|PronType=Prs|Reflex=Yes",
126
+ "IMOD__PronType=Tot",
127
+ "N",
128
+ "NEG__Foreign=Yes|Polarity=Neg",
129
+ "NEG__Polarity=Neg",
130
+ "NPROP",
131
+ "NPROP__Foreign=Yes",
132
+ "NUM__Foreign=Yes|NumType=Card",
133
+ "NUM__NumType=Card",
134
+ "N_PPERO__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
135
+ "N_PPERO__Definite=Def|Number=Sing|Person=1|PronType=Prs",
136
+ "N__Foreign=Yes",
137
+ "N__PronType=Rcp",
138
+ "PDEM",
139
+ "PDEM__Definite=Def|Foreign=Yes|Number=Plur|PronType=Dem",
140
+ "PDEM__Definite=Def|Gender=Fem|Number=Sing|PronType=Dem",
141
+ "PDEM__Definite=Def|Gender=Masc|Number=Sing|PronType=Dem",
142
+ "PDEM__Definite=Def|Number=Plur|PronType=Dem",
143
+ "PINT__PronType=Ind",
144
+ "PINT__PronType=Int",
145
+ "PPERI__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
146
+ "PPERI__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
147
+ "PPERI__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
148
+ "PPERI__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
149
+ "PPERI__Definite=Def|Number=Plur|Person=1|PronType=Prs",
150
+ "PPERI__Definite=Def|Number=Plur|Person=2|PronType=Prs",
151
+ "PPERI__Definite=Def|Number=Plur|Person=3|PronType=Prs",
152
+ "PPERI__Definite=Def|Number=Sing|Person=1|PronType=Prs",
153
+ "PPERO",
154
+ "PPERO__Definite=Def|Foreign=Yes|Number=Plur|Person=3|PronType=Prs",
155
+ "PPERO__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
156
+ "PPERO__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
157
+ "PPERO__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
158
+ "PPERO__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
159
+ "PPERO__Definite=Def|Number=Plur|Person=1|PronType=Prs",
160
+ "PPERO__Definite=Def|Number=Plur|Person=2|PronType=Prs",
161
+ "PPERO__Definite=Def|Number=Plur|Person=3|PronType=Prs",
162
+ "PPERO__Definite=Def|Number=Sing|Person=1|PronType=Prs",
163
+ "PPERO__Definite=Def|Poss=Yes|PronType=Prs",
164
+ "PPERS",
165
+ "PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
166
+ "PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
167
+ "PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
168
+ "PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
169
+ "PPERS__Definite=Def|Number=Plur|Person=1|PronType=Prs",
170
+ "PPERS__Definite=Def|Number=Plur|Person=2|PronType=Prs",
171
+ "PPERS__Definite=Def|Number=Plur|Person=3|PronType=Prs",
172
+ "PPERS__Definite=Def|Number=Sing|Person=1|PronType=Prs",
173
+ "PPOS",
174
+ "PPOS__Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
175
+ "PPOS__Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
176
+ "PPOS__Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
177
+ "PPOS__Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
178
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
179
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
180
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
181
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
182
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Poss=Yes|PronType=Prs",
183
+ "PPOS__Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
184
+ "PPOS__Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
185
+ "PPOS__Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
186
+ "PPOS__Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
187
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
188
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
189
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
190
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
191
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Poss=Yes|PronType=Prs",
192
+ "PPOS__Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
193
+ "PPOS__Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
194
+ "PPOS__Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
195
+ "PPOS__Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
196
+ "PPOS__Definite=Def|Number=Plur|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
197
+ "PPOS__Definite=Def|Number=Plur|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
198
+ "PPOS__Definite=Def|Number=Plur|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
199
+ "PPOS__Definite=Def|Number=Plur|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
200
+ "PPOS__Definite=Def|Number=Plur|Poss=Yes|PronType=Prs",
201
+ "PREP",
202
+ "PREP_PPERO",
203
+ "PREP_PPERO__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
204
+ "PREP_PPERO__Definite=Def|Number=Sing|Person=1|PronType=Prs",
205
+ "PREP__Foreign=Yes",
206
+ "PTC",
207
+ "PTC__Foreign=Yes",
208
+ "PTC__Polarity=Neg",
209
+ "PUNCT",
210
+ "UNKNOWN",
211
+ "UNKNOWN__Foreign=Yes",
212
+ "VBD__VerbForm=Fin",
213
+ "VIMP__Foreign=Yes|VerbForm=Fin",
214
+ "VIMP__VerbForm=Fin",
215
+ "VSTAT__VerbForm=Fin",
216
+ "V_PPERO__VerbForm=Fin",
217
+ "V__Foreign=Yes|VerbForm=Fin",
218
+ "V__Foreign=Yes|VerbForm=Inf",
219
+ "V__VerbForm=Fin",
220
+ "V__VerbForm=Inf"
221
+ ],
222
+ "morphologizer":[
223
+ "POS=AUX",
224
+ "Definite=Def|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs",
225
+ "POS=VERB|VerbForm=Fin",
226
+ "POS=ADP",
227
+ "POS=PUNCT",
228
+ "Foreign=Yes|POS=PART",
229
+ "POS=PART",
230
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Art",
231
+ "Foreign=Yes|POS=NOUN",
232
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Art",
233
+ "POS=NOUN",
234
+ "POS=CCONJ",
235
+ "POS=SCONJ",
236
+ "POS=ADV",
237
+ "POS=VERB",
238
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs",
239
+ "Definite=Def|Number=Sing|POS=PRON|Person=1|PronType=Prs",
240
+ "Definite=Def|Gender=Masc|Number=Sing|POS=PRON|Person=2|PronType=Prs",
241
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs",
242
+ "POS=PRON|PronType=Int",
243
+ "POS=AUX|Polarity=Neg",
244
+ "Definite=Def|Number=Plur|POS=PRON|Person=3|PronType=Prs",
245
+ "Foreign=Yes|POS=CCONJ",
246
+ "Definite=Def|Number=Plur|POS=PRON|Person=1|PronType=Prs",
247
+ "Foreign=Yes|POS=VERB|VerbForm=Fin",
248
+ "Foreign=Yes|POS=PROPN",
249
+ "Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
250
+ "POS=VERB|Polarity=Neg",
251
+ "Gender=Masc|Number=Sing|POS=PRON",
252
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs",
253
+ "POS=NOUN|PronType=Rcp",
254
+ "Definite=Def|Number=Plur|POS=DET|PronType=Art",
255
+ "POS=ADV|PronType=Tot",
256
+ "Definite=Def|POS=PRON|Poss=Yes|PronType=Prs",
257
+ "Definite=Ind|Number=Sing|POS=DET|PronType=Art",
258
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs",
259
+ "POS=PROPN",
260
+ "Definite=Def|Number=Plur|POS=PRON|Person=2|PronType=Prs",
261
+ "Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
262
+ "POS=ADV|Polarity=Neg",
263
+ "Definite=Def|Number=Plur|POS=DET|PronType=Dem",
264
+ "POS=PRON|PronType=Ind",
265
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Dem",
266
+ "Definite=Def|Number=Plur|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs",
267
+ "Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
268
+ "Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
269
+ "POS=VERB|VerbForm=Inf",
270
+ "Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
271
+ "Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
272
+ "NumType=Card|POS=NUM",
273
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs",
274
+ "Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
275
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs",
276
+ "Definite=Def|POS=ADV|PronType=Prs|Reflex=Yes",
277
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs",
278
+ "POS=AUX|VerbForm=Fin",
279
+ "Foreign=Yes|POS=ADV",
280
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Dem",
281
+ "POS=DET|PronType=Art",
282
+ "Foreign=Yes|POS=ADP",
283
+ "Number=Plur|POS=PRON",
284
+ "Foreign=Yes|POS=SCONJ",
285
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|Poss=Yes|PronType=Prs",
286
+ "Gender=Fem|Number=Sing|POS=PRON",
287
+ "POS=X",
288
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs",
289
+ "Foreign=Yes|POS=CCONJ|Polarity=Neg",
290
+ "Foreign=Yes|POS=VERB|VerbForm=Inf",
291
+ "Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
292
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=2|PronType=Prs",
293
+ "POS=ADJ",
294
+ "POS=DET",
295
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs",
296
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs",
297
+ "POS=PRON",
298
+ "Foreign=Yes|POS=ADV|Polarity=Neg",
299
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs",
300
+ "Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
301
+ "Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
302
+ "POS=PRON|VerbForm=Fin",
303
+ "Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
304
+ "Foreign=Yes|POS=X",
305
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs",
306
+ "Definite=Def|Number=Plur|POS=DET|Poss=Yes|PronType=Prs",
307
+ "Definite=Def|Foreign=Yes|Number=Plur|POS=PRON|Person=3|PronType=Prs",
308
+ "Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
309
+ "POS=X|Polarity=Neg",
310
+ "POS=ADV|PronType=Int",
311
+ "Definite=Def|Foreign=Yes|Number=Plur|POS=DET|PronType=Dem",
312
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=2|Polarity=Neg|PronType=Prs",
313
+ "Foreign=Yes|POS=AUX",
314
+ "POS=PART|Polarity=Neg",
315
+ "Foreign=Yes|NumType=Card|POS=NUM",
316
+ "Foreign=Yes|POS=X|Polarity=Neg",
317
+ "Foreign=Yes|POS=SCONJ|Polarity=Neg",
318
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|Poss=Yes|PronType=Prs",
319
+ "Foreign=Yes|POS=ADJ"
320
+ ]
321
+ },
322
+ "pipeline":[
323
+ "transformer",
324
+ "parser",
325
+ "trainable_lemmatizer",
326
+ "tagger",
327
+ "morphologizer"
328
+ ],
329
+ "components":[
330
+ "transformer",
331
+ "parser",
332
+ "trainable_lemmatizer",
333
+ "tagger",
334
+ "morphologizer"
335
+ ],
336
+ "disabled":[
337
+
338
+ ],
339
+ "performance":{
340
+ "dep_uas":0.0240105541,
341
+ "dep_las":0.0216358839,
342
+ "dep_las_per_type":{
343
+ "cc":{
344
+ "p":0.8260869565,
345
+ "r":0.1104651163,
346
+ "f":0.1948717949
347
+ },
348
+ "mark":{
349
+ "p":0.75,
350
+ "r":0.0069444444,
351
+ "f":0.0137614679
352
+ },
353
+ "nsubj":{
354
+ "p":0.0,
355
+ "r":0.0,
356
+ "f":0.0
357
+ },
358
+ "root":{
359
+ "p":0.2666666667,
360
+ "r":0.1111111111,
361
+ "f":0.1568627451
362
+ },
363
+ "case":{
364
+ "p":1.0,
365
+ "r":0.0012886598,
366
+ "f":0.0025740026
367
+ },
368
+ "obl":{
369
+ "p":0.0,
370
+ "r":0.0,
371
+ "f":0.0
372
+ },
373
+ "acl:relcl":{
374
+ "p":0.0,
375
+ "r":0.0,
376
+ "f":0.0
377
+ },
378
+ "det":{
379
+ "p":0.0,
380
+ "r":0.0,
381
+ "f":0.0
382
+ },
383
+ "aux":{
384
+ "p":0.0,
385
+ "r":0.0,
386
+ "f":0.0
387
+ },
388
+ "dislocated":{
389
+ "p":0.0,
390
+ "r":0.0,
391
+ "f":0.0
392
+ },
393
+ "advmod":{
394
+ "p":0.59375,
395
+ "r":0.0678571429,
396
+ "f":0.1217948718
397
+ },
398
+ "advcl":{
399
+ "p":0.0,
400
+ "r":0.0,
401
+ "f":0.0
402
+ },
403
+ "obj":{
404
+ "p":0.0,
405
+ "r":0.0,
406
+ "f":0.0
407
+ },
408
+ "ccomp":{
409
+ "p":0.0,
410
+ "r":0.0,
411
+ "f":0.0
412
+ },
413
+ "parataxis":{
414
+ "p":0.3333333333,
415
+ "r":0.0138888889,
416
+ "f":0.0266666667
417
+ },
418
+ "nmod":{
419
+ "p":0.0,
420
+ "r":0.0,
421
+ "f":0.0
422
+ },
423
+ "cop":{
424
+ "p":0.4736842105,
425
+ "r":0.1730769231,
426
+ "f":0.2535211268
427
+ },
428
+ "appos":{
429
+ "p":0.0,
430
+ "r":0.0,
431
+ "f":0.0
432
+ },
433
+ "conj":{
434
+ "p":0.5714285714,
435
+ "r":0.0291970803,
436
+ "f":0.0555555556
437
+ },
438
+ "fixed":{
439
+ "p":0.0,
440
+ "r":0.0,
441
+ "f":0.0
442
+ },
443
+ "xcomp":{
444
+ "p":0.0,
445
+ "r":0.0,
446
+ "f":0.0
447
+ },
448
+ "csubj":{
449
+ "p":0.0,
450
+ "r":0.0,
451
+ "f":0.0
452
+ },
453
+ "iobj":{
454
+ "p":0.0,
455
+ "r":0.0,
456
+ "f":0.0
457
+ },
458
+ "vocative":{
459
+ "p":0.0,
460
+ "r":0.0,
461
+ "f":0.0
462
+ },
463
+ "reparandum":{
464
+ "p":0.0,
465
+ "r":0.0,
466
+ "f":0.0
467
+ },
468
+ "discourse":{
469
+ "p":0.0,
470
+ "r":0.0,
471
+ "f":0.0
472
+ },
473
+ "amod":{
474
+ "p":0.0,
475
+ "r":0.0,
476
+ "f":0.0
477
+ },
478
+ "nummod":{
479
+ "p":0.0,
480
+ "r":0.0,
481
+ "f":0.0
482
+ },
483
+ "orphan":{
484
+ "p":0.0,
485
+ "r":0.0,
486
+ "f":0.0
487
+ },
488
+ "flat":{
489
+ "p":0.6666666667,
490
+ "r":0.4,
491
+ "f":0.5
492
+ },
493
+ "obl:npmod":{
494
+ "p":0.0,
495
+ "r":0.0,
496
+ "f":0.0
497
+ },
498
+ "acl":{
499
+ "p":0.0,
500
+ "r":0.0,
501
+ "f":0.0
502
+ }
503
+ },
504
+ "sents_p":0.899122807,
505
+ "sents_r":0.9490740741,
506
+ "sents_f":0.9234234234,
507
+ "lemma_acc":0.2949879227,
508
+ "tag_acc":0.2871376812,
509
+ "pos_acc":0.2895531401,
510
+ "morph_acc":0.2904589372,
511
+ "morph_per_feat":{
512
+ "Foreign":{
513
+ "p":0.9748743719,
514
+ "r":0.4041666667,
515
+ "f":0.5714285714
516
+ },
517
+ "Definite":{
518
+ "p":1.0,
519
+ "r":0.029318037,
520
+ "f":0.0569659443
521
+ },
522
+ "Gender":{
523
+ "p":1.0,
524
+ "r":0.0541666667,
525
+ "f":0.1027667984
526
+ },
527
+ "Number":{
528
+ "p":1.0,
529
+ "r":0.053030303,
530
+ "f":0.1007194245
531
+ },
532
+ "Person":{
533
+ "p":1.0,
534
+ "r":0.0326659642,
535
+ "f":0.0632653061
536
+ },
537
+ "PronType":{
538
+ "p":0.9444444444,
539
+ "r":0.0417947142,
540
+ "f":0.0800470865
541
+ },
542
+ "VerbForm":{
543
+ "p":0.9166666667,
544
+ "r":0.0995475113,
545
+ "f":0.1795918367
546
+ },
547
+ "Polarity":{
548
+ "p":1.0,
549
+ "r":0.3653846154,
550
+ "f":0.5352112676
551
+ },
552
+ "Gender[psor]":{
553
+ "p":0.0,
554
+ "r":0.0,
555
+ "f":0.0
556
+ },
557
+ "Number[psor]":{
558
+ "p":0.0,
559
+ "r":0.0,
560
+ "f":0.0
561
+ },
562
+ "Poss":{
563
+ "p":0.0,
564
+ "r":0.0,
565
+ "f":0.0
566
+ },
567
+ "NumType":{
568
+ "p":1.0,
569
+ "r":0.0666666667,
570
+ "f":0.125
571
+ },
572
+ "Reflex":{
573
+ "p":0.0,
574
+ "r":0.0,
575
+ "f":0.0
576
+ }
577
+ },
578
+ "transformer_loss":507.0488317468,
579
+ "parser_loss":365.5788776817,
580
+ "trainable_lemmatizer_loss":56.2071772462,
581
+ "tagger_loss":53.8643523407,
582
+ "morphologizer_loss":42.6978774554
583
+ },
584
+ "requirements":[
585
+ "spacy-transformers>=1.3.4,<1.4.0"
586
+ ]
587
+ }
morphologizer/cfg ADDED
@@ -0,0 +1,203 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "extend":false,
3
+ "label_smoothing":0.0,
4
+ "labels_morph":{
5
+ "POS=AUX":"",
6
+ "Definite=Def|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
7
+ "POS=VERB|VerbForm=Fin":"VerbForm=Fin",
8
+ "POS=ADP":"",
9
+ "POS=PUNCT":"",
10
+ "Foreign=Yes|POS=PART":"Foreign=Yes",
11
+ "POS=PART":"",
12
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Art":"Definite=Def|Gender=Masc|Number=Sing|PronType=Art",
13
+ "Foreign=Yes|POS=NOUN":"Foreign=Yes",
14
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Art":"Definite=Def|Gender=Fem|Number=Sing|PronType=Art",
15
+ "POS=NOUN":"",
16
+ "POS=CCONJ":"",
17
+ "POS=SCONJ":"",
18
+ "POS=ADV":"",
19
+ "POS=VERB":"",
20
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
21
+ "Definite=Def|Number=Sing|POS=PRON|Person=1|PronType=Prs":"Definite=Def|Number=Sing|Person=1|PronType=Prs",
22
+ "Definite=Def|Gender=Masc|Number=Sing|POS=PRON|Person=2|PronType=Prs":"Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
23
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
24
+ "POS=PRON|PronType=Int":"PronType=Int",
25
+ "POS=AUX|Polarity=Neg":"Polarity=Neg",
26
+ "Definite=Def|Number=Plur|POS=PRON|Person=3|PronType=Prs":"Definite=Def|Number=Plur|Person=3|PronType=Prs",
27
+ "Foreign=Yes|POS=CCONJ":"Foreign=Yes",
28
+ "Definite=Def|Number=Plur|POS=PRON|Person=1|PronType=Prs":"Definite=Def|Number=Plur|Person=1|PronType=Prs",
29
+ "Foreign=Yes|POS=VERB|VerbForm=Fin":"Foreign=Yes|VerbForm=Fin",
30
+ "Foreign=Yes|POS=PROPN":"Foreign=Yes",
31
+ "Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
32
+ "POS=VERB|Polarity=Neg":"Polarity=Neg",
33
+ "Gender=Masc|Number=Sing|POS=PRON":"Gender=Masc|Number=Sing",
34
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Number=Plur|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
35
+ "POS=NOUN|PronType=Rcp":"PronType=Rcp",
36
+ "Definite=Def|Number=Plur|POS=DET|PronType=Art":"Definite=Def|Number=Plur|PronType=Art",
37
+ "POS=ADV|PronType=Tot":"PronType=Tot",
38
+ "Definite=Def|POS=PRON|Poss=Yes|PronType=Prs":"Definite=Def|Poss=Yes|PronType=Prs",
39
+ "Definite=Ind|Number=Sing|POS=DET|PronType=Art":"Definite=Ind|Number=Sing|PronType=Art",
40
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
41
+ "POS=PROPN":"",
42
+ "Definite=Def|Number=Plur|POS=PRON|Person=2|PronType=Prs":"Definite=Def|Number=Plur|Person=2|PronType=Prs",
43
+ "Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
44
+ "POS=ADV|Polarity=Neg":"Polarity=Neg",
45
+ "Definite=Def|Number=Plur|POS=DET|PronType=Dem":"Definite=Def|Number=Plur|PronType=Dem",
46
+ "POS=PRON|PronType=Ind":"PronType=Ind",
47
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Dem":"Definite=Def|Gender=Fem|Number=Sing|PronType=Dem",
48
+ "Definite=Def|Number=Plur|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Definite=Def|Number=Plur|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
49
+ "Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
50
+ "Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
51
+ "POS=VERB|VerbForm=Inf":"VerbForm=Inf",
52
+ "Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
53
+ "Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
54
+ "NumType=Card|POS=NUM":"NumType=Card",
55
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
56
+ "Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
57
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Definite=Def|Number=Plur|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
58
+ "Definite=Def|POS=ADV|PronType=Prs|Reflex=Yes":"Definite=Def|PronType=Prs|Reflex=Yes",
59
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
60
+ "POS=AUX|VerbForm=Fin":"VerbForm=Fin",
61
+ "Foreign=Yes|POS=ADV":"Foreign=Yes",
62
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Dem":"Definite=Def|Gender=Masc|Number=Sing|PronType=Dem",
63
+ "POS=DET|PronType=Art":"PronType=Art",
64
+ "Foreign=Yes|POS=ADP":"Foreign=Yes",
65
+ "Number=Plur|POS=PRON":"Number=Plur",
66
+ "Foreign=Yes|POS=SCONJ":"Foreign=Yes",
67
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Number=Sing|Poss=Yes|PronType=Prs",
68
+ "Gender=Fem|Number=Sing|POS=PRON":"Gender=Fem|Number=Sing",
69
+ "POS=X":"",
70
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Number=Plur|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
71
+ "Foreign=Yes|POS=CCONJ|Polarity=Neg":"Foreign=Yes|Polarity=Neg",
72
+ "Foreign=Yes|POS=VERB|VerbForm=Inf":"Foreign=Yes|VerbForm=Inf",
73
+ "Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
74
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=2|PronType=Prs":"Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
75
+ "POS=ADJ":"",
76
+ "POS=DET":"",
77
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
78
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
79
+ "POS=PRON":"",
80
+ "Foreign=Yes|POS=ADV|Polarity=Neg":"Foreign=Yes|Polarity=Neg",
81
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
82
+ "Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
83
+ "Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
84
+ "POS=PRON|VerbForm=Fin":"VerbForm=Fin",
85
+ "Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
86
+ "Foreign=Yes|POS=X":"Foreign=Yes",
87
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
88
+ "Definite=Def|Number=Plur|POS=DET|Poss=Yes|PronType=Prs":"Definite=Def|Number=Plur|Poss=Yes|PronType=Prs",
89
+ "Definite=Def|Foreign=Yes|Number=Plur|POS=PRON|Person=3|PronType=Prs":"Definite=Def|Foreign=Yes|Number=Plur|Person=3|PronType=Prs",
90
+ "Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
91
+ "POS=X|Polarity=Neg":"Polarity=Neg",
92
+ "POS=ADV|PronType=Int":"PronType=Int",
93
+ "Definite=Def|Foreign=Yes|Number=Plur|POS=DET|PronType=Dem":"Definite=Def|Foreign=Yes|Number=Plur|PronType=Dem",
94
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=2|Polarity=Neg|PronType=Prs":"Definite=Def|Gender=Fem|Number=Sing|Person=2|Polarity=Neg|PronType=Prs",
95
+ "Foreign=Yes|POS=AUX":"Foreign=Yes",
96
+ "POS=PART|Polarity=Neg":"Polarity=Neg",
97
+ "Foreign=Yes|NumType=Card|POS=NUM":"Foreign=Yes|NumType=Card",
98
+ "Foreign=Yes|POS=X|Polarity=Neg":"Foreign=Yes|Polarity=Neg",
99
+ "Foreign=Yes|POS=SCONJ|Polarity=Neg":"Foreign=Yes|Polarity=Neg",
100
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|Poss=Yes|PronType=Prs":"Definite=Def|Gender=Fem|Number=Sing|Poss=Yes|PronType=Prs",
101
+ "Foreign=Yes|POS=ADJ":"Foreign=Yes"
102
+ },
103
+ "labels_pos":{
104
+ "POS=AUX":87,
105
+ "Definite=Def|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
106
+ "POS=VERB|VerbForm=Fin":100,
107
+ "POS=ADP":85,
108
+ "POS=PUNCT":97,
109
+ "Foreign=Yes|POS=PART":94,
110
+ "POS=PART":94,
111
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Art":90,
112
+ "Foreign=Yes|POS=NOUN":92,
113
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Art":90,
114
+ "POS=NOUN":92,
115
+ "POS=CCONJ":89,
116
+ "POS=SCONJ":98,
117
+ "POS=ADV":86,
118
+ "POS=VERB":100,
119
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
120
+ "Definite=Def|Number=Sing|POS=PRON|Person=1|PronType=Prs":95,
121
+ "Definite=Def|Gender=Masc|Number=Sing|POS=PRON|Person=2|PronType=Prs":95,
122
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
123
+ "POS=PRON|PronType=Int":95,
124
+ "POS=AUX|Polarity=Neg":87,
125
+ "Definite=Def|Number=Plur|POS=PRON|Person=3|PronType=Prs":95,
126
+ "Foreign=Yes|POS=CCONJ":89,
127
+ "Definite=Def|Number=Plur|POS=PRON|Person=1|PronType=Prs":95,
128
+ "Foreign=Yes|POS=VERB|VerbForm=Fin":100,
129
+ "Foreign=Yes|POS=PROPN":96,
130
+ "Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
131
+ "POS=VERB|Polarity=Neg":100,
132
+ "Gender=Masc|Number=Sing|POS=PRON":95,
133
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
134
+ "POS=NOUN|PronType=Rcp":92,
135
+ "Definite=Def|Number=Plur|POS=DET|PronType=Art":90,
136
+ "POS=ADV|PronType=Tot":86,
137
+ "Definite=Def|POS=PRON|Poss=Yes|PronType=Prs":95,
138
+ "Definite=Ind|Number=Sing|POS=DET|PronType=Art":90,
139
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
140
+ "POS=PROPN":96,
141
+ "Definite=Def|Number=Plur|POS=PRON|Person=2|PronType=Prs":95,
142
+ "Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
143
+ "POS=ADV|Polarity=Neg":86,
144
+ "Definite=Def|Number=Plur|POS=DET|PronType=Dem":90,
145
+ "POS=PRON|PronType=Ind":95,
146
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Dem":90,
147
+ "Definite=Def|Number=Plur|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
148
+ "Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
149
+ "Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
150
+ "POS=VERB|VerbForm=Inf":100,
151
+ "Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
152
+ "Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
153
+ "NumType=Card|POS=NUM":93,
154
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
155
+ "Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
156
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
157
+ "Definite=Def|POS=ADV|PronType=Prs|Reflex=Yes":86,
158
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
159
+ "POS=AUX|VerbForm=Fin":87,
160
+ "Foreign=Yes|POS=ADV":86,
161
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Dem":90,
162
+ "POS=DET|PronType=Art":90,
163
+ "Foreign=Yes|POS=ADP":85,
164
+ "Number=Plur|POS=PRON":95,
165
+ "Foreign=Yes|POS=SCONJ":98,
166
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|Poss=Yes|PronType=Prs":90,
167
+ "Gender=Fem|Number=Sing|POS=PRON":95,
168
+ "POS=X":101,
169
+ "Definite=Def|Number=Plur|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
170
+ "Foreign=Yes|POS=CCONJ|Polarity=Neg":89,
171
+ "Foreign=Yes|POS=VERB|VerbForm=Inf":100,
172
+ "Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
173
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=2|PronType=Prs":95,
174
+ "POS=ADJ":84,
175
+ "POS=DET":90,
176
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
177
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
178
+ "POS=PRON":95,
179
+ "Foreign=Yes|POS=ADV|Polarity=Neg":86,
180
+ "Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
181
+ "Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
182
+ "Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
183
+ "POS=PRON|VerbForm=Fin":95,
184
+ "Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
185
+ "Foreign=Yes|POS=X":101,
186
+ "Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
187
+ "Definite=Def|Number=Plur|POS=DET|Poss=Yes|PronType=Prs":90,
188
+ "Definite=Def|Foreign=Yes|Number=Plur|POS=PRON|Person=3|PronType=Prs":95,
189
+ "Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
190
+ "POS=X|Polarity=Neg":101,
191
+ "POS=ADV|PronType=Int":86,
192
+ "Definite=Def|Foreign=Yes|Number=Plur|POS=DET|PronType=Dem":90,
193
+ "Definite=Def|Gender=Fem|Number=Sing|POS=PRON|Person=2|Polarity=Neg|PronType=Prs":95,
194
+ "Foreign=Yes|POS=AUX":87,
195
+ "POS=PART|Polarity=Neg":94,
196
+ "Foreign=Yes|NumType=Card|POS=NUM":93,
197
+ "Foreign=Yes|POS=X|Polarity=Neg":101,
198
+ "Foreign=Yes|POS=SCONJ|Polarity=Neg":98,
199
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|Poss=Yes|PronType=Prs":90,
200
+ "Foreign=Yes|POS=ADJ":84
201
+ },
202
+ "overwrite":true
203
+ }
morphologizer/model ADDED
Binary file (299 kB). View file
 
parser/cfg ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "moves":null,
3
+ "update_with_oracle_cut_size":100,
4
+ "multitasks":[
5
+
6
+ ],
7
+ "min_action_freq":30,
8
+ "learn_tokens":false,
9
+ "beam_width":1,
10
+ "beam_density":0.0,
11
+ "beam_update_prob":0.0,
12
+ "incorrect_spans_key":null
13
+ }
parser/model ADDED
Binary file (903 kB). View file
 
parser/moves ADDED
@@ -0,0 +1 @@
 
 
1
+ ��moves�{"0":{"":25539},"1":{"":17115},"2":{"case":6409,"det":5028,"nsubj":3824,"mark":3159,"aux":2722,"cc":1233,"advmod":884,"punct":842,"dislocated":478,"advcl":309,"obl":180,"nummod":76,"vocative":51,"discourse":51,"dep":0},"3":{"obl":3420,"obj":2046,"punct":1929,"nmod":1427,"advmod":1336,"acl:relcl":1051,"conj":949,"advcl":863,"ccomp":575,"parataxis":534,"nsubj":454,"xcomp":444,"det":439,"cop":381,"appos":310,"fixed":236,"dislocated":194,"csubj":103,"vocative":79,"iobj":57,"obl:npmod":52,"flat":40,"dep":0},"4":{"ROOT":1730}}�cfg��neg_key�
tagger/cfg ADDED
@@ -0,0 +1,173 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "label_smoothing":0.0,
3
+ "labels":[
4
+ "AAOR",
5
+ "ACAUS",
6
+ "ACOND",
7
+ "ACOND_PPERS",
8
+ "ACOND_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
9
+ "ACOND_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
10
+ "ACOND_PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
11
+ "ACOND_PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
12
+ "ACOND_PPERS__Definite=Def|Number=Plur|Person=1|PronType=Prs",
13
+ "ACOND_PPERS__Definite=Def|Number=Plur|Person=2|PronType=Prs",
14
+ "ACOND_PPERS__Definite=Def|Number=Plur|Person=3|PronType=Prs",
15
+ "ACOND_PPERS__Definite=Def|Number=Sing|Person=1|PronType=Prs",
16
+ "ACONJ",
17
+ "ACONJ_PPERS",
18
+ "ACONJ_PPERS__Definite=Def|Number=Sing|Person=1|PronType=Prs",
19
+ "ADV",
20
+ "ADV__Foreign=Yes",
21
+ "AFUTCONJ",
22
+ "AJUS",
23
+ "ALIM",
24
+ "ANEGAOR__Polarity=Neg",
25
+ "ANEGJUS__Polarity=Neg",
26
+ "ANEGOPT__Polarity=Neg",
27
+ "ANEGPST_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|Polarity=Neg|PronType=Prs",
28
+ "ANEGPST__Polarity=Neg",
29
+ "ANY__Polarity=Neg",
30
+ "AOPT",
31
+ "AOPT_PPERS",
32
+ "AOPT_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
33
+ "AOPT_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
34
+ "AOPT_PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
35
+ "AOPT_PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
36
+ "AOPT_PPERS__Definite=Def|Number=Plur|Person=2|PronType=Prs",
37
+ "AOPT_PPERS__Definite=Def|Number=Plur|Person=3|PronType=Prs",
38
+ "AOPT_PPERS__Definite=Def|Number=Sing|Person=1|PronType=Prs",
39
+ "APREC",
40
+ "APST",
41
+ "APST_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
42
+ "ART",
43
+ "ART__Definite=Def|Gender=Fem|Number=Sing|PronType=Art",
44
+ "ART__Definite=Def|Gender=Masc|Number=Sing|PronType=Art",
45
+ "ART__Definite=Def|Number=Plur|PronType=Art",
46
+ "ART__Definite=Ind|Number=Sing|PronType=Art",
47
+ "ART__PronType=Art",
48
+ "CCIRC",
49
+ "CCIRC_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
50
+ "CCIRC_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
51
+ "CFOC",
52
+ "CFOC_PPERS",
53
+ "CFOC_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
54
+ "CONJ",
55
+ "CONJ__Foreign=Yes",
56
+ "CONJ__Foreign=Yes|Polarity=Neg",
57
+ "COP__Gender=Fem|Number=Sing",
58
+ "COP__Gender=Masc|Number=Sing",
59
+ "COP__Number=Plur",
60
+ "CPRET",
61
+ "CPRET_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
62
+ "CREL",
63
+ "CREL_PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
64
+ "EXIST",
65
+ "EXIST__Foreign=Yes",
66
+ "EXIST__Polarity=Neg",
67
+ "FM",
68
+ "FM__Foreign=Yes",
69
+ "FM__Foreign=Yes|Polarity=Neg",
70
+ "FM__Polarity=Neg",
71
+ "FUT",
72
+ "IMOD",
73
+ "IMOD_PPERO__Definite=Def|Number=Sing|Person=1|PronType=Prs",
74
+ "IMOD__Definite=Def|PronType=Prs|Reflex=Yes",
75
+ "IMOD__PronType=Tot",
76
+ "N",
77
+ "NEG__Foreign=Yes|Polarity=Neg",
78
+ "NEG__Polarity=Neg",
79
+ "NPROP",
80
+ "NPROP__Foreign=Yes",
81
+ "NUM__Foreign=Yes|NumType=Card",
82
+ "NUM__NumType=Card",
83
+ "N_PPERO__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
84
+ "N_PPERO__Definite=Def|Number=Sing|Person=1|PronType=Prs",
85
+ "N__Foreign=Yes",
86
+ "N__PronType=Rcp",
87
+ "PDEM",
88
+ "PDEM__Definite=Def|Foreign=Yes|Number=Plur|PronType=Dem",
89
+ "PDEM__Definite=Def|Gender=Fem|Number=Sing|PronType=Dem",
90
+ "PDEM__Definite=Def|Gender=Masc|Number=Sing|PronType=Dem",
91
+ "PDEM__Definite=Def|Number=Plur|PronType=Dem",
92
+ "PINT__PronType=Ind",
93
+ "PINT__PronType=Int",
94
+ "PPERI__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
95
+ "PPERI__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
96
+ "PPERI__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
97
+ "PPERI__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
98
+ "PPERI__Definite=Def|Number=Plur|Person=1|PronType=Prs",
99
+ "PPERI__Definite=Def|Number=Plur|Person=2|PronType=Prs",
100
+ "PPERI__Definite=Def|Number=Plur|Person=3|PronType=Prs",
101
+ "PPERI__Definite=Def|Number=Sing|Person=1|PronType=Prs",
102
+ "PPERO",
103
+ "PPERO__Definite=Def|Foreign=Yes|Number=Plur|Person=3|PronType=Prs",
104
+ "PPERO__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
105
+ "PPERO__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
106
+ "PPERO__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
107
+ "PPERO__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
108
+ "PPERO__Definite=Def|Number=Plur|Person=1|PronType=Prs",
109
+ "PPERO__Definite=Def|Number=Plur|Person=2|PronType=Prs",
110
+ "PPERO__Definite=Def|Number=Plur|Person=3|PronType=Prs",
111
+ "PPERO__Definite=Def|Number=Sing|Person=1|PronType=Prs",
112
+ "PPERO__Definite=Def|Poss=Yes|PronType=Prs",
113
+ "PPERS",
114
+ "PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
115
+ "PPERS__Definite=Def|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
116
+ "PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=2|PronType=Prs",
117
+ "PPERS__Definite=Def|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
118
+ "PPERS__Definite=Def|Number=Plur|Person=1|PronType=Prs",
119
+ "PPERS__Definite=Def|Number=Plur|Person=2|PronType=Prs",
120
+ "PPERS__Definite=Def|Number=Plur|Person=3|PronType=Prs",
121
+ "PPERS__Definite=Def|Number=Sing|Person=1|PronType=Prs",
122
+ "PPOS",
123
+ "PPOS__Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
124
+ "PPOS__Definite=Def|Gender=Fem|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
125
+ "PPOS__Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
126
+ "PPOS__Definite=Def|Gender=Fem|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
127
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
128
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
129
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
130
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
131
+ "PPOS__Definite=Def|Gender=Fem|Number=Sing|Poss=Yes|PronType=Prs",
132
+ "PPOS__Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
133
+ "PPOS__Definite=Def|Gender=Masc|Gender[psor]=Fem|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
134
+ "PPOS__Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
135
+ "PPOS__Definite=Def|Gender=Masc|Gender[psor]=Masc|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
136
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
137
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
138
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
139
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
140
+ "PPOS__Definite=Def|Gender=Masc|Number=Sing|Poss=Yes|PronType=Prs",
141
+ "PPOS__Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
142
+ "PPOS__Definite=Def|Gender[psor]=Fem|Number=Plur|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
143
+ "PPOS__Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
144
+ "PPOS__Definite=Def|Gender[psor]=Masc|Number=Plur|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
145
+ "PPOS__Definite=Def|Number=Plur|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
146
+ "PPOS__Definite=Def|Number=Plur|Number[psor]=Plur|Person=2|Poss=Yes|PronType=Prs",
147
+ "PPOS__Definite=Def|Number=Plur|Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
148
+ "PPOS__Definite=Def|Number=Plur|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
149
+ "PPOS__Definite=Def|Number=Plur|Poss=Yes|PronType=Prs",
150
+ "PREP",
151
+ "PREP_PPERO",
152
+ "PREP_PPERO__Definite=Def|Gender=Fem|Number=Sing|Person=2|PronType=Prs",
153
+ "PREP_PPERO__Definite=Def|Number=Sing|Person=1|PronType=Prs",
154
+ "PREP__Foreign=Yes",
155
+ "PTC",
156
+ "PTC__Foreign=Yes",
157
+ "PTC__Polarity=Neg",
158
+ "PUNCT",
159
+ "UNKNOWN",
160
+ "UNKNOWN__Foreign=Yes",
161
+ "VBD__VerbForm=Fin",
162
+ "VIMP__Foreign=Yes|VerbForm=Fin",
163
+ "VIMP__VerbForm=Fin",
164
+ "VSTAT__VerbForm=Fin",
165
+ "V_PPERO__VerbForm=Fin",
166
+ "V__Foreign=Yes|VerbForm=Fin",
167
+ "V__Foreign=Yes|VerbForm=Inf",
168
+ "V__VerbForm=Fin",
169
+ "V__VerbForm=Inf"
170
+ ],
171
+ "neg_prefix":"!",
172
+ "overwrite":false
173
+ }
tagger/model ADDED
Binary file (511 kB). View file
 
tokenizer ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ ��prefix_search� �^''|^§|^%|^=|^\+[0-9]+%|^\'([0-9]){2}([\-]\'([0-9]){2})*|^\-([0-9]){1,9}\.([0-9]){1,9}|^\'([Α-Ωα-ωίϊΐόάέύϋΰήώ]+)\'|^([Α-Ωα-ωίϊΐόάέύϋΰήώ]){1,3}\'|^http://www.[A-Za-z]+\-[A-Za-z]+(\.[A-Za-z]+)+(\/[A-Za-z]+)*(\.[A-Za-z]+)*|^[ΈΆΊΑ-Ωα-ωίϊΐόάέύϋΰήώ]+\*|^\$([0-9])+([\,\.]([0-9])+){0,1}|^…|^……|^,|^:|^;|^\!|^\?|^¿|^؟|^¡|^\(|^\)|^\[|^\]|^\{|^\}|^<|^>|^_|^#|^\*|^&|^。|^?|^!|^,|^、|^;|^:|^~|^·|^।|^،|^۔|^؛|^٪|^\.\.+|^…|^\'|^"|^”|^“|^`|^‘|^´|^’|^‚|^,|^„|^»|^«|^「|^」|^『|^』|^(|^)|^〔|^〕|^【|^】|^《|^》|^〈|^〉|^〈|^〉|^⟦|^⟧|^\$|^£|^€|^¥|^฿|^US\$|^C\$|^A\$|^₽|^﷼|^₴|^₠|^₡|^₢|^₣|^₤|^₥|^₦|^₧|^₨|^₩|^₪|^₫|^€|^₭|^₮|^₯|^₰|^₱|^₲|^₳|^₴|^₵|^₶|^₷|^₸|^₹|^₺|^₻|^₼|^₽|^₾|^₿|^[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010A
C8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]�suffix_search�2�…$|……$|,$|:$|;$|\!$|\?$|¿$|؟$|¡$|\($|\)$|\[$|\]$|\{$|\}$|<$|>$|_$|#$|\*$|&$|。$|?$|!$|,$|、$|;$|:$|~$|·$|।$|،$|۔$|؛$|٪$|\.\.+$|…$|\'$|"$|”$|“$|`$|‘$|´$|’$|‚$|,$|„$|»$|«$|「$|」$|『$|』$|($|)$|〔$|〕$|【$|】$|《$|》$|〈$|〉$|〈$|〉$|⟦$|⟧$|[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25
B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]$|(?<=[0-9])\+$|([0-9])+\'$|([A-Za-z])?\'$|^([0-9]){1,2}\.$| ([0-9]){1,2}\.$|([0-9]){1}\) 
$|^([0-9]){1}\)$$|(?<=°[FfCcKk])\.$|([0-9])+\&$|(?<=[0-9])(?:\$|£|€|¥|฿|US\$|C\$|A\$|₽|﷼|₴|₠|₡|₢|₣|₤|₥|₦|₧|₨|₩|₪|₫|€|₭|₮|₯|₰|₱|₲|₳|₴|₵|₶|₷|₸|₹|₺|₻|₼|₽|₾|₿)$|(?<=[0-9])(?:km|km²|km³|m|m²|m³|dm|dm²|dm³|cm|cm²|cm³|mm|mm²|mm³|ha|µm|nm|yd|in|ft|kg|g|mg|µg|t|lb|oz|m/s|km/h|kmh|mph|hPa|Pa|mbar|mb|MB|kb|KB|gb|GB|tb|TB|T|G|M|K|км|км²|км³|м|м²|м³|дм|дм²|дм³|см|см²|см³|мм|мм²|мм³|нм|кг|г|мг|м/с|км/ч|кПа|Па|мбар|Кб|КБ|кб|Мб|МБ|мб|Гб|ГБ|гб|Тб|ТБ|тб)$|(?<=[0-9a-z\uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0146\u0148\u0149\u014B\u014D\u014F\u0151\u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\
u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώήύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F²\-\+(?:\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉〈〉⟦⟧)])\.$|(?<=[A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\
u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFD
F0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F][A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798
\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])\.$|(?<=[Α-Ωα-ωίϊΐόάέύϋΰήώ])\-$|(?<=[Α-Ωα-ωίϊΐόάέύϋΰήώ])\.$|^[Α-Ω]{1}\.$|\ 
[Α-Ω]{1}\.$|[ΈΆΊΑΌ-Ωα-ωίϊΐόάέύϋΰήώ]+([\-]([ΈΆΊΑΌ-Ωα-ωίϊΐόάέύϋΰήώ]+))+$|([0-9]+)mg$|([0-9]+)\.([0-9]+)m$�infix_finditer�?d\.\.+|…|[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1
AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]|(?<=[0-9])[+\/\-\*^](?=[0-9])|([a-zA-Z]+)\/([a-zA-Z]+)\/([a-zA-Z]+)|([0-9])+(\.([0-9]+))*([\-]([0-9])+)+|([0-9])+[,]([0-9])+[\-]([0-9])+[,]([0-9])+|([0-9])+[ης]+([\-]([0-9])+)+|([0-9]){1,4}[\/]([0-9]){1,2}([\/]([0-9]){0,4}){0,1}|[A-Za-z]+\@[A-Za-z]+(\-[A-Za-z]+)*\.[A-Za-z]+|([a-zA-Z]+)(\-([a-zA-Z]+))+|(?<=[a-z\uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0146\u0148\u0149\u014B\u014D\u014F\u0151\u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA
749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώήύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])\.(?=[A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0
104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\
u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u3
03F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F]),(?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4
DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])(?:-|–|—|--|---|——|~)(?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u
06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])[:<>=/](?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])�token_match��url_match�
2
+ ��A�
3
+ � ��A� �$ΗΠΑ��A�$ΗΠΑ�'��A�'�''��A�''�'ΣΟΥΝ��A�'ΣΟΥΝC�είμαι�'βγαινε��A�'βγαινεC�βγαίνω�'βλεπε��A�'βλεπεC�βλέπω�'γραφα��A�'γραφαC�γράφω�'γω��A�'γωC�εγώ�'δειξε��A�'δειξεC�δείχνω�'θελα��A�'θελαC�θέλω�'κανε��A�'κανεC�κάνω�'κει��A�'κειC�εκεί�'κλεβε��A�'κλεβεC�κλέβω�'λεγα��A�'λεγαC�λέγω�'λεγαν��A�'λεγανC�λέγω�'λεγε��A�'λεγεC�λέγω�'μας��A�'μαςC�εμάς�'μαστε��A�'μαστεC�είμαι�'μεις��A�'μειςC�εγώ�'μετ��A�'μετC�μετά�'μουν��A�'μουνC�είμαι�'μουνα��A�'μουναC�είμαι�'ναι��A�'ναιC�είμαι�'ξερες��A�'ξερεςC�ξέρω�'ξομολογήθηκε��A�'ξομολογήθηκεC�εξομολογούμαι�'παιρνα��A�'παιρναC�παίρνω�'πανε��A�'πανεC�λέγω�'πε��A�'πεC�λέγω�'πρεπε��A�'πρεπεC�πρέπει�'ρθε��A�'ρθεC�έρχομαι�'ρθεί��A�'ρθείC�έρχομαι�'ρθει��A�'ρθειC�έρχομαι�'ρθουν��A�'ρθουνC�έρχομαι�'ρθούνε��A�'ρθούνεC�έρχομαι�'ριξε��A�'ριξεC�ρίχνω�'ρχεται��A�'ρχεταιC�έρχομαι�'σένα��A�'σέναC�εγώ�'σβηνε��A�'σβηνεC�σβήνω�'σκασε��A�'σκασεC�σκάω�'σπαγαν��A�'σπαγανC�σπάω�'ταν��A�'τανC�είμαι�'τανε��A�'τανεC�είμαι�'φαγε��A�'φαγεC�τρώω�'φερε��A�'φερεC�φέρνω�'φύγε��A�'φύγεC�φεύγω�'χα��A�'χαC�έχω�'χαμε��A�'χαμεC�έχω�'χε��A�'χεC�έχω�'χει��A�'χειC�έχω�'χεις��A�'χειςC�έχω�'χουμε��A�'χουμεC�έχω�'χουν��A�'χουνC�έχω�(*_*)��A�(*_*)�(-8��A�(-8�(-:��A�(-:�(-;��A�(-;�(-_-)��A�(-_-)�(._.)��A�(._.)�(:��A�(:�(;��A�(;�(=��A�(=�(>_<)��A�(>_<)�(^_^)��A�(^_^)�(o:��A�(o:�(¬_¬)��A�(¬_¬)�(ಠ_ಠ)��A�(ಠ_ಠ)�(╯°□°)╯︵┻━┻��A�(╯°□°)╯︵┻━┻�)-:��A�)-:�):��A�):�-_-��A�-_-�-__-��A�-__-�._.��A�._.�0.0��A�0.0�0.o��A�0.o�0_0��A�0_0�0_o��A�0_o�10μ.μ.��A�10�A�μ.μ.C�μ.μ.�10μμ��A�10�A�μμC�μ.μ.�10π.μ.��A�10�A�π.μ.C�π.μ.�10πμ��A�10�A�πμC�π.μ.�11μ.μ.��A�11�A�μ.μ.C�μ.μ.�11μμ��A�11�A�μμC�μ.μ.�11π.μ.��A�11�A�π.μ.C�π.μ.�11πμ��A�11�A�πμC�π.μ.�12μ.μ.��A�12�A�μ.μ.C�μ.μ.�12μμ��A�12�A�μμC�μ.μ.�12π.μ.��A�12�A�π.μ.C�π.μ.�12πμ��A�12�A�πμC�π.μ.�1μ.μ.��A�1�A�μ.μ.C�μ.μ.�1μμ��A�1�A�μμC�μ.μ.�1π.μ.��A�1�A�π.μ.C�π.μ.�1πμ��A�1�A�πμC�π.μ.�2μ.μ.��A�2�A�μ.μ.C�μ.μ.�2μμ��A�2�A�μμC�μ.μ.�2π.μ.��A�2�A�π.μ.C�π.μ.�2πμ��A�2�A�πμC�π.μ.�3μ.μ.��A�3�A�μ.μ.C�μ.μ.�3μμ��A�3�A�μμC�μ.μ.�3π.μ.��A�3�A�π.μ.C�π.μ.�3πμ��A�3�A�πμC�π.μ.�4μ.μ.��
A�4�A�μ.μ.C�μ.μ.�4μμ��A�4�A�μμC�μ.μ.�4π.μ.��A�4�A�π.μ.C�π.μ.�4πμ��A�4�A�πμC�π.μ.�5μ.μ.��A�5�A�μ.μ.C�μ.μ.�5μμ��A�5�A�μμC�μ.μ.�5π.μ.��A�5�A�π.μ.C�π.μ.�5πμ��A�5�A�πμC�π.μ.�6μ.μ.��A�6�A�μ.μ.C�μ.μ.�6μμ��A�6�A�μμC�μ.μ.�6π.μ.��A�6�A�π.μ.C�π.μ.�6πμ��A�6�A�πμC�π.μ.�7μ.μ.��A�7�A�μ.μ.C�μ.μ.�7μμ��A�7�A�μμC�μ.μ.�7π.μ.��A�7�A�π.μ.C�π.μ.�7πμ��A�7�A�πμC�π.μ.�8)��A�8)�8-)��A�8-)�8-D��A�8-D�8D��A�8D�8μ.μ.��A�8�A�μ.μ.C�μ.μ.�8μμ��A�8�A�μμC�μ.μ.�8π.μ.��A�8�A�π.μ.C�π.μ.�8πμ��A�8�A�πμC�π.μ.�9μ.μ.��A�9�A�μ.μ.C�μ.μ.�9μμ��A�9�A�μμC�μ.μ.�9π.μ.��A�9�A�π.μ.C�π.μ.�9πμ��A�9�A�πμC�π.μ.�:'(��A�:'(�:')��A�:')�:'-(��A�:'-(�:'-)��A�:'-)�:(��A�:(�:((��A�:((�:(((��A�:(((�:()��A�:()�:)��A�:)�:))��A�:))�:)))��A�:)))�:*��A�:*�:-(��A�:-(�:-((��A�:-((�:-(((��A�:-(((�:-)��A�:-)�:-))��A�:-))�:-)))��A�:-)))�:-*��A�:-*�:-/��A�:-/�:-0��A�:-0�:-3��A�:-3�:->��A�:->�:-D��A�:-D�:-O��A�:-O�:-P��A�:-P�:-X��A�:-X�:-]��A�:-]�:-o��A�:-o�:-p��A�:-p�:-x��A�:-x�:-|��A�:-|�:-}��A�:-}�:/��A�:/�:0��A�:0�:1��A�:1�:3��A�:3�:>��A�:>�:D��A�:D�:O��A�:O�:P��A�:P�:X��A�:X�:]��A�:]�:o��A�:o�:o)��A�:o)�:p��A�:p�:x��A�:x�:|��A�:|�:}��A�:}�:’(��A�:’(�:’)��A�:’)�:’-(��A�:’-(�:’-)��A�:’-)�;)��A�;)�;-)��A�;-)�;-D��A�;-D�;D��A�;D�;_;��A�;_;�<.<��A�<.<�</3��A�</3�<3��A�<3�<33��A�<33�<333��A�<333�<space>��A�<space>�=(��A�=(�=)��A�=)�=/��A�=/�=3��A�=3�=D��A�=D�=[��A�=[�=]��A�=]�=|��A�=|�>.<��A�>.<�>.>��A�>.>�>:(��A�>:(�>:o��A�>:o�><(((*>��A�><(((*>�@_@��A�@_@�C++��A�C++�O.O��A�O.O�O.o��A�O.o�O_O��A�O_O�O_o��A�O_o�V.V��A�V.V�V_V��A�V_V�XD��A�XD�XDD��A�XDD�[-:��A�[-:�[:��A�[:�[=��A�[=�\")��A�\")�\n��A�\n�\t��A�\t�]=��A�]=�^_^��A�^_^�^__^��A�^__^�^___^��A�^___^�a.��A�a.�b.��A�b.�c.��A�c.�d.��A�d.�e.��A�e.�f.��A�f.�g.��A�g.�h.��A�h.�i.��A�i.�j.��A�j.�k.��A�k.�l.��A�l.�m.��A�m.�n.��A�n.�o.��A�o.�o.0��A�o.0�o.O��A�o.O�o.o��A�o.o�o_0��A�o_0�o_O��A�o_O�o_o��A�o_o�p.��A�p.�q.��A�q.�r.��A�r.�s.��A�s.�t.��A�t.�u.��A�u.�v.��A�v.�v.v��A�v.v�v_v��A�v_v�w.��A�w.�x.��A�x.�xD��A�xD�xDD��A�xDD�y.��A�y.�z.��A�z.� ��A� C� 
�¯\(ツ)/¯��A�¯\(ツ)/¯�°C.��A�°�A�C�A�.�°F.��A�°�A�F�A�.�°K.��A�°�A�K�A�.�°c.��A�°�A�c�A�.�°f.��A�°�A�f�A�.�°k.��A�°�A�k�A�.�ä.��A�ä.�ö.��A�ö.�ü.��A�ü.�Α'��A�Α'�Α.Ε.��A�Α.Ε.�Α.Ε.Β.Ε.��A�Α.Ε.Β.Ε.�Α.Ε.Ι.��A�Α.Ε.Ι.�Α.Ε.Π.��A�Α.Ε.Π.�Α.Μ.Α.��A�Α.Μ.Α.�Α.Π.Θ.��A�Α.Π.Θ.�Α.Τ.��A�Α.Τ.�Α.Χ.��A�Α.Χ.�ΑΓΡ.��A�ΑΓΡ.C�Αγροτικός�ΑΝ.��A�ΑΝ.�ΑΠ'��A�ΑΠ'C�από�ΑΠ’��A�ΑΠ’C�από�Αγ.��A�Αγ.�Αγ. Γρ.��A�Αγ. Γρ.C�Αγία Γραφή�Αγόρασ'��A�Αγόρασ'C�αγοράζω�Αγόρασ’��A�Αγόρασ’C�αγοράζω�Αθ.��A�Αθ.C�Αθανάσιος�Αλ.��A�Αλ.�Αλεξ.��A�Αλεξ.C�Αλέξανδρος�Αλλ'��A�Αλλ'C�αλλά�Αλλ’��A�Αλλ’C�αλλά�Αμ'��A�Αμ'C�άμα�Αμ’��A�Αμ’C�άμα�Αν.��A�Αν.�Αντ'��A�Αντ'C�αντί�Αντ.��A�Αντ.�Αντ’��A�Αντ’C�αντί�Απ'��A�Απ'C�από�Απ.��A�Απ.�Απρ.��A�Απρ.C�Απρίλιος�Απ’��A�Απ’C�από�Αφ'��A�Αφ'C�από�Αφ’��A�Αφ’C�από�Αύγ.��A�Αύγ.C�Αύγουστος�Α’��A�Α’�Β'��A�Β'�Β)��A�Β)�Β.Ζ.��A�Β.Ζ.�Β.Ι.Ο.��A�Β.Ι.Ο.�Β.Κ.��A�Β.Κ.�Β.Μ.Α.��A�Β.Μ.Α.�Βάψ'��A�Βάψ'C�βάφω�Βάψ’��A�Βάψ’C�βάφω�Βασ.��A�Βασ.�Β’��A�Β’�Γ'��A�Γ'�Γ)��A�Γ)�Γ.Γ.��A�Γ.Γ.�Γ.Δ.��A�Γ.Δ.�ΓΙ'��A�ΓΙ'C�για�ΓΙ’��A�ΓΙ’C�για�Γι'��A�Γι'C�για�Γι’��A�Γι’C�για�Γκ.��A�Γκ.�Γ’��A�Γ’�Δ.Ε.Η.��A�Δ.Ε.Η.�Δ.Ε.Σ.Ε.��A�Δ.Ε.Σ.Ε.�Δ.Ν.��A�Δ.Ν.�Δ.Ο.Υ.��A�Δ.Ο.Υ.�Δ.Σ.��A�Δ.Σ.�Δ.Υ.��A�Δ.Υ.�ΔΙ.ΚΑ.Τ.Σ.Α.��A�ΔΙ.ΚΑ.Τ.Σ.Α.�Δέσ'��A�Δέσ'C�δένω�Δέσ’��A�Δέσ’C�δένω�Δεκ.��A�Δεκ.C�Δεκέμβριος�Δεσ'��A�Δεσ'C�δένω�Δεσ’��A�Δεσ’C�δένω�Δηλ.��A�Δηλ.�Δημ.��A�Δημ.C�Δήμος�Δι'��A�Δι'C�δια�Διον.��A�Διον.�Δι’��A�Δι’C�δια�Δωσ'��A�Δωσ'C�δίνω�Δωσ’��A�Δωσ’C�δίνω�Δύσκολ'��A�Δύσκολ'C�δύσκολος�Δύσκολ’��A�Δύσκολ’C�δύσκολος�Ε.Α.��A�Ε.Α.�Ε.Α.Κ.��A�Ε.Α.Κ.�Ε.Α.Π.��A�Ε.Α.Π.�Ε.Ε.��A�Ε.Ε.�Ε.Κ.��A�Ε.Κ.�Ε.ΚΕ.ΠΙΣ.��A�Ε.ΚΕ.ΠΙΣ.�Ε.Λ.Α.��A�Ε.Λ.Α.�Ε.Λ.Ι.Α.��A�Ε.Λ.Ι.Α.�Ε.Π.Σ.��A�Ε.Π.Σ.�Ε.Π.Τ.Α.��A�Ε.Π.Τ.Α.�Ε.Σ.Ε.Ε.Κ.��A�Ε.Σ.Ε.Ε.Κ.�Ε.Υ.Κ.��A�Ε.Υ.Κ.�ΕΕ.��A�ΕΕ.�ΕΚ.��A�ΕΚ.�ΕΛ.��A�ΕΛ.�ΕΛ.ΑΣ.��A�ΕΛ.ΑΣ.�Εθν.��A�Εθν.�Ελ.��A�Ελ.�Εμ.��A�Εμ.�Επ'��A�Επ'C�επί�Επ.��A�Επ.�Επ’��A�Επ’C�επί�Ευ.��A�Ευ.�Εφ'��A�Εφ'C�επί�Εφ’��A�Εφ’C�επί�Η'��A�Η'�Η.Π.Α.��A�Η.Π.Α.�Η’��A�Η’�Θ'��A�Θ'C�θα�ΘΕ.��A�ΘΕ.�Θεμ.��A�Θεμ.�Θεοδ.��A�Θεοδ.�Θρ.��A�Θρ.�Θ’��A�Θ’C�θα�Ι.Ε.Κ.��A�Ι.Ε.Κ.�Ι.Κ.Α.��A�Ι.Κ.Α.�Ι.Κ.Υ.��A�Ι.Κ.Υ.�Ι.Σ.Θ.��A�Ι.Σ
.Θ.�Ι.Χ.��A�Ι.Χ.�ΙΖ'��A�ΙΖ'�ΙΖ’��A�ΙΖ’�ΙΧ.��A�ΙΧ.�Ιαν.��A�Ιαν.C�Ιανουάριος�Ιούλ.��A�Ιούλ.C�Ιούλιος�Ιούν.��A�Ιούν.C�Ιούνιος�Ιωαν.��A�Ιωαν.C�Ιωάννης�Κ.Α.Α.��A�Κ.Α.Α.�Κ.Α.Ε.��A�Κ.Α.Ε.�Κ.Β.Σ.��A�Κ.Β.Σ.�Κ.Δ.��A�Κ.Δ.�Κ.Ε.��A�Κ.Ε.�Κ.Ε.Κ.��A�Κ.Ε.Κ.�Κ.Ι.��A�Κ.Ι.�Κ.Ι.Θ.��A�Κ.Ι.Θ.�Κ.Κ.��A�Κ.Κ.�Κ.ΚΕΚ.��A�Κ.ΚΕΚ.�Κ.Ο.��A�Κ.Ο.�Κ.Π.Ρ.��A�Κ.Π.Ρ.�ΚΑΤ.��A�ΚΑΤ.�ΚΚ.��A�ΚΚ.�Κάν'��A�Κάν'C�κάνω�Κάν’��A�Κάν’C�κάνω�Καθ'��A�Καθ'C�κάθε�Καθ’��A�Καθ’C�κάθε�Καν.��A�Καν.�Καρ.��A�Καρ.�Κατ'��A�Κατ'C�κατά�Κατ.��A�Κατ.�Κατ’��A�Κατ’C�κατά�Κυρ.��A�Κυρ.�Κων.��A�Κων.�Λ.Α.��A�Λ.Α.�Λ.Χ.��A�Λ.Χ.�Λ.χ.��A�Λ.χ.�Λήξ'��A�Λήξ'C�λήγω�Λήξ’��A�Λήξ’C�λήγω�Λεωφ.��A�Λεωφ.�Λι.��A�Λι.�Μ'��A�Μ'C�με�Μ. Ασία��A�Μ. ΑσίαC�Μικρά Ασία�Μ.Δ.Ε.��A�Μ.Δ.Ε.�Μ.Ε.Ο.��A�Μ.Ε.Ο.�Μ.Ζ.��A�Μ.Ζ.�Μ.Μ.Ε.��A�Μ.Μ.Ε.�Μ.Ο.��A�Μ.Ο.�ΜΕΤ'��A�ΜΕΤ'C�μετά�ΜΕΤ’��A�ΜΕΤ’C�μετά�Μάρτ'��A�Μάρτ'C�Μάρτιος�Μάρτ.��A�Μάρτ.C�Μάρτιος�Μάρτ’��A�Μάρτ’C�Μάρτιος�Μέσ'��A�Μέσ'C�μέσα�Μέσ’��A�Μέσ’C�μέσα�Μεγ.��A�Μεγ.�Μετ'��A�Μετ'C�μετά�Μετ’��A�Μετ’C�μετά�Μιλτ.��A�Μιλτ.�Μιχ.��A�Μιχ.�Μ’��A�Μ’C�με�Ν'��A�Ν'C�να�Ν.Δ.��A�Ν.Δ.�Ν.Ε.Α.��A�Ν.Ε.Α.�Ν.Κ.��A�Ν.Κ.�Ν.Ο.��A�Ν.Ο.�Ν.Ο.Θ.��A�Ν.Ο.Θ.�Ν.Π.Δ.Δ.��A�Ν.Π.Δ.Δ.�Ν.Υ.��A�Ν.Υ.�ΝΔ.��A�ΝΔ.�Νικ.��A�Νικ.�Νοέμβρ.��A�Νοέμβρ.C�Νοέμβριος�Ντ'��A�Ντ'�Ντ.��A�Ντ.�Ντ’��A�Ντ’�Ν’��A�Ν’C�να�Ο'��A�Ο'�Ο.Α.��A�Ο.Α.�Ο.Α.Ε.Δ.��A�Ο.Α.Ε.Δ.�Ο.Δ.��A�Ο.Δ.�Ο.Ε.Ε.��A�Ο.Ε.Ε.�Ο.Ε.Ε.Κ.��A�Ο.Ε.Ε.Κ.�Ο.Η.Ε.��A�Ο.Η.Ε.�Ο.Κ.��A�Ο.Κ.�Οκτ.��A���κτ.C�Οκτώβριος�Ο’��A�Ο’�Π.Δ.��A�Π.Δ.�Π.Ε.Κ.Δ.Υ.��A�Π.Ε.Κ.Δ.Υ.�Π.Ε.Π.��A�Π.Ε.Π.�Π.Μ.Σ.��A�Π.Μ.Σ.�Π.Χ.��A�Π.Χ.�ΠΑΡ'��A�ΠΑΡ'C�παρά�ΠΑΡ’��A�ΠΑΡ’C�παρά�ΠΟΛ.��A�ΠΟΛ.�Πάρ'��A�Πάρ'C�παίρνω�Πάρ’��A�Πάρ’C�παίρνω�Παίξ'��A�Παίξ'C�παίζω�Παίξ’��A�Παίξ’C�παίζω�Παρ'��A�Παρ'C�παρά�Παρ.��A�Παρ.�Παρ’��A�Παρ’C�παρά�Πλ.��A�Πλ.�Πρ.��A�Πρ.�Σ'��A�Σ'C�σε�Σ.Δ.Ο.Ε.��A�Σ.Δ.Ο.Ε.�Σ.Ε.��A�Σ.Ε.�Σ.Ε.Κ.��A�Σ.Ε.Κ.�Σ.Π.Δ.Ω.Β.��A�Σ.Π.Δ.Ω.Β.�Σ.Τ.��A�Σ.Τ.�Σαβ.��A�Σαβ.�Σεπτ.��A�Σεπτ.C�Σεπτέμβριος�Στ'��A�Στ'C�στο�Στ.��A�Στ.�ΣτΕ.��A�ΣτΕ.�Στρ.��A�Στρ.�Στ’��A�Στ’C�στο�Σ’��A�Σ’C�σε�Τ'��A�Τ'C�το�Τ.Α.��A�Τ.Α.�Τ.Ε.Ε.��A�Τ.Ε.Ε.�Τ.Ε.Ι.��A�Τ.Ε.Ι.�ΤΡ.��A�ΤΡ.�Τζ.��A�Τζ.�Τηλ.��A�Τηλ.�Τ’��A�Τ’C
�το�Υ.Γ.��A�Υ.Γ.�ΥΓ.��A�ΥΓ.�ΥΠ.Ε.Π.Θ.��A�ΥΠ.Ε.Π.Θ.�Υπ'��A�Υπ'C�υπό�Υπ’��A�Υπ’C�υπό�Φ.Α.Β.Ε.��A�Φ.Α.Β.Ε.�Φ.Κ.��A�Φ.Κ.�Φ.Π.Α.��A�Φ.Π.Α.�Φ.Σ.��A�Φ.Σ.�Φ.Χ.��A�Φ.Χ.�Φέρ'��A�Φέρ'C�φέρνω�Φέρ’��A�Φέρ’C�φέρνω�Φεβρ.��A�Φεβρ.C�Φεβρουάριος�Φερ'��A�Φερ'C�φέρνω�Φερ’��A�Φερ’C�φέρνω�Φιλ.��A�Φιλ.�Χ.Α.Α.��A�Χ.Α.Α.�Χ.Χ.��A�Χ.Χ.�ΧΡ.��A�ΧΡ.�Χαρ.��A�Χαρ.�Χιλ.��A�Χιλ.�Χρ.��A�Χρ.�άγ.��A�άγ.�άρθρ.��A�άρθρ.�άσ'��A�άσ'C�αφήνω�άσ’��A�άσ’C�αφήνω�έφθασ'��A�έφθασ'C�φθάνω�έφθασ’��A�έφθασ’C�φθάνω�αι.��A�αι.�αλλ'��A�αλλ'C�αλλά�αλλ’��A�αλλ’C�αλλά�αν.��A�αν.�απ.��A�απ.�αρ.��A�αρ.�αριθ.��A�αριθ.�αριθμ.��A�αριθμ.�αφ'��A�αφ'C�από�αφ’��A�αφ’C�από�β'��A�β'�βλ.��A�βλ.�β’��A�β’�γ.γ.��A�γ.γ.�γεν.��A�γεν.�γι'��A�γι'C�για�γι’��A�γι’C�για�γραμμ.��A�γραμμ.�δ.δ.��A�δ.δ.�δ.σ.��A�δ.σ.�δεσ'��A�δεσ'C�δένω�δεσ’��A�δεσ’C�δένω�δηλ.��A�δηλ.�δι'��A�δι'C�δια�δισ.��A�δισ.�δι’��A�δι’C�δια�δολ.��A�δολ.�δρχ.��A�δρχ.�δώσ'��A�δώσ'C�δίνω�δώσ’��A�δώσ’C�δίνω�εκ.��A�εκ.�εκατ.��A�εκατ.�ελ.��A�ελ.�εξ'��A�εξ'C�εκ�εξ’��A�εξ’C�εκ�επ'��A�επ'C�επί�επ’��A�επ’C�επί�εφ'��A�εφ'C�επί�εφ’��A�εφ’C�επί�θ'��A�θ'C�θα�θιν'��A�θιν'�θιν’��A�θιν’�θ’��A�θ’C�θα�κ'τσή��A�κ'τσήC�κουτσός�κ.��A�κ.�κ.ά.��A�κ.ά.�κ.α.��A�κ.α.�κ.κ.��A�κ.κ.�κ.λπ.��A�κ.λπ.�κ.ο.κ.��A�κ.ο.κ.�κ.τ.λ.��A�κ.τ.λ.�καθ'��A�καθ'C�κάθε�καθ’��A�καθ’C�κάθε�κατ'��A�κατ'C�κατά�κατ’��A�κατ’C�κατά�κι��A�κιC�και�κλπ.��A�κλπ.�κτλ.��A�κτλ.�κυβ.��A�κυβ.�κ’τσή��A�κ’τσήC�κουτσός�λ.χ.��A�λ.χ.�μ'��A�μ'C�με�μ.��A�μ.�μ.Χ.��A�μ.Χ.�μ.μ.��A�μ.μ.�μέσ'��A�μέσ'C�μέσα�μέσ’��A�μέσ’C�μέσα�μεσ'��A�μεσ'C�μέσα�μεσ’��A�μεσ’C�μέσα�μηδ'��A�μηδ'C�μήδε�μηδ’��A�μηδ’C�μήδε�μιλ.��A�μιλ.�μ’��A�μ’C�με�ν'��A�ν'C�να�ντ'��A�ντ'�ντ’��A�ντ’�ν’��A�ν’C�να�ολ'��A�ολ'C�όλος�ολ’��A�ολ’C�όλος�π.Χ.��A�π.Χ.�π.β.��A�π.β.�π.δ.��A�π.δ.�π.μ.��A�π.μ.�π.χ.��A�π.χ.�πάρ'��A�πάρ'C�παίρνω�πάρ’��A�πάρ’C�παίρνω�παρ'��A�παρ'C�παρά�παρ’��A�παρ’C�παρά�σ'��A�σ'C�σε�σ.��A�σ.�σ.α.λ.��A�σ.α.λ.�σ.σ.��A�σ.σ.�σελ.��A�σελ.�στρ.��A�στρ.�σ’��A�σ’C�σε�τ'��A�τ'C�το�τ'ς��A�τ'ς�τ.μ.��A�τ.μ.�τίποτ'��A�τίποτ'C�τίποτα�τίποτ’��A�τίποτ’C�τίποτα�τετ.��A�τετ.�τετρ.��A�τετρ.�τηλ.
��A�τηλ.�τρισ.��A�τρισ.�τόν.��A�τόν.�τ’��A�τ’C�το�τ’ς��A�τ’ς�υπ'��A�υπ'C�υπό�υπ.��A�υπ.�υπ’��A�υπ’C�υπό�φέρ'��A�φέρ'C�φέρνω�φέρ’��A�φέρ’C�φέρνω�φερ'��A�φερ'C�φέρνω�φερ’��A�φερ’C�φέρνω�χ.μ.��A�χ.μ.�χγρ.��A�χγρ.�χιλ.��A�χιλ.�χλμ.��A�χλμ.�όμουρφ'��A�όμουρφ'C�όμορφος�όμουρφ’��A�όμουρφ’C�όμορφος�ύστερ'��A�ύστερ'C�ύστερα�ύστερ’��A�ύστερ’C�ύστερα�ಠ_ಠ��A�ಠ_ಠ�ಠ︵ಠ��A�ಠ︵ಠ�—��A�—�’��A�’�’ΣΟΥΝ��A�’ΣΟΥΝC�είμαι�’βγαινε��A�’βγαινεC�βγαίνω�’βλεπε��A�’βλεπεC�βλέπω�’γραφα��A�’γραφαC�γράφω�’γω��A�’γωC�εγώ�’δειξε��A�’δειξεC�δείχνω�’θελα��A�’θελαC�θέλω�’κανε��A�’κανεC�κάνω�’κει��A�’κειC�εκεί�’κλεβε��A�’κλεβεC�κλέβω�’λεγα��A�’λεγαC�λέγω�’λεγαν��A�’λεγανC�λέγω�’λεγε��A�’λεγεC�λέγω�’μας��A�’μαςC�εμάς�’μαστε��A�’μαστεC�είμαι�’μεις��A�’μειςC�εγώ�’μετ��A�’μετC�μετά�’μουν��A�’μουνC�είμαι�’μουνα��A�’μουναC�είμαι�’ναι��A�’ναιC�είμαι�’ξερες��A�’ξερεςC�ξέρω�’ξομολογήθηκε��A�’ξομολογήθηκεC�εξομολογούμαι�’παιρνα��A�’παιρναC�παίρνω�’πανε��A�’πανεC�λέγω�’πε��A�’πεC�λέγω�’πρεπε��A�’πρεπεC�πρέπει�’ρθε��A�’ρθεC�έρχομαι�’ρθεί��A�’ρθείC�έρχομαι�’ρθει��A�’ρθειC�έρχομαι�’ρθουν��A�’ρθουνC�έρχομαι�’ρθούνε��A�’ρθούνεC�έρχομαι�’ριξε��A�’ριξεC�ρίχνω�’ρχεται��A�’ρχεταιC�έρχομαι�’σένα��A�’σέναC�εγώ�’σβηνε��A�’σβηνεC�σβήνω�’σκασε��A�’σκασεC�σκάω�’σπαγαν��A�’σπαγανC�σπάω�’ταν��A�’τανC�είμαι�’τανε��A�’τανεC�είμαι�’φαγε��A�’φαγεC�τρώω�’φερε��A�’φερεC�φέρνω�’φύγε��A�’φύγεC�φεύγω�’χα��A�’χαC�έχω�’χαμε��A�’χαμεC�έχω�’χε��A�’χεC�έχω�’χει��A�’χειC�έχω�’χεις��A�’χειςC�έχω�’χουμε��A�’χουμεC�έχω�’χουν��A�’χουνC�έχω�’’��A�’’�faster_heuristics�
trainable_lemmatizer/cfg ADDED
@@ -0,0 +1,215 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "labels":[
3
+ 0,
4
+ 2,
5
+ 4,
6
+ 6,
7
+ 8,
8
+ 9,
9
+ 11,
10
+ 14,
11
+ 16,
12
+ 17,
13
+ 19,
14
+ 22,
15
+ 23,
16
+ 24,
17
+ 26,
18
+ 27,
19
+ 28,
20
+ 30,
21
+ 31,
22
+ 35,
23
+ 37,
24
+ 40,
25
+ 42,
26
+ 44,
27
+ 47,
28
+ 48,
29
+ 50,
30
+ 52,
31
+ 54,
32
+ 56,
33
+ 57,
34
+ 58,
35
+ 59,
36
+ 61,
37
+ 64,
38
+ 67,
39
+ 71,
40
+ 74,
41
+ 78,
42
+ 49,
43
+ 79,
44
+ 82,
45
+ 83,
46
+ 85,
47
+ 13,
48
+ 87,
49
+ 90,
50
+ 91,
51
+ 93,
52
+ 95,
53
+ 96,
54
+ 100,
55
+ 101,
56
+ 104,
57
+ 107,
58
+ 109,
59
+ 111,
60
+ 113,
61
+ 115,
62
+ 117,
63
+ 118,
64
+ 120,
65
+ 51,
66
+ 121,
67
+ 124,
68
+ 128,
69
+ 131,
70
+ 133,
71
+ 136,
72
+ 138,
73
+ 139,
74
+ 143,
75
+ 145,
76
+ 147,
77
+ 149,
78
+ 151,
79
+ 153,
80
+ 154,
81
+ 156,
82
+ 158,
83
+ 161,
84
+ 162,
85
+ 165,
86
+ 166,
87
+ 169,
88
+ 172,
89
+ 174,
90
+ 175,
91
+ 180,
92
+ 181,
93
+ 183,
94
+ 184,
95
+ 186,
96
+ 187,
97
+ 188,
98
+ 189,
99
+ 191,
100
+ 195,
101
+ 196,
102
+ 198,
103
+ 200,
104
+ 202,
105
+ 204,
106
+ 206,
107
+ 208,
108
+ 210,
109
+ 212,
110
+ 214,
111
+ 216,
112
+ 217,
113
+ 218,
114
+ 108,
115
+ 221,
116
+ 223,
117
+ 226,
118
+ 228,
119
+ 150,
120
+ 230,
121
+ 233,
122
+ 234,
123
+ 235,
124
+ 239,
125
+ 173,
126
+ 241,
127
+ 244,
128
+ 245,
129
+ 247,
130
+ 250,
131
+ 252,
132
+ 255,
133
+ 63,
134
+ 256,
135
+ 259,
136
+ 262,
137
+ 264,
138
+ 266,
139
+ 270,
140
+ 272,
141
+ 273,
142
+ 274,
143
+ 275,
144
+ 276,
145
+ 278,
146
+ 280,
147
+ 281,
148
+ 283,
149
+ 286,
150
+ 290,
151
+ 293,
152
+ 295,
153
+ 297,
154
+ 298,
155
+ 299,
156
+ 301,
157
+ 303,
158
+ 306,
159
+ 309,
160
+ 311,
161
+ 312,
162
+ 314,
163
+ 317,
164
+ 321,
165
+ 323,
166
+ 324,
167
+ 326,
168
+ 328,
169
+ 330,
170
+ 332,
171
+ 333,
172
+ 334,
173
+ 336,
174
+ 337,
175
+ 338,
176
+ 340,
177
+ 343,
178
+ 345,
179
+ 347,
180
+ 349,
181
+ 352,
182
+ 354,
183
+ 358,
184
+ 361,
185
+ 362,
186
+ 363,
187
+ 364,
188
+ 368,
189
+ 370,
190
+ 372,
191
+ 373,
192
+ 374,
193
+ 376,
194
+ 377,
195
+ 379,
196
+ 381,
197
+ 382,
198
+ 386,
199
+ 388,
200
+ 73,
201
+ 389,
202
+ 391,
203
+ 393,
204
+ 395,
205
+ 397,
206
+ 399,
207
+ 401,
208
+ 402,
209
+ 404,
210
+ 407,
211
+ 408,
212
+ 409,
213
+ 322
214
+ ]
215
+ }
trainable_lemmatizer/model ADDED
Binary file (650 kB). View file
 
trainable_lemmatizer/trees ADDED
Binary file (21.4 kB). View file
 
transformer/cfg ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "max_batch_items":4096
3
+ }
transformer/model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffc1456e2d78569293895e274be9acf7ee02aef4f7af9aa9efc230966f26a204
3
+ size 508592662
vocab/key2row ADDED
@@ -0,0 +1 @@
 
 
1
+
vocab/lookups.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76be8b528d0075f7aae98d6fa57a6d3c83ae480a8469e668d7b0af968995ac71
3
+ size 1
vocab/strings.json ADDED
The diff for this file is too large to render. See raw diff
 
vocab/vectors ADDED
Binary file (128 Bytes). View file
 
vocab/vectors.cfg ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "mode":"default"
3
+ }