phonemetransformers
/

CHILDES-PortugueseBr-phoneme-tokenizer

Inference Endpoints

Model card Files and versions Community

codebyzeb committed 22 days ago

Commit

cfa3f65

·

verified ·

1 Parent(s): 26ee18d

Upload tokenizer

Files changed (2) hide show

tokenizer.json +9 -0
tokenizer_config.json +8 -0

tokenizer.json CHANGED Viewed

@@ -21,6 +21,15 @@
       "normalized": false,
       "special": true
     },
     {
       "id": 3,
       "content": "UTT_BOUNDARY",

       "normalized": false,
       "special": true
     },
+    {
+      "id": 2,
+      "content": "WORD_BOUNDARY",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
     {
       "id": 3,
       "content": "UTT_BOUNDARY",

tokenizer_config.json CHANGED Viewed

@@ -17,6 +17,14 @@
       "single_word": false,
       "special": true
     },
     "3": {
       "content": "UTT_BOUNDARY",
       "lstrip": false,

       "single_word": false,
       "special": true
     },
+    "2": {
+      "content": "WORD_BOUNDARY",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
     "3": {
       "content": "UTT_BOUNDARY",
       "lstrip": false,