Upload tokenizer
Browse files
- tokenizer_config.json +2 -1
- vocab.json +4 -3
tokenizer_config.json
CHANGED
|
@@ -4,6 +4,7 @@
|
|
| 4 |
"language": null,
|
| 5 |
"model_max_length": 1000000000000000019884624838656,
|
| 6 |
"pad_token": "<pad>",
|
| 7 |
-
"
|
|
|
|
| 8 |
"unk_token": "<unk>"
|
| 9 |
}
|
|
|
|
| 4 |
"language": null,
|
| 5 |
"model_max_length": 1000000000000000019884624838656,
|
| 6 |
"pad_token": "<pad>",
|
| 7 |
+
"phonemize": true,
|
| 8 |
+
"tokenizer_class": "VitsTokenizer",
|
| 9 |
"unk_token": "<unk>"
|
| 10 |
}
|
vocab.json
CHANGED
|
@@ -1,13 +1,14 @@
|
|
| 1 |
{
|
| 2 |
-
"": 16,
|
| 3 |
"!": 5,
|
| 4 |
"\"": 11,
|
| 5 |
"'": 176,
|
|
|
|
| 6 |
".": 4,
|
| 7 |
":": 2,
|
| 8 |
";": 1,
|
| 9 |
-
"<pad>":
|
| 10 |
-
"<unk>":
|
| 11 |
"?": 6,
|
| 12 |
"A": 17,
|
| 13 |
"B": 18,
|
|
|
|
| 1 |
{
|
| 2 |
+
" ": 16,
|
| 3 |
"!": 5,
|
| 4 |
"\"": 11,
|
| 5 |
"'": 176,
|
| 6 |
+
",": 3,
|
| 7 |
".": 4,
|
| 8 |
":": 2,
|
| 9 |
";": 1,
|
| 10 |
+
"<pad>": 177,
|
| 11 |
+
"<unk>": 178,
|
| 12 |
"?": 6,
|
| 13 |
"A": 17,
|
| 14 |
"B": 18,
|