tokenizer_config.json
287 B · 13 lines · json Raw
1 {
2 "add_blank": true,
3 "clean_up_tokenization_spaces": true,
4 "is_uroman": false,
5 "language": "hat",
6 "model_max_length": 1000000000000000019884624838656,
7 "normalize": true,
8 "pad_token": "|",
9 "phonemize": false,
10 "tokenizer_class": "VitsTokenizer",
11 "unk_token": "<unk>"
12 }
13