From 5414c23932627aa2ef2e7a740c3b46e2d6b4387e Mon Sep 17 00:00:00 2001
From: Patrick von Platen
Date: Tue, 30 Nov 2021 12:06:11 +0000
Subject: [PATCH] correct tokenizer config

---
 tokenizer_config.json | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tokenizer_config.json b/tokenizer_config.json
index 94d9657..a5b5a87 100644
--- a/tokenizer_config.json
+++ b/tokenizer_config.json
@@ -1 +1 @@
-{"unk_token": "", "bos_token": "", "eos_token": "", "pad_token": "", "do_lower_case": false, "word_delimiter_token": "|", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
\ No newline at end of file
+{"unk_token": "", "bos_token": "", "eos_token": "", "pad_token": "", "word_delimiter_token": "|", "phonemizer_lang": "en-us", "phonemizer_backend": "espeak", "do_lower_case": false, "special_tokens_map_file": "../wav2vec2-xlsr-53-espeak-cv-ft/special_tokens_map.json", "tokenizer_file": null, "name_or_path": "../wav2vec2-xlsr-53-espeak-cv-ft/", "tokenizer_class": "Wav2Vec2PhonemeCTCTokenizer"}
\ No newline at end of file