Commit
·
e591f8d
1
Parent(s):
ca150fa
Tokens and LM
Browse files
- config.json +1 -1
- preprocessor_config.json +1 -0
- special_tokens_map.json +1 -1
- tokenizer_config.json +1 -1
config.json
CHANGED
|
@@ -101,7 +101,7 @@
|
|
| 101 |
1
|
| 102 |
],
|
| 103 |
"torch_dtype": "float32",
|
| 104 |
-
"transformers_version": "4.
|
| 105 |
"use_weighted_layer_sum": false,
|
| 106 |
"vocab_size": 57,
|
| 107 |
"xvector_output_dim": 512
|
|
|
|
| 101 |
1
|
| 102 |
],
|
| 103 |
"torch_dtype": "float32",
|
| 104 |
+
"transformers_version": "4.16.0",
|
| 105 |
"use_weighted_layer_sum": false,
|
| 106 |
"vocab_size": 57,
|
| 107 |
"xvector_output_dim": 512
|
preprocessor_config.json
CHANGED
|
@@ -4,6 +4,7 @@
|
|
| 4 |
"feature_size": 1,
|
| 5 |
"padding_side": "right",
|
| 6 |
"padding_value": 0.0,
|
|
|
|
| 7 |
"return_attention_mask": true,
|
| 8 |
"sampling_rate": 16000
|
| 9 |
}
|
|
|
|
| 4 |
"feature_size": 1,
|
| 5 |
"padding_side": "right",
|
| 6 |
"padding_value": 0.0,
|
| 7 |
+
"processor_class": "Wav2Vec2ProcessorWithLM",
|
| 8 |
"return_attention_mask": true,
|
| 9 |
"sampling_rate": 16000
|
| 10 |
}
|
special_tokens_map.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
|
|
|
|
| 1 |
+
{"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
|
tokenizer_config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "special_tokens_map_file": null, "tokenizer_file": null, "name_or_path": "
|
|
|
|
| 1 |
+
{"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "special_tokens_map_file": null, "tokenizer_file": null, "name_or_path": "anuragshas/wav2vec2-large-xls-r-300m-ur-cv8", "tokenizer_class": "Wav2Vec2CTCTokenizer", "processor_class": "Wav2Vec2ProcessorWithLM"}
|