Upload processor
Browse files
- preprocessor_config.json +0 -0
- special_tokens_map.json +8 -1
- tokenizer_config.json +2 -1
preprocessor_config.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
CHANGED
@@ -108,5 +108,12 @@
|
|
108 |
"<|notimestamps|>"
|
109 |
],
|
110 |
"bos_token": "<|endoftext|>",
|
111 |
-
"eos_token": "<|endoftext|>"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
112 |
}
|
|
|
108 |
"<|notimestamps|>"
|
109 |
],
|
110 |
"bos_token": "<|endoftext|>",
|
111 |
+
"eos_token": "<|endoftext|>",
|
112 |
+
"unk_token": {
|
113 |
+
"content": "<|endoftext|>",
|
114 |
+
"lstrip": false,
|
115 |
+
"normalized": true,
|
116 |
+
"rstrip": false,
|
117 |
+
"single_word": false
|
118 |
+
}
|
119 |
}
|
tokenizer_config.json
CHANGED
@@ -19,8 +19,9 @@
|
|
19 |
},
|
20 |
"errors": "replace",
|
21 |
"model_max_length": 1024,
|
22 |
-
"name_or_path": "whisper-
|
23 |
"pad_token": null,
|
|
|
24 |
"special_tokens_map_file": null,
|
25 |
"tokenizer_class": "WhisperTokenizer",
|
26 |
"unk_token": {
|
|
|
19 |
},
|
20 |
"errors": "replace",
|
21 |
"model_max_length": 1024,
|
22 |
+
"name_or_path": "ArthurZ/whisper-small.en",
|
23 |
"pad_token": null,
|
24 |
+
"processor_class": "WhisperProcessor",
|
25 |
"special_tokens_map_file": null,
|
26 |
"tokenizer_class": "WhisperTokenizer",
|
27 |
"unk_token": {
|