jraramhoej
commited on
Commit
·
36a641a
1
Parent(s):
af1bbb4
Training in progress, step 1000
Browse files- config.json +1 -1
- fine-tune-whisper-streaming.ipynb +112 -272
- pytorch_model.bin +1 -1
- runs/Dec15_09-48-30_129-213-18-196/events.out.tfevents.1671097754.129-213-18-196.69807.0 +2 -2
- runs/Dec15_14-18-11_129-213-18-196/1671113929.6254616/events.out.tfevents.1671113929.129-213-18-196.4128231.1 +3 -0
- runs/Dec15_14-18-11_129-213-18-196/events.out.tfevents.1671113929.129-213-18-196.4128231.0 +3 -0
- training_args.bin +1 -1
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
5 |
"architectures": [
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "checkpoint-2000",
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
5 |
"architectures": [
|
fine-tune-whisper-streaming.ipynb
CHANGED
@@ -154,71 +154,14 @@
|
|
154 |
"execution_count": 2,
|
155 |
"id": "a2787582-554f-44ce-9f38-4180a5ed6b44",
|
156 |
"metadata": {},
|
157 |
-
"outputs": [
|
158 |
-
{
|
159 |
-
"data": {
|
160 |
-
"application/vnd.jupyter.widget-view+json": {
|
161 |
-
"model_id": "a5bfb5c5097d427e97faf28bc5c3aa8a",
|
162 |
-
"version_major": 2,
|
163 |
-
"version_minor": 0
|
164 |
-
},
|
165 |
-
"text/plain": [
|
166 |
-
"Downloading builder script: 0%| | 0.00/8.30k [00:00<?, ?B/s]"
|
167 |
-
]
|
168 |
-
},
|
169 |
-
"metadata": {},
|
170 |
-
"output_type": "display_data"
|
171 |
-
},
|
172 |
-
{
|
173 |
-
"data": {
|
174 |
-
"application/vnd.jupyter.widget-view+json": {
|
175 |
-
"model_id": "86fc1ce2e457497ea0d838ee2221bce4",
|
176 |
-
"version_major": 2,
|
177 |
-
"version_minor": 0
|
178 |
-
},
|
179 |
-
"text/plain": [
|
180 |
-
"Downloading readme: 0%| | 0.00/12.2k [00:00<?, ?B/s]"
|
181 |
-
]
|
182 |
-
},
|
183 |
-
"metadata": {},
|
184 |
-
"output_type": "display_data"
|
185 |
-
},
|
186 |
-
{
|
187 |
-
"data": {
|
188 |
-
"application/vnd.jupyter.widget-view+json": {
|
189 |
-
"model_id": "03d8267a06a5435c8de7726bb0492621",
|
190 |
-
"version_major": 2,
|
191 |
-
"version_minor": 0
|
192 |
-
},
|
193 |
-
"text/plain": [
|
194 |
-
"Downloading extra modules: 0%| | 0.00/3.44k [00:00<?, ?B/s]"
|
195 |
-
]
|
196 |
-
},
|
197 |
-
"metadata": {},
|
198 |
-
"output_type": "display_data"
|
199 |
-
},
|
200 |
-
{
|
201 |
-
"data": {
|
202 |
-
"application/vnd.jupyter.widget-view+json": {
|
203 |
-
"model_id": "67700bc114c74e05b2e8c0fa31ef479c",
|
204 |
-
"version_major": 2,
|
205 |
-
"version_minor": 0
|
206 |
-
},
|
207 |
-
"text/plain": [
|
208 |
-
"Downloading extra modules: 0%| | 0.00/60.9k [00:00<?, ?B/s]"
|
209 |
-
]
|
210 |
-
},
|
211 |
-
"metadata": {},
|
212 |
-
"output_type": "display_data"
|
213 |
-
}
|
214 |
-
],
|
215 |
"source": [
|
216 |
"from datasets import IterableDatasetDict\n",
|
217 |
"\n",
|
218 |
"raw_datasets = IterableDatasetDict()\n",
|
219 |
"\n",
|
220 |
-
"raw_datasets[\"train\"] = load_streaming_dataset(\"mozilla-foundation/common_voice_11_0\", \"
|
221 |
-
"raw_datasets[\"test\"] = load_streaming_dataset(\"mozilla-foundation/common_voice_11_0\", \"
|
222 |
]
|
223 |
},
|
224 |
{
|
@@ -254,110 +197,11 @@
|
|
254 |
"execution_count": 3,
|
255 |
"id": "77d9f0c5-8607-4642-a8ac-c3ab2e223ea6",
|
256 |
"metadata": {},
|
257 |
-
"outputs": [
|
258 |
-
{
|
259 |
-
"data": {
|
260 |
-
"application/vnd.jupyter.widget-view+json": {
|
261 |
-
"model_id": "75b767165e6e43db816df3911cfa841d",
|
262 |
-
"version_major": 2,
|
263 |
-
"version_minor": 0
|
264 |
-
},
|
265 |
-
"text/plain": [
|
266 |
-
"Downloading: 0%| | 0.00/185k [00:00<?, ?B/s]"
|
267 |
-
]
|
268 |
-
},
|
269 |
-
"metadata": {},
|
270 |
-
"output_type": "display_data"
|
271 |
-
},
|
272 |
-
{
|
273 |
-
"data": {
|
274 |
-
"application/vnd.jupyter.widget-view+json": {
|
275 |
-
"model_id": "147d3f2f6bcf46b694088b963c0b8bbb",
|
276 |
-
"version_major": 2,
|
277 |
-
"version_minor": 0
|
278 |
-
},
|
279 |
-
"text/plain": [
|
280 |
-
"Downloading: 0%| | 0.00/829 [00:00<?, ?B/s]"
|
281 |
-
]
|
282 |
-
},
|
283 |
-
"metadata": {},
|
284 |
-
"output_type": "display_data"
|
285 |
-
},
|
286 |
-
{
|
287 |
-
"data": {
|
288 |
-
"application/vnd.jupyter.widget-view+json": {
|
289 |
-
"model_id": "0a2ef4e849214883809f2717e04e8efd",
|
290 |
-
"version_major": 2,
|
291 |
-
"version_minor": 0
|
292 |
-
},
|
293 |
-
"text/plain": [
|
294 |
-
"Downloading: 0%| | 0.00/1.04M [00:00<?, ?B/s]"
|
295 |
-
]
|
296 |
-
},
|
297 |
-
"metadata": {},
|
298 |
-
"output_type": "display_data"
|
299 |
-
},
|
300 |
-
{
|
301 |
-
"data": {
|
302 |
-
"application/vnd.jupyter.widget-view+json": {
|
303 |
-
"model_id": "157bdd4e09944f2fb4a564b5498ac986",
|
304 |
-
"version_major": 2,
|
305 |
-
"version_minor": 0
|
306 |
-
},
|
307 |
-
"text/plain": [
|
308 |
-
"Downloading: 0%| | 0.00/494k [00:00<?, ?B/s]"
|
309 |
-
]
|
310 |
-
},
|
311 |
-
"metadata": {},
|
312 |
-
"output_type": "display_data"
|
313 |
-
},
|
314 |
-
{
|
315 |
-
"data": {
|
316 |
-
"application/vnd.jupyter.widget-view+json": {
|
317 |
-
"model_id": "37577267369d486aaf821fb9b616e54a",
|
318 |
-
"version_major": 2,
|
319 |
-
"version_minor": 0
|
320 |
-
},
|
321 |
-
"text/plain": [
|
322 |
-
"Downloading: 0%| | 0.00/52.7k [00:00<?, ?B/s]"
|
323 |
-
]
|
324 |
-
},
|
325 |
-
"metadata": {},
|
326 |
-
"output_type": "display_data"
|
327 |
-
},
|
328 |
-
{
|
329 |
-
"data": {
|
330 |
-
"application/vnd.jupyter.widget-view+json": {
|
331 |
-
"model_id": "abc2d68feaff450c92d0b2223841d551",
|
332 |
-
"version_major": 2,
|
333 |
-
"version_minor": 0
|
334 |
-
},
|
335 |
-
"text/plain": [
|
336 |
-
"Downloading: 0%| | 0.00/2.11k [00:00<?, ?B/s]"
|
337 |
-
]
|
338 |
-
},
|
339 |
-
"metadata": {},
|
340 |
-
"output_type": "display_data"
|
341 |
-
},
|
342 |
-
{
|
343 |
-
"data": {
|
344 |
-
"application/vnd.jupyter.widget-view+json": {
|
345 |
-
"model_id": "7483217a05e944309128f439da2e0a11",
|
346 |
-
"version_major": 2,
|
347 |
-
"version_minor": 0
|
348 |
-
},
|
349 |
-
"text/plain": [
|
350 |
-
"Downloading: 0%| | 0.00/2.06k [00:00<?, ?B/s]"
|
351 |
-
]
|
352 |
-
},
|
353 |
-
"metadata": {},
|
354 |
-
"output_type": "display_data"
|
355 |
-
}
|
356 |
-
],
|
357 |
"source": [
|
358 |
"from transformers import WhisperProcessor\n",
|
359 |
"\n",
|
360 |
-
"processor = WhisperProcessor.from_pretrained(\"openai/whisper-small\", language=\"
|
361 |
]
|
362 |
},
|
363 |
{
|
@@ -715,22 +559,7 @@
|
|
715 |
"execution_count": 14,
|
716 |
"id": "b22b4011-f31f-4b57-b684-c52332f92890",
|
717 |
"metadata": {},
|
718 |
-
"outputs": [
|
719 |
-
{
|
720 |
-
"data": {
|
721 |
-
"application/vnd.jupyter.widget-view+json": {
|
722 |
-
"model_id": "98ab67e0e7c14bbebd4f8526e604c70b",
|
723 |
-
"version_major": 2,
|
724 |
-
"version_minor": 0
|
725 |
-
},
|
726 |
-
"text/plain": [
|
727 |
-
"Downloading builder script: 0%| | 0.00/4.49k [00:00<?, ?B/s]"
|
728 |
-
]
|
729 |
-
},
|
730 |
-
"metadata": {},
|
731 |
-
"output_type": "display_data"
|
732 |
-
}
|
733 |
-
],
|
734 |
"source": [
|
735 |
"import evaluate\n",
|
736 |
"\n",
|
@@ -809,40 +638,11 @@
|
|
809 |
"execution_count": 16,
|
810 |
"id": "5a10cc4b-07ec-4ebd-ac1d-7c601023594f",
|
811 |
"metadata": {},
|
812 |
-
"outputs": [
|
813 |
-
{
|
814 |
-
"data": {
|
815 |
-
"application/vnd.jupyter.widget-view+json": {
|
816 |
-
"model_id": "e72a167577c24decbca6625ad8586d16",
|
817 |
-
"version_major": 2,
|
818 |
-
"version_minor": 0
|
819 |
-
},
|
820 |
-
"text/plain": [
|
821 |
-
"Downloading: 0%| | 0.00/1.97k [00:00<?, ?B/s]"
|
822 |
-
]
|
823 |
-
},
|
824 |
-
"metadata": {},
|
825 |
-
"output_type": "display_data"
|
826 |
-
},
|
827 |
-
{
|
828 |
-
"data": {
|
829 |
-
"application/vnd.jupyter.widget-view+json": {
|
830 |
-
"model_id": "b801991734784e80a45e0fa326e29760",
|
831 |
-
"version_major": 2,
|
832 |
-
"version_minor": 0
|
833 |
-
},
|
834 |
-
"text/plain": [
|
835 |
-
"Downloading: 0%| | 0.00/967M [00:00<?, ?B/s]"
|
836 |
-
]
|
837 |
-
},
|
838 |
-
"metadata": {},
|
839 |
-
"output_type": "display_data"
|
840 |
-
}
|
841 |
-
],
|
842 |
"source": [
|
843 |
"from transformers import WhisperForConditionalGeneration\n",
|
844 |
"\n",
|
845 |
-
"model = WhisperForConditionalGeneration.from_pretrained(\"
|
846 |
]
|
847 |
},
|
848 |
{
|
@@ -1065,8 +865,8 @@
|
|
1065 |
" Gradient Accumulation steps = 1\n",
|
1066 |
" Total optimization steps = 2000\n",
|
1067 |
" Number of trainable parameters = 241734912\n",
|
1068 |
-
"Reading metadata...:
|
1069 |
-
"Reading metadata...:
|
1070 |
"The following columns in the training set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
|
1071 |
]
|
1072 |
},
|
@@ -1076,8 +876,8 @@
|
|
1076 |
"\n",
|
1077 |
" <div>\n",
|
1078 |
" \n",
|
1079 |
-
" <progress value='
|
1080 |
-
" [
|
1081 |
" </div>\n",
|
1082 |
" <table border=\"1\" class=\"dataframe\">\n",
|
1083 |
" <thead>\n",
|
@@ -1085,16 +885,9 @@
|
|
1085 |
" <th>Step</th>\n",
|
1086 |
" <th>Training Loss</th>\n",
|
1087 |
" <th>Validation Loss</th>\n",
|
1088 |
-
" <th>Wer</th>\n",
|
1089 |
" </tr>\n",
|
1090 |
" </thead>\n",
|
1091 |
" <tbody>\n",
|
1092 |
-
" <tr>\n",
|
1093 |
-
" <td>1000</td>\n",
|
1094 |
-
" <td>0.009000</td>\n",
|
1095 |
-
" <td>0.444009</td>\n",
|
1096 |
-
" <td>34.279589</td>\n",
|
1097 |
-
" </tr>\n",
|
1098 |
" </tbody>\n",
|
1099 |
"</table><p>"
|
1100 |
],
|
@@ -1109,60 +902,108 @@
|
|
1109 |
"name": "stderr",
|
1110 |
"output_type": "stream",
|
1111 |
"text": [
|
1112 |
-
"Reading metadata...:
|
1113 |
-
"Reading metadata...:
|
1114 |
-
"Reading metadata...:
|
1115 |
-
"Reading metadata...:
|
1116 |
-
"Reading metadata...:
|
1117 |
-
"Reading metadata...:
|
1118 |
-
"Reading metadata...:
|
1119 |
-
"Reading metadata...:
|
1120 |
-
"Reading metadata...:
|
1121 |
-
"Reading metadata...:
|
1122 |
-
"Reading metadata...:
|
1123 |
-
"Reading metadata...:
|
1124 |
-
"Reading metadata...:
|
1125 |
-
"Reading metadata...:
|
1126 |
-
"Reading metadata...:
|
1127 |
-
"Reading metadata...:
|
1128 |
-
"
|
1129 |
-
"
|
1130 |
-
"
|
1131 |
-
"Reading metadata...:
|
1132 |
-
"
|
1133 |
-
"
|
1134 |
-
"
|
1135 |
-
"
|
1136 |
-
"
|
1137 |
-
"
|
1138 |
-
"
|
1139 |
-
"
|
1140 |
-
"
|
1141 |
-
"
|
1142 |
-
"
|
1143 |
-
"
|
1144 |
-
"Reading metadata...:
|
1145 |
-
"Reading metadata...:
|
1146 |
-
"Reading metadata...:
|
1147 |
-
"Reading metadata...:
|
1148 |
-
"Reading metadata...:
|
1149 |
-
"Reading metadata...:
|
1150 |
-
"Reading metadata...:
|
1151 |
-
"Reading metadata...:
|
1152 |
-
"Reading metadata...:
|
1153 |
-
"Reading metadata...:
|
1154 |
-
"Reading metadata...:
|
1155 |
-
"Reading metadata...:
|
1156 |
-
"Reading metadata...:
|
1157 |
-
"Reading metadata...:
|
1158 |
-
"Reading metadata...:
|
1159 |
-
"Reading metadata...:
|
1160 |
-
"Reading metadata...:
|
1161 |
-
"Reading metadata...:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1162 |
"***** Running Evaluation *****\n",
|
1163 |
" Num examples: Unknown\n",
|
1164 |
" Batch size = 8\n",
|
1165 |
-
"Reading metadata...:
|
1166 |
"The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
|
1167 |
]
|
1168 |
}
|
@@ -1201,8 +1042,7 @@
|
|
1201 |
"kwargs = {\n",
|
1202 |
" \"dataset_tags\": \"mozilla-foundation/common_voice_11_0\",\n",
|
1203 |
" \"dataset\": \"Common Voice 11.0\", # a 'pretty' name for the training dataset\n",
|
1204 |
-
" \"
|
1205 |
-
" \"model_name\": \"Whisper Small Lt and Sr\", # a 'pretty' name for your model\n",
|
1206 |
" \"finetuned_from\": \"openai/whisper-small\",\n",
|
1207 |
" \"tasks\": \"automatic-speech-recognition\",\n",
|
1208 |
" \"tags\": \"whisper-event\",\n",
|
|
|
154 |
"execution_count": 2,
|
155 |
"id": "a2787582-554f-44ce-9f38-4180a5ed6b44",
|
156 |
"metadata": {},
|
157 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
158 |
"source": [
|
159 |
"from datasets import IterableDatasetDict\n",
|
160 |
"\n",
|
161 |
"raw_datasets = IterableDatasetDict()\n",
|
162 |
"\n",
|
163 |
+
"raw_datasets[\"train\"] = load_streaming_dataset(\"mozilla-foundation/common_voice_11_0\", \"sr\", split=\"train+validation\", use_auth_token=True) # set split=\"train+validation\" for low-resource\n",
|
164 |
+
"raw_datasets[\"test\"] = load_streaming_dataset(\"mozilla-foundation/common_voice_11_0\", \"sr\", split=\"test\", use_auth_token=True)"
|
165 |
]
|
166 |
},
|
167 |
{
|
|
|
197 |
"execution_count": 3,
|
198 |
"id": "77d9f0c5-8607-4642-a8ac-c3ab2e223ea6",
|
199 |
"metadata": {},
|
200 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
201 |
"source": [
|
202 |
"from transformers import WhisperProcessor\n",
|
203 |
"\n",
|
204 |
+
"processor = WhisperProcessor.from_pretrained(\"openai/whisper-small\", language=\"Serbian\", task=\"transcribe\")"
|
205 |
]
|
206 |
},
|
207 |
{
|
|
|
559 |
"execution_count": 14,
|
560 |
"id": "b22b4011-f31f-4b57-b684-c52332f92890",
|
561 |
"metadata": {},
|
562 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
563 |
"source": [
|
564 |
"import evaluate\n",
|
565 |
"\n",
|
|
|
638 |
"execution_count": 16,
|
639 |
"id": "5a10cc4b-07ec-4ebd-ac1d-7c601023594f",
|
640 |
"metadata": {},
|
641 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
642 |
"source": [
|
643 |
"from transformers import WhisperForConditionalGeneration\n",
|
644 |
"\n",
|
645 |
+
"model = WhisperForConditionalGeneration.from_pretrained(\"checkpoint-2000\")"
|
646 |
]
|
647 |
},
|
648 |
{
|
|
|
865 |
" Gradient Accumulation steps = 1\n",
|
866 |
" Total optimization steps = 2000\n",
|
867 |
" Number of trainable parameters = 241734912\n",
|
868 |
+
"Reading metadata...: 1045it [00:00, 5692.34it/s]\n",
|
869 |
+
"Reading metadata...: 623it [00:00, 4270.71it/s]\n",
|
870 |
"The following columns in the training set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
|
871 |
]
|
872 |
},
|
|
|
876 |
"\n",
|
877 |
" <div>\n",
|
878 |
" \n",
|
879 |
+
" <progress value='1001' max='2000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
|
880 |
+
" [1001/2000 1:45:14 < 1:45:14, 0.16 it/s, Epoch 49.01/9223372036854775807]\n",
|
881 |
" </div>\n",
|
882 |
" <table border=\"1\" class=\"dataframe\">\n",
|
883 |
" <thead>\n",
|
|
|
885 |
" <th>Step</th>\n",
|
886 |
" <th>Training Loss</th>\n",
|
887 |
" <th>Validation Loss</th>\n",
|
|
|
888 |
" </tr>\n",
|
889 |
" </thead>\n",
|
890 |
" <tbody>\n",
|
|
|
|
|
|
|
|
|
|
|
|
|
891 |
" </tbody>\n",
|
892 |
"</table><p>"
|
893 |
],
|
|
|
902 |
"name": "stderr",
|
903 |
"output_type": "stream",
|
904 |
"text": [
|
905 |
+
"Reading metadata...: 1045it [00:00, 5867.31it/s]\n",
|
906 |
+
"Reading metadata...: 623it [00:00, 4899.32it/s]\n",
|
907 |
+
"Reading metadata...: 1045it [00:00, 10001.87it/s]\n",
|
908 |
+
"Reading metadata...: 623it [00:00, 4402.30it/s]\n",
|
909 |
+
"Reading metadata...: 1045it [00:00, 10266.26it/s]\n",
|
910 |
+
"Reading metadata...: 623it [00:00, 3253.67it/s]\n",
|
911 |
+
"Reading metadata...: 1045it [00:00, 13354.24it/s]\n",
|
912 |
+
"Reading metadata...: 623it [00:00, 7292.22it/s]\n",
|
913 |
+
"Reading metadata...: 1045it [00:00, 33723.01it/s]\n",
|
914 |
+
"Reading metadata...: 623it [00:00, 28938.73it/s]\n",
|
915 |
+
"Reading metadata...: 1045it [00:00, 12782.78it/s]\n",
|
916 |
+
"Reading metadata...: 623it [00:00, 6901.10it/s]\n",
|
917 |
+
"Reading metadata...: 1045it [00:00, 34292.66it/s]\n",
|
918 |
+
"Reading metadata...: 623it [00:00, 33494.65it/s]\n",
|
919 |
+
"Reading metadata...: 1045it [00:00, 39667.03it/s]\n",
|
920 |
+
"Reading metadata...: 623it [00:00, 28214.13it/s]\n",
|
921 |
+
"Reading metadata...: 1045it [00:00, 42047.25it/s]\n",
|
922 |
+
"Reading metadata...: 623it [00:00, 32434.88it/s]\n",
|
923 |
+
"Reading metadata...: 1045it [00:00, 41330.01it/s]\n",
|
924 |
+
"Reading metadata...: 623it [00:00, 32047.04it/s]\n",
|
925 |
+
"Reading metadata...: 1045it [00:00, 29199.29it/s]\n",
|
926 |
+
"Reading metadata...: 623it [00:00, 30785.24it/s]\n",
|
927 |
+
"Reading metadata...: 1045it [00:00, 42721.43it/s]\n",
|
928 |
+
"Reading metadata...: 623it [00:00, 19130.06it/s]\n",
|
929 |
+
"Reading metadata...: 1045it [00:01, 738.01it/s]\n",
|
930 |
+
"Reading metadata...: 623it [00:01, 541.43it/s]\n",
|
931 |
+
"Reading metadata...: 1045it [00:00, 44482.59it/s]\n",
|
932 |
+
"Reading metadata...: 623it [00:00, 32484.48it/s]\n",
|
933 |
+
"Reading metadata...: 1045it [00:00, 41314.82it/s]\n",
|
934 |
+
"Reading metadata...: 623it [00:00, 28735.69it/s]\n",
|
935 |
+
"Reading metadata...: 1045it [00:00, 44215.15it/s]\n",
|
936 |
+
"Reading metadata...: 623it [00:00, 31580.71it/s]\n",
|
937 |
+
"Reading metadata...: 1045it [00:00, 1623.63it/s]\n",
|
938 |
+
"Reading metadata...: 623it [00:00, 1009.77it/s]\n",
|
939 |
+
"Reading metadata...: 1045it [00:00, 44171.93it/s]\n",
|
940 |
+
"Reading metadata...: 623it [00:00, 30811.38it/s]\n",
|
941 |
+
"Reading metadata...: 1045it [00:00, 43079.18it/s]\n",
|
942 |
+
"Reading metadata...: 623it [00:00, 15485.94it/s]\n",
|
943 |
+
"Reading metadata...: 1045it [00:00, 40702.87it/s]\n",
|
944 |
+
"Reading metadata...: 623it [00:00, 28661.31it/s]\n",
|
945 |
+
"Reading metadata...: 1045it [00:00, 44402.38it/s]\n",
|
946 |
+
"Reading metadata...: 623it [00:00, 31105.90it/s]\n",
|
947 |
+
"Reading metadata...: 1045it [00:00, 24505.06it/s]\n",
|
948 |
+
"Reading metadata...: 623it [00:00, 19740.06it/s]\n",
|
949 |
+
"Reading metadata...: 1045it [00:00, 4819.73it/s]\n",
|
950 |
+
"Reading metadata...: 623it [00:00, 4116.76it/s]\n",
|
951 |
+
"Reading metadata...: 1045it [00:00, 42929.81it/s]\n",
|
952 |
+
"Reading metadata...: 623it [00:00, 30741.78it/s]\n",
|
953 |
+
"Reading metadata...: 1045it [00:00, 9124.52it/s]\n",
|
954 |
+
"Reading metadata...: 623it [00:00, 4622.41it/s]\n",
|
955 |
+
"Reading metadata...: 1045it [00:00, 40983.75it/s]\n",
|
956 |
+
"Reading metadata...: 623it [00:00, 28923.67it/s]\n",
|
957 |
+
"Reading metadata...: 1045it [00:00, 9164.05it/s]\n",
|
958 |
+
"Reading metadata...: 623it [00:00, 5771.93it/s]\n",
|
959 |
+
"Reading metadata...: 1045it [00:00, 6674.98it/s]\n",
|
960 |
+
"Reading metadata...: 623it [00:00, 3780.80it/s]\n",
|
961 |
+
"Reading metadata...: 1045it [00:00, 43593.76it/s]\n",
|
962 |
+
"Reading metadata...: 623it [00:00, 21590.29it/s]\n",
|
963 |
+
"Reading metadata...: 1045it [00:00, 41968.74it/s]\n",
|
964 |
+
"Reading metadata...: 623it [00:00, 32694.20it/s]\n",
|
965 |
+
"Reading metadata...: 1045it [00:00, 17046.83it/s]\n",
|
966 |
+
"Reading metadata...: 623it [00:00, 11208.51it/s]\n",
|
967 |
+
"Reading metadata...: 1045it [00:00, 37953.07it/s]\n",
|
968 |
+
"Reading metadata...: 623it [00:00, 31590.64it/s]\n",
|
969 |
+
"Reading metadata...: 1045it [00:00, 39963.96it/s]\n",
|
970 |
+
"Reading metadata...: 623it [00:00, 30293.44it/s]\n",
|
971 |
+
"Reading metadata...: 1045it [00:00, 45293.92it/s]\n",
|
972 |
+
"Reading metadata...: 623it [00:00, 28211.39it/s]\n",
|
973 |
+
"Reading metadata...: 1045it [00:00, 3469.64it/s]\n",
|
974 |
+
"Reading metadata...: 623it [00:00, 6854.28it/s]\n",
|
975 |
+
"Reading metadata...: 1045it [00:00, 43085.10it/s]\n",
|
976 |
+
"Reading metadata...: 623it [00:00, 33438.50it/s]\n",
|
977 |
+
"Reading metadata...: 1045it [00:00, 32567.86it/s]\n",
|
978 |
+
"Reading metadata...: 623it [00:00, 27699.11it/s]\n",
|
979 |
+
"Reading metadata...: 1045it [00:00, 42481.27it/s]\n",
|
980 |
+
"Reading metadata...: 623it [00:00, 31889.43it/s]\n",
|
981 |
+
"Reading metadata...: 1045it [00:00, 16001.43it/s]\n",
|
982 |
+
"Reading metadata...: 623it [00:00, 13026.76it/s]\n",
|
983 |
+
"Reading metadata...: 1045it [00:00, 45249.50it/s]\n",
|
984 |
+
"Reading metadata...: 623it [00:00, 27699.70it/s]\n",
|
985 |
+
"Reading metadata...: 1045it [00:00, 41886.92it/s]\n",
|
986 |
+
"Reading metadata...: 623it [00:00, 30486.41it/s]\n",
|
987 |
+
"Reading metadata...: 1045it [00:00, 39246.49it/s]\n",
|
988 |
+
"Reading metadata...: 623it [00:00, 29180.46it/s]\n",
|
989 |
+
"Reading metadata...: 1045it [00:00, 40768.74it/s]\n",
|
990 |
+
"Reading metadata...: 623it [00:00, 25073.18it/s]\n",
|
991 |
+
"Reading metadata...: 1045it [00:00, 41413.97it/s]\n",
|
992 |
+
"Reading metadata...: 623it [00:00, 34066.69it/s]\n",
|
993 |
+
"Reading metadata...: 1045it [00:00, 43446.41it/s]\n",
|
994 |
+
"Reading metadata...: 623it [00:00, 14088.58it/s]\n",
|
995 |
+
"Reading metadata...: 1045it [00:00, 42264.17it/s]\n",
|
996 |
+
"Reading metadata...: 623it [00:00, 33832.48it/s]\n",
|
997 |
+
"Reading metadata...: 1045it [00:00, 35855.79it/s]\n",
|
998 |
+
"Reading metadata...: 623it [00:00, 14966.70it/s]\n",
|
999 |
+
"Reading metadata...: 1045it [00:00, 37491.43it/s]\n",
|
1000 |
+
"Reading metadata...: 623it [00:00, 25462.13it/s]\n",
|
1001 |
+
"Reading metadata...: 1045it [00:00, 18279.76it/s]\n",
|
1002 |
+
"Reading metadata...: 623it [00:00, 9944.59it/s]\n",
|
1003 |
"***** Running Evaluation *****\n",
|
1004 |
" Num examples: Unknown\n",
|
1005 |
" Batch size = 8\n",
|
1006 |
+
"Reading metadata...: 677it [00:00, 4738.28it/s]\n",
|
1007 |
"The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
|
1008 |
]
|
1009 |
}
|
|
|
1042 |
"kwargs = {\n",
|
1043 |
" \"dataset_tags\": \"mozilla-foundation/common_voice_11_0\",\n",
|
1044 |
" \"dataset\": \"Common Voice 11.0\", # a 'pretty' name for the training dataset\n",
|
1045 |
+
" \"model_name\": \"Whisper Small Lithuanian and Serbian sequentially trained\", # a 'pretty' name for your model\n",
|
|
|
1046 |
" \"finetuned_from\": \"openai/whisper-small\",\n",
|
1047 |
" \"tasks\": \"automatic-speech-recognition\",\n",
|
1048 |
" \"tags\": \"whisper-event\",\n",
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 967102601
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c102a56223c9d4c0073bf307faa42881b324cda17921f66be674baeaac81536
|
3 |
size 967102601
|
runs/Dec15_09-48-30_129-213-18-196/events.out.tfevents.1671097754.129-213-18-196.69807.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:111a1faf82a941b0dd777617baa73f1608b1d0d430dce19d00ba139736484de6
|
3 |
+
size 17822
|
runs/Dec15_14-18-11_129-213-18-196/1671113929.6254616/events.out.tfevents.1671113929.129-213-18-196.4128231.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e59c4de1c5f36a53463a3c2eb9bdca8cf8c8cce7e955aab755b08013d5a8b019
|
3 |
+
size 5864
|
runs/Dec15_14-18-11_129-213-18-196/events.out.tfevents.1671113929.129-213-18-196.4128231.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79e3c278a91be84dc37fe3af83dfcdc461de029979a79195988c9f7a1dbaf16e
|
3 |
+
size 10865
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3579
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3f2bc41361967c98d61c9072b7d10b71ba361fe800039babbb310b5e56c86cb
|
3 |
size 3579
|