Training in progress, step 200
Browse files- .gitattributes +1 -0
- cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-4ec5d413f38fa76b.arrow +3 -0
- cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-580592b2fb57127e.arrow +3 -0
- cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-aa87c5bc3604ea74.arrow +3 -0
- cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/tmpf0pfrlg9 +3 -0
- pytorch_model.bin +1 -1
- run.sh +4 -2
- run_speech_recognition_seq2seq_streaming.py +12 -0
- runs/Mar07_17-04-19_23e47d4ed5a0/events.out.tfevents.1678208691.23e47d4ed5a0.1578177.0 +2 -2
- runs/Mar12_08-09-39_23e47d4ed5a0/1678613181.4145474/events.out.tfevents.1678613181.23e47d4ed5a0.410.1 +3 -0
- runs/Mar12_08-09-39_23e47d4ed5a0/events.out.tfevents.1678613181.23e47d4ed5a0.410.0 +3 -0
- training_args.bin +1 -1
.gitattributes
CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
35 |
+
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/tmpf0pfrlg9 filter=lfs diff=lfs merge=lfs -text
|
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-4ec5d413f38fa76b.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be2c8116543fdb45df72a764c42670f1b2ea5f5440c4e59c9aaa7bb1afb4b778
|
3 |
+
size 2773103360
|
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-580592b2fb57127e.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:962039a3de3e4deb6206cd9b228180d23138d1f8d824ca89ba81e1db89cd8d94
|
3 |
+
size 280592
|
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-aa87c5bc3604ea74.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50aba9e485e22ed0f82d6e42a16d474ce3f2877016b8579a3fabe2c399f00157
|
3 |
+
size 33048025696
|
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/tmpf0pfrlg9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:debee7770f9aff51ae42f4edf49a4b9e383f9f4d9c6560a01b92e0eb9bcde35c
|
3 |
+
size 3842117464
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6173655480
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de9477105cad7c3c04c8d72d24b68c5edc9f6011efa2ffd0c035f5cb0db38aa6
|
3 |
size 6173655480
|
run.sh
CHANGED
@@ -15,9 +15,9 @@ python run_speech_recognition_seq2seq_streaming.py \
|
|
15 |
--learning_rate="1e-5" \
|
16 |
--warmup_steps="500" \
|
17 |
--evaluation_strategy="steps" \
|
18 |
-
--eval_steps="
|
19 |
--save_strategy="steps" \
|
20 |
-
--save_steps="
|
21 |
--generation_max_length="225" \
|
22 |
--length_column_name="input_length" \
|
23 |
--max_duration_in_seconds="30" \
|
@@ -36,6 +36,8 @@ python run_speech_recognition_seq2seq_streaming.py \
|
|
36 |
--do_eval \
|
37 |
--predict_with_generate \
|
38 |
--do_normalize_eval \
|
|
|
|
|
39 |
--streaming="False" \
|
40 |
--use_auth_token \
|
41 |
--push_to_hub
|
|
|
15 |
--learning_rate="1e-5" \
|
16 |
--warmup_steps="500" \
|
17 |
--evaluation_strategy="steps" \
|
18 |
+
--eval_steps="200" \
|
19 |
--save_strategy="steps" \
|
20 |
+
--save_steps="200" \
|
21 |
--generation_max_length="225" \
|
22 |
--length_column_name="input_length" \
|
23 |
--max_duration_in_seconds="30" \
|
|
|
36 |
--do_eval \
|
37 |
--predict_with_generate \
|
38 |
--do_normalize_eval \
|
39 |
+
--do_lower_case \
|
40 |
+
--do_remove_punctuation \
|
41 |
--streaming="False" \
|
42 |
--use_auth_token \
|
43 |
--push_to_hub
|
run_speech_recognition_seq2seq_streaming.py
CHANGED
@@ -23,6 +23,7 @@ with 🤗 Datasets' streaming mode.
|
|
23 |
import logging
|
24 |
import os
|
25 |
import sys
|
|
|
26 |
from dataclasses import dataclass, field
|
27 |
from typing import Any, Dict, List, Optional, Union
|
28 |
|
@@ -477,6 +478,16 @@ def main():
|
|
477 |
else raw_datasets["eval"].select(range(data_args.max_eval_samples))
|
478 |
)
|
479 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
480 |
def prepare_dataset(batch):
|
481 |
# process audio
|
482 |
sample = batch[audio_column_name]
|
@@ -489,6 +500,7 @@ def main():
|
|
489 |
input_str = batch[text_column_name].lower() if do_lower_case else batch[text_column_name]
|
490 |
if do_remove_punctuation:
|
491 |
input_str = normalizer(input_str).strip()
|
|
|
492 |
batch["labels"] = tokenizer(input_str).input_ids
|
493 |
return batch
|
494 |
|
|
|
23 |
import logging
|
24 |
import os
|
25 |
import sys
|
26 |
+
import re
|
27 |
from dataclasses import dataclass, field
|
28 |
from typing import Any, Dict, List, Optional, Union
|
29 |
|
|
|
478 |
else raw_datasets["eval"].select(range(data_args.max_eval_samples))
|
479 |
)
|
480 |
|
481 |
+
def my_normalize(text):
|
482 |
+
valid_tokens = "ж - п и щ я о ш ц ъ д а й х э г т з ч ю б н ф ы е ё к р в ь с л у м"
|
483 |
+
valid_tokens = set([x.lower() for x in valid_tokens])
|
484 |
+
# The caret in the character class ([^) means match anything but
|
485 |
+
invalid_chars_regex = f"[^\s{re.escape(''.join(set(valid_tokens)))}]"
|
486 |
+
text = text.lower() if do_lower_case else text.upper()
|
487 |
+
text = re.sub(invalid_chars_regex, " ", text)
|
488 |
+
text = re.sub("\s+", " ", text).strip()
|
489 |
+
return text
|
490 |
+
|
491 |
def prepare_dataset(batch):
|
492 |
# process audio
|
493 |
sample = batch[audio_column_name]
|
|
|
500 |
input_str = batch[text_column_name].lower() if do_lower_case else batch[text_column_name]
|
501 |
if do_remove_punctuation:
|
502 |
input_str = normalizer(input_str).strip()
|
503 |
+
input_str = my_normalize(input_str).strip()
|
504 |
batch["labels"] = tokenizer(input_str).input_ids
|
505 |
return batch
|
506 |
|
runs/Mar07_17-04-19_23e47d4ed5a0/events.out.tfevents.1678208691.23e47d4ed5a0.1578177.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e0f5e3772e57e55a0ed5979498fd8fc21c659ef8c330a7125ead7721caf6bf7
|
3 |
+
size 22672
|
runs/Mar12_08-09-39_23e47d4ed5a0/1678613181.4145474/events.out.tfevents.1678613181.23e47d4ed5a0.410.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5773c502d21c61df4d71265495f122e8e78cc1356f28c143b2bdfc150b945744
|
3 |
+
size 6027
|
runs/Mar12_08-09-39_23e47d4ed5a0/events.out.tfevents.1678613181.23e47d4ed5a0.410.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47204d466cacdb28ccdb97755f2aff49e3f3bc93a97167d9dd55097a88d76070
|
3 |
+
size 6181
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3707
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7d55acb6843dac8089f2fa21146da1a4542b214f1e31b9f55026e7d8f400336
|
3 |
size 3707
|