Shiry committed on
Commit
1e7b9e3
1 Parent(s): 3b6efd8

Training in progress, step 200

Browse files
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/tmpf0pfrlg9 filter=lfs diff=lfs merge=lfs -text
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-4ec5d413f38fa76b.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be2c8116543fdb45df72a764c42670f1b2ea5f5440c4e59c9aaa7bb1afb4b778
3
+ size 2773103360
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-580592b2fb57127e.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:962039a3de3e4deb6206cd9b228180d23138d1f8d824ca89ba81e1db89cd8d94
3
+ size 280592
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/cache-aa87c5bc3604ea74.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50aba9e485e22ed0f82d6e42a16d474ce3f2877016b8579a3fabe2c399f00157
3
+ size 33048025696
cache/common_voice_walkie/ru/6.1.0/da0b466819242bff763a2319e08f49c101cf8efe6dae0d7468c3536a40b1addd/tmpf0pfrlg9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:debee7770f9aff51ae42f4edf49a4b9e383f9f4d9c6560a01b92e0eb9bcde35c
3
+ size 3842117464
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06d41119ed8ad3928ee7ca7219544b2c601fdde4ae17701d9e382de4615843db
3
  size 6173655480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de9477105cad7c3c04c8d72d24b68c5edc9f6011efa2ffd0c035f5cb0db38aa6
3
  size 6173655480
run.sh CHANGED
@@ -15,9 +15,9 @@ python run_speech_recognition_seq2seq_streaming.py \
15
  --learning_rate="1e-5" \
16
  --warmup_steps="500" \
17
  --evaluation_strategy="steps" \
18
- --eval_steps="1000" \
19
  --save_strategy="steps" \
20
- --save_steps="1000" \
21
  --generation_max_length="225" \
22
  --length_column_name="input_length" \
23
  --max_duration_in_seconds="30" \
@@ -36,6 +36,8 @@ python run_speech_recognition_seq2seq_streaming.py \
36
  --do_eval \
37
  --predict_with_generate \
38
  --do_normalize_eval \
 
 
39
  --streaming="False" \
40
  --use_auth_token \
41
  --push_to_hub
 
15
  --learning_rate="1e-5" \
16
  --warmup_steps="500" \
17
  --evaluation_strategy="steps" \
18
+ --eval_steps="200" \
19
  --save_strategy="steps" \
20
+ --save_steps="200" \
21
  --generation_max_length="225" \
22
  --length_column_name="input_length" \
23
  --max_duration_in_seconds="30" \
 
36
  --do_eval \
37
  --predict_with_generate \
38
  --do_normalize_eval \
39
+ --do_lower_case \
40
+ --do_remove_punctuation \
41
  --streaming="False" \
42
  --use_auth_token \
43
  --push_to_hub
run_speech_recognition_seq2seq_streaming.py CHANGED
@@ -23,6 +23,7 @@ with 🤗 Datasets' streaming mode.
23
  import logging
24
  import os
25
  import sys
 
26
  from dataclasses import dataclass, field
27
  from typing import Any, Dict, List, Optional, Union
28
 
@@ -477,6 +478,16 @@ def main():
477
  else raw_datasets["eval"].select(range(data_args.max_eval_samples))
478
  )
479
 
 
 
 
 
 
 
 
 
 
 
480
  def prepare_dataset(batch):
481
  # process audio
482
  sample = batch[audio_column_name]
@@ -489,6 +500,7 @@ def main():
489
  input_str = batch[text_column_name].lower() if do_lower_case else batch[text_column_name]
490
  if do_remove_punctuation:
491
  input_str = normalizer(input_str).strip()
 
492
  batch["labels"] = tokenizer(input_str).input_ids
493
  return batch
494
 
 
23
  import logging
24
  import os
25
  import sys
26
+ import re
27
  from dataclasses import dataclass, field
28
  from typing import Any, Dict, List, Optional, Union
29
 
 
478
  else raw_datasets["eval"].select(range(data_args.max_eval_samples))
479
  )
480
 
481
+ def my_normalize(text):
482
+ valid_tokens = "ж - п и щ я о ш ц ъ д а й х э г т з ч ю б н ф ы е ё к р в ь с л у м"
483
+ valid_tokens = set([x.lower() for x in valid_tokens])
484
+ # The caret in the character class ([^) means match anything but
485
+ invalid_chars_regex = f"[^\s{re.escape(''.join(set(valid_tokens)))}]"
486
+ text = text.lower() if do_lower_case else text.upper()
487
+ text = re.sub(invalid_chars_regex, " ", text)
488
+ text = re.sub("\s+", " ", text).strip()
489
+ return text
490
+
491
  def prepare_dataset(batch):
492
  # process audio
493
  sample = batch[audio_column_name]
 
500
  input_str = batch[text_column_name].lower() if do_lower_case else batch[text_column_name]
501
  if do_remove_punctuation:
502
  input_str = normalizer(input_str).strip()
503
+ input_str = my_normalize(input_str).strip()
504
  batch["labels"] = tokenizer(input_str).input_ids
505
  return batch
506
 
runs/Mar07_17-04-19_23e47d4ed5a0/events.out.tfevents.1678208691.23e47d4ed5a0.1578177.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2339fa7b3a4df20c5631216ae0e9097d62b73b9b954b968e0cd964b829bc53bb
3
- size 17805
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e0f5e3772e57e55a0ed5979498fd8fc21c659ef8c330a7125ead7721caf6bf7
3
+ size 22672
runs/Mar12_08-09-39_23e47d4ed5a0/1678613181.4145474/events.out.tfevents.1678613181.23e47d4ed5a0.410.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5773c502d21c61df4d71265495f122e8e78cc1356f28c143b2bdfc150b945744
3
+ size 6027
runs/Mar12_08-09-39_23e47d4ed5a0/events.out.tfevents.1678613181.23e47d4ed5a0.410.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47204d466cacdb28ccdb97755f2aff49e3f3bc93a97167d9dd55097a88d76070
3
+ size 6181
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c72dfc4edc78d738167d1d68154d3eb5f654ca466d6c04b4318f13d108c8f6f
3
  size 3707
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7d55acb6843dac8089f2fa21146da1a4542b214f1e31b9f55026e7d8f400336
3
  size 3707