patrickvonplaten committed on
Commit
9965f67
•
1 Parent(s): 521ad3f

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -3
README.md CHANGED
@@ -34,13 +34,13 @@ The model can be used directly (without a language model) as follows:
34
  import torch
35
  import torchaudio
36
  import librosa
37
- from datasets import load_dataset
38
  import MeCab
39
  from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
40
 
41
  # config
42
  wakati = MeCab.Tagger("-Owakati")
43
- chars_to_ignore_regex = '[\\,\\、\\。\\.\\「\\」\\…\\?\\・]'
44
 
45
  # load data, processor and model
46
  test_dataset = load_dataset("common_voice", "ja", split="test[:2%]")
@@ -79,7 +79,7 @@ from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
79
 
80
  #config
81
  wakati = MeCab.Tagger("-Owakati")
82
- chars_to_ignore_regex = '[\\,\\、\\。\\.\\「\\」\\…\\?\\・]'
83
 
84
  # load data, processor and model
85
  test_dataset = load_dataset("common_voice", "ja", split="test")
 
34
  import torch
35
  import torchaudio
36
  import librosa
37
+ from datasets import load_dataset, load_metric
38
  import MeCab
39
  from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
40
 
41
  # config
42
  wakati = MeCab.Tagger("-Owakati")
43
+ chars_to_ignore_regex = '[\\\\,\\\\、\\\\。\\\\.\\\\「\\\\」\\\\…\\\\?\\\\・]'
44
 
45
  # load data, processor and model
46
  test_dataset = load_dataset("common_voice", "ja", split="test[:2%]")
 
79
 
80
  #config
81
  wakati = MeCab.Tagger("-Owakati")
82
+ chars_to_ignore_regex = '[\\\\,\\\\、\\\\。\\\\.\\\\「\\\\」\\\\…\\\\?\\\\・]'
83
 
84
  # load data, processor and model
85
  test_dataset = load_dataset("common_voice", "ja", split="test")