Spaces:

AndrewRWilliams
/

video-whisper

Runtime error

App Files Files Community

AndrewRWilliams committed on Oct 13, 2022

Commit

89d17ad

•

1 Parent(s): 4a2cf48

file.orig_name for audio?

Browse files

Files changed (1) hide show

app.py +22 -5

app.py CHANGED Viewed

@@ -1,30 +1,47 @@
 import gradio as gr
 import os
 import whisper
 from whisper.utils import write_srt
 model = whisper.load_model("base")
 def transcribe(file):
     result = model.transcribe(file)
     #transcript
-    with open(os.path.basename(file) + "-transcript.txt", 'w', encoding="utf-8") as f:
         f.write(result['text'])
     #subtitles
-    with open(os.path.basename(file) + "-subs.srt", 'w', encoding="utf-8") as srt:
         write_srt(result["segments"], file=srt)
     download = []
-    download.append(os.path.basename(file) + "-subs.srt");
-    download.append(os.path.basename(file) + "-transcript.txt");
     return download
 iface = gr.Interface(
-    title = 'Whisper transcription and subtitles from file.',
     fn=transcribe,
     inputs=[
         gr.inputs.Audio(source="upload", type="filepath", label="Upload Audio")

 import gradio as gr
 import os
+import unicodedata
 import whisper
 from whisper.utils import write_srt
 model = whisper.load_model("base")
+def slugify(value, allow_unicode=False):
+    """
+    Taken from https://github.com/django/django/blob/master/django/utils/text.py
+    Convert to ASCII if 'allow_unicode' is False. Convert spaces or repeated
+    dashes to single dashes. Remove characters that aren't alphanumerics,
+    underscores, or hyphens. Convert to lowercase. Also strip leading and
+    trailing whitespace, dashes, and underscores.
+    """
+    value = str(value)
+    if allow_unicode:
+        value = unicodedata.normalize('NFKC', value)
+    else:
+        value = unicodedata.normalize('NFKD', value).encode('ascii', 'ignore').decode('ascii')
+    value = re.sub(r'[^\w\s-]', '', value.lower())
+    return re.sub(r'[-\s]+', '-', value).strip('-_')
 def transcribe(file):
     result = model.transcribe(file)
     #transcript
+    with open(str(file.orig_name) + "-transcript.txt", 'w', encoding="utf-8") as f:
         f.write(result['text'])
     #subtitles
+    with open(str(file.orig_name) + "-subs.srt", 'w', encoding="utf-8") as srt:
         write_srt(result["segments"], file=srt)
     download = []
+    download.append(str(file.orig_name) + "-subs.srt");
+    download.append(str(file.orig_name) + "-transcript.txt");
     return download
 iface = gr.Interface(
+    title = 'Whisper transcription and subtitles from file',
     fn=transcribe,
     inputs=[
         gr.inputs.Audio(source="upload", type="filepath", label="Upload Audio")