Spaces:

yuangongfdu
/

whisper-at

Running

yuangongfdu committed on Jul 19, 2023

Commit

b8b03ab

•

1 Parent(s): cdcbb14

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,13 +9,14 @@ paper_text = "[Paper]"
 model = whisper.load_model("tiny")
 print('model loaded')
 def predict(audio_path, time_resolution):
-    def round_time_resolution(time_resolution):
-        multiple = float(time_resolution) / 0.4
-        rounded_multiple = round(multiple)
-        rounded_time_resolution = rounded_multiple * 0.4
-        return rounded_time_resolution
-    # audio_tagging_time_resolution = round_time_resolution(time_resolution)
     # result = model.transcribe(audio_path, at_time_res=audio_tagging_time_resolution)
     # # ASR Results
     # print(result["text"])
@@ -31,7 +32,7 @@ def predict(audio_path, time_resolution):
     #     print(segment)
     #     at_output = at_output + str(segment['time']['start']) + 's-' + str(segment['time']['end']) + 's: ' + ','.join([x[0] for x in segment['audio tags']]) + '\n'
     #     print(at_output)
-    asr_output, at_output = 's', 'k'
     return asr_output, at_output
 iface = gr.Interface(fn=predict,

 model = whisper.load_model("tiny")
 print('model loaded')
+def round_time_resolution(time_resolution):
+    multiple = float(time_resolution) / 0.4
+    rounded_multiple = round(multiple)
+    rounded_time_resolution = rounded_multiple * 0.4
+    return rounded_time_resolution
 def predict(audio_path, time_resolution):
+    audio_tagging_time_resolution = round_time_resolution(time_resolution)
     # result = model.transcribe(audio_path, at_time_res=audio_tagging_time_resolution)
     # # ASR Results
     # print(result["text"])
     #     print(segment)
     #     at_output = at_output + str(segment['time']['start']) + 's-' + str(segment['time']['end']) + 's: ' + ','.join([x[0] for x in segment['audio tags']]) + '\n'
     #     print(at_output)
+    asr_output, at_output = str(audio_tagging_time_resolution), 'k'
     return asr_output, at_output
 iface = gr.Interface(fn=predict,