knowledge-scribe

Sleeping

dwb2023 committed on Oct 4, 2024

Commit

069559b

verified ·

1 Parent(s): a573025

update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -18,6 +18,14 @@ from transformers.pipelines.audio_utils import ffmpeg_read
 import torch
 from datasets import load_dataset, Dataset, DatasetDict
 import spaces
 # Constants
 MODEL_NAME = "openai/whisper-large-v3-turbo"
@@ -56,7 +64,7 @@ pipe = pipeline(
     model=model,
     tokenizer=tokenizer,
     feature_extractor=feature_extractor,
-    chunk_length_s=30,
 )
 def reset_and_update_dataset(new_data):

 import torch
 from datasets import load_dataset, Dataset, DatasetDict
 import spaces
+import subprocess
+# Install Flash Attention if possible
+subprocess.run(
+    "pip install flash-attn --no-build-isolation",
+    env={"FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"},
+    shell=True,
+)
 # Constants
 MODEL_NAME = "openai/whisper-large-v3-turbo"
     model=model,
     tokenizer=tokenizer,
     feature_extractor=feature_extractor,
+    chunk_length_s=900,  # Increased to 15 minutes
 )
 def reset_and_update_dataset(new_data):