Spaces:

yellowcandle
/

whisper-v3-gradio

Sleeping

App Files Community

yellowcandle committed on Jun 18, 2024

Commit

a28c209

unverified ·

1 Parent(s): 7f92c21

try to fix error

Browse files

Files changed (1) hide show

app.py +6 -6

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ from transformers import AutoModelForSpeechSeq2Seq, AutoProcessor, pipeline, Aut
 transcribe_model = None
 proofread_model = None
-@spaces.GPU(duration=60)
 def transcribe_audio(audio):
     global transcribe_model
     if audio is None:
@@ -16,7 +16,7 @@ def transcribe_audio(audio):
     if transcribe_model is None:
         return "Please select a model."
-    device = "cuda:0" if torch.cuda.is_available() else "mps" if torch.mps.is_available() else "cpu"
     torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
     processor = AutoProcessor.from_pretrained(transcribe_model)
@@ -36,13 +36,13 @@ def transcribe_audio(audio):
     result = pipe(audio)
     return result["text"]
-@spaces.GPU(duration=120)
 def proofread(text):
     global proofread_model
     if text is None:
         return "Please provide the transcribed text for proofreading."
-    device = "cuda:0" if torch.cuda.is_available() else "mps" if torch.mps.is_available() else "cpu"
     torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
     messages = [
@@ -63,7 +63,7 @@ def proofread(text):
 def load_models(transcribe_model_id, proofread_model_id):
     global transcribe_model, proofread_model
-    device = "cuda:0" if torch.cuda.is_available() else "mps" if torch.mps.is_available() else "cpu"
     torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
     transcribe_model = AutoModelForSpeechSeq2Seq.from_pretrained(
@@ -84,7 +84,7 @@ with gr.Blocks() as demo:
                 """)
     with gr.Row():
-        transcribe_model_dropdown = gr.Dropdown(choices=["openai/whisper-large-v3", "alvanlii/whisper-small-cantonese"], value="alvanlii/whisper-small-cantonese", label="Select Transcription Model")
         proofread_model_dropdown = gr.Dropdown(choices=["hfl/llama-3-chinese-8b-instruct-v3"], value="hfl/llama-3-chinese-8b-instruct-v3", label="Select Proofreading Model")
         load_button = gr.Button("Load Models")

 transcribe_model = None
 proofread_model = None
+@spaces.gpu(duration=60)
 def transcribe_audio(audio):
     global transcribe_model
     if audio is None:
     if transcribe_model is None:
         return "Please select a model."
+    device = "cuda:0" if torch.cuda.is_available() else "mps" if torch.backends.mps.is_available() else "cpu"
     torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
     processor = AutoProcessor.from_pretrained(transcribe_model)
     result = pipe(audio)
     return result["text"]
+@spaces.gpu(duration=120)
 def proofread(text):
     global proofread_model
     if text is None:
         return "Please provide the transcribed text for proofreading."
+    device = "cuda:0" if torch.cuda.is_available() else "mps" if torch.backends.mps.is_available() else "cpu"
     torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
     messages = [
 def load_models(transcribe_model_id, proofread_model_id):
     global transcribe_model, proofread_model
+    device = "cuda:0" if torch.cuda.is_available() else "mps" if torch.backends.mps.is_available() else "cpu"
     torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
     transcribe_model = AutoModelForSpeechSeq2Seq.from_pretrained(
                 """)
     with gr.Row():
+        transcribe_model_dropdown = gr.Dropdown(choices=["openai/whisper-large-v2", "alvanlii/whisper-small-cantonese"], value="alvanlii/whisper-small-cantonese", label="Select Transcription Model")
         proofread_model_dropdown = gr.Dropdown(choices=["hfl/llama-3-chinese-8b-instruct-v3"], value="hfl/llama-3-chinese-8b-instruct-v3", label="Select Proofreading Model")
         load_button = gr.Button("Load Models")