Speech-ChatGPT-Speech

Runtime error

Update app.py

#14

by Yusin - opened Dec 11, 2022

←

Files changed (1)

app.py CHANGED

@@ -6,9 +6,9 @@ default_lang = "en"
 # ChatGPT
 from pyChatGPT import ChatGPT
-import whisper
-whisper_model = whisper.load_model("small")
-#whisper = gr.Blocks.load(name="spaces/sanchit-gandhi/whisper-large-v2")
 import os
 session_token = os.environ.get('SessionToken')
@@ -46,40 +46,40 @@ def chat_hf(audio, custom_token, language):
     return whisper_text, gpt_response, fp.name
 # whisper
-def translate(audio):
-    print("""
-    —
-    Sending audio to Whisper ...
-    —
-    """)
-    audio = whisper.load_audio(audio)
-    audio = whisper.pad_or_trim(audio)
-    mel = whisper.log_mel_spectrogram(audio).to(whisper_model.device)
-    _, probs = whisper_model.detect_language(mel)
-    transcript_options = whisper.DecodingOptions(task="transcribe", fp16 = False)
-    transcription = whisper.decode(whisper_model, mel, transcript_options)
-    print("language spoken: " + transcription.language)
-    print("transcript: " + transcription.text)
-    print("———————————————————————————————————————————")
-    return transcription.text
 #def translate(audio):
 #    print("""
 #    —
 #    Sending audio to Whisper ...
 #    —
 #    """)
-#
-#    text_result = whisper(audio, None, "transcribe", fn_index=0)
-#    print(text_result)
-#    return text_result
 with gr.Blocks() as blocks:

 # ChatGPT
 from pyChatGPT import ChatGPT
+#import whisper
+#whisper_model = whisper.load_model("small")
+whisper = gr.Interface.load(name="spaces/sanchit-gandhi/whisper-large-v2")
 import os
 session_token = os.environ.get('SessionToken')
     return whisper_text, gpt_response, fp.name
 # whisper
 #def translate(audio):
 #    print("""
 #    —
 #    Sending audio to Whisper ...
 #    —
 #    """)
+#
+#    audio = whisper.load_audio(audio)
+#    audio = whisper.pad_or_trim(audio)
+#
+#    mel = whisper.log_mel_spectrogram(audio).to(whisper_model.device)
+#
+#    _, probs = whisper_model.detect_language(mel)
+#
+#    transcript_options = whisper.DecodingOptions(task="transcribe", fp16 = False)
+#
+#    transcription = whisper.decode(whisper_model, mel, transcript_options)
+#
+#    print("language spoken: " + transcription.language)
+#    print("transcript: " + transcription.text)
+#    print("———————————————————————————————————————————")
+#
+#    return transcription.text
+def translate(audio):
+    print("""
+    —
+    Sending audio to Whisper ...
+    —
+    """)
+    text_result = whisper(audio, None, "transcribe", fn_index=0)
+    print(text_result)
+    return text_result
 with gr.Blocks() as blocks: