diff --git a/extensions/whisper_stt/script.py b/extensions/whisper_stt/script.py
index dcb4dfc9..9f07e5c9 100644
--- a/extensions/whisper_stt/script.py
+++ b/extensions/whisper_stt/script.py
@@ -1,17 +1,12 @@
 import gradio as gr
 import speech_recognition as sr
 
-
 input_hijack = {
     'state': False,
     'value': ["", ""]
 }
 
 
-def input_modifier(string):
-    return string
-
-
 def do_stt():
     transcription = ""
     r = sr.Recognizer()
@@ -30,7 +25,13 @@ def do_stt():
     return transcription
 
 
+def update_hijack(val):
+    input_hijack.update({"state": True, "value": [val, val]})
+    return val
+
+
 def ui():
     speech_button = gr.Button(value="🎙️")
-    output_transcription = gr.Textbox(label="STT-Preview", placeholder="Speech Preview. Click \"Generate\" to send")
+    output_transcription = gr.Textbox(label="STT-Input", placeholder="Speech Preview. Click \"Generate\" to send", interactive=True)
+    output_transcription.change(fn=update_hijack, inputs=[output_transcription])
     speech_button.click(do_stt, outputs=[output_transcription])