Ver código fonte

interactive preview window

EliasVincent 2 anos atrás
pai
commit
00359ba054
1 arquivo alterado com 7 adições e 6 exclusões
  1. 7 6
      extensions/whisper_stt/script.py

+ 7 - 6
extensions/whisper_stt/script.py

@@ -1,17 +1,12 @@
 import gradio as gr
 import gradio as gr
 import speech_recognition as sr
 import speech_recognition as sr
 
 
-
 input_hijack = {
 input_hijack = {
     'state': False,
     'state': False,
     'value': ["", ""]
     'value': ["", ""]
 }
 }
 
 
 
 
-def input_modifier(string):
-    return string
-
-
 def do_stt():
 def do_stt():
     transcription = ""
     transcription = ""
     r = sr.Recognizer()
     r = sr.Recognizer()
@@ -30,7 +25,13 @@ def do_stt():
     return transcription
     return transcription
 
 
 
 
+def update_hijack(val):
+    input_hijack.update({"state": True, "value": [val, val]})
+    return val
+
+
 def ui():
 def ui():
     speech_button = gr.Button(value="🎙️")
     speech_button = gr.Button(value="🎙️")
-    output_transcription = gr.Textbox(label="STT-Preview", placeholder="Speech Preview. Click \"Generate\" to send")
+    output_transcription = gr.Textbox(label="STT-Input", placeholder="Speech Preview. Click \"Generate\" to send", interactive=True)
+    output_transcription.change(fn=update_hijack, inputs=[output_transcription])
     speech_button.click(do_stt, outputs=[output_transcription])
     speech_button.click(do_stt, outputs=[output_transcription])