Spaces:

jinggujiwoo7
/

speechfeedback

Sleeping

jinggujiwoo7 committed on Jun 17

Commit

fb11cf4

•

1 Parent(s): 187a6f4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,14 +4,16 @@ from Levenshtein import ratio
 import tempfile
 import numpy as np
 import soundfile as sf
 def transcribe_audio(file_info):
     r = sr.Recognizer()
-    with tempfile.NamedTemporaryFile(delete=True, suffix=".wav") as tmpfile:
         sf.write(tmpfile.name, data=file_info[1], samplerate=44100, format='WAV')
         tmpfile.seek(0)
         with sr.AudioFile(tmpfile.name) as source:
             audio_data = r.record(source)
     try:
         text = r.recognize_google(audio_data)
         return text
@@ -49,8 +51,7 @@ def download_audio(file_info):
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmpfile:
         sf.write(tmpfile.name, data=file_info[1], samplerate=44100, format='WAV')
         tmpfile.seek(0)
-        with open(tmpfile.name, "rb") as f:
-            return f.read(), "recording.wav"
 with gr.Blocks() as app:
     with gr.Row():
@@ -61,6 +62,7 @@ with gr.Blocks() as app:
     pronunciation_feedback = gr.Textbox(label="Pronunciation Feedback")
     pronunciation_score = gr.Number(label="Pronunciation Accuracy Score: 0 (No Match) ~ 1 (Perfect)")
     download_audio_button = gr.Button("Download Recording")
     sentence_input.change(
         validate_sentence,
@@ -77,7 +79,7 @@ with gr.Blocks() as app:
     download_audio_button.click(
         download_audio,
         inputs=[audio_input],
-        outputs=gr.File(label="Download Your Recording")
     )
 app.launch(debug=True)

 import tempfile
 import numpy as np
 import soundfile as sf
+import os
 def transcribe_audio(file_info):
     r = sr.Recognizer()
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmpfile:
         sf.write(tmpfile.name, data=file_info[1], samplerate=44100, format='WAV')
         tmpfile.seek(0)
         with sr.AudioFile(tmpfile.name) as source:
             audio_data = r.record(source)
+        os.remove(tmpfile.name)  # Cleanup temporary file
     try:
         text = r.recognize_google(audio_data)
         return text
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmpfile:
         sf.write(tmpfile.name, data=file_info[1], samplerate=44100, format='WAV')
         tmpfile.seek(0)
+        return tmpfile.name  # Return file path for download
 with gr.Blocks() as app:
     with gr.Row():
     pronunciation_feedback = gr.Textbox(label="Pronunciation Feedback")
     pronunciation_score = gr.Number(label="Pronunciation Accuracy Score: 0 (No Match) ~ 1 (Perfect)")
     download_audio_button = gr.Button("Download Recording")
+    download_output = gr.File(label="Download Your Recording")
     sentence_input.change(
         validate_sentence,
     download_audio_button.click(
         download_audio,
         inputs=[audio_input],
+        outputs=download_output
     )
 app.launch(debug=True)