Spaces:

bori0824
/

CTQAndSpeechFeedback

App Files Files Community

bori0824 commited on Jun 17

Commit

a0c3c1e

•

1 Parent(s): b55e3bf

Create app.py

Files changed (1) hide show

app.py +85 -0

app.py ADDED Viewed

	@@ -0,0 +1,85 @@

+import gradio as gr
+import speech_recognition as sr
+from Levenshtein import ratio
+import tempfile
+import numpy as np
+import soundfile as sf
+import os
+def transcribe_audio(file_info):
+    r = sr.Recognizer()
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmpfile:
+        sf.write(tmpfile.name, data=file_info[1], samplerate=44100, format='WAV')
+        tmpfile.seek(0)
+        with sr.AudioFile(tmpfile.name) as source:
+            audio_data = r.record(source)
+        os.remove(tmpfile.name)  # Cleanup temporary file
+    try:
+        text = r.recognize_google(audio_data)
+        return text
+    except sr.UnknownValueError:
+        return "Could not understand audio"
+    except sr.RequestError as e:
+        return f"Could not request results; {e}"
+def pronunciation_correction(expected_text, file_info):
+    print(f"Expected text: {expected_text}")
+    user_spoken_text = transcribe_audio(file_info)
+    print(f"User spoken text: {user_spoken_text}")
+    similarity = ratio(expected_text.lower(), user_spoken_text.lower())
+    description = f"{similarity:.2f}"
+    if similarity >= 0.9:
+        feedback = "Excellent pronunciation!"
+    elif similarity >= 0.7:
+        feedback = "Good pronunciation!"
+    elif similarity >= 0.5:
+        feedback = "Needs improvement."
+    else:
+        feedback = "Poor pronunciation, try to focus more on clarity."
+    print(f"Similarity: {similarity}, Feedback: {feedback}")
+    return feedback, description
+def validate_sentence(sentence):
+    if not sentence.strip():
+        return "Please enter a sentence."
+    return sentence
+def download_audio(file_info):
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmpfile:
+        sf.write(tmpfile.name, data=file_info[1], samplerate=44100, format='WAV')
+        tmpfile.seek(0)
+        return tmpfile.name  # Return file path for download
+with gr.Blocks() as app:
+    with gr.Row():
+        sentence_input = gr.Textbox(label="Enter Your Sentence Here")
+    validated_sentence = gr.Textbox(label="Valid Sentence", interactive=False)
+    audio_input = gr.Audio(label="Upload or Record Audio File", type="numpy")
+    check_pronunciation_button = gr.Button("Check Pronunciation")
+    pronunciation_feedback = gr.Textbox(label="Pronunciation Feedback")
+    pronunciation_score = gr.Number(label="Pronunciation Accuracy Score: 0 (No Match) ~ 1 (Perfect)")
+    download_audio_button = gr.Button("Download Recording")
+    download_output = gr.File(label="Download Your Recording")
+    sentence_input.change(
+        validate_sentence,
+        inputs=sentence_input,
+        outputs=validated_sentence
+    )
+    check_pronunciation_button.click(
+        pronunciation_correction,
+        inputs=[validated_sentence, audio_input],
+        outputs=[pronunciation_feedback, pronunciation_score]
+    )
+    download_audio_button.click(
+        download_audio,
+        inputs=[audio_input],
+        outputs=download_output
+    )
+app.launch(debug=True)