Spaces:

ktangri
/

call-sentiment

Runtime error

ktangri committed on Apr 6, 2022

Commit

eb6ba59

•

1 Parent(s): 1e629a8

Add punctuation correction

Files changed (2) hide show

app.py CHANGED Viewed

@@ -1,17 +1,20 @@
 import gradio as gr
 from transformers import pipeline, Wav2Vec2ProcessorWithLM
 from librosa import load, resample
 # Model identifier; the same string is passed to both the processor and the pipeline below.
 asr_model = 'patrickvonplaten/wav2vec2-base-100h-with-lm'
 # Processor loaded for that identifier; its tokenizer, feature extractor and decoder are handed to the pipeline.
 processor = Wav2Vec2ProcessorWithLM.from_pretrained(asr_model)
 # Speech-recognition pipeline, built once at module import and called by transcribe().
 asr = pipeline('automatic-speech-recognition', model=asr_model, tokenizer=processor.tokenizer, feature_extractor=processor.feature_extractor, decoder=processor.decoder)
 def transcribe(filepath):
 	"""Transcribe the audio file at *filepath* and return the recognised text.
 	The audio is loaded with librosa's ``load``, resampled to 16 kHz when it
 	was loaded at any other rate, and passed to the module-level ``asr``
 	pipeline; the pipeline result's ``'text'`` entry is returned.
 	"""
 	speech, sampling_rate = load(filepath)
 	if sampling_rate != 16000:
 		# Pass the rates by keyword: librosa >= 0.10 made orig_sr/target_sr
 		# keyword-only, so the positional form raises TypeError there.
 		speech = resample(speech, orig_sr=sampling_rate, target_sr=16000)
 	text = asr(speech)['text']
 	return text
 # Gradio audio input component: microphone source, 'filepath' type, labelled 'Speech input', not optional.
 mic = gr.inputs.Audio(source='microphone', type='filepath', label='Speech input', optional=False)

 import gradio as gr
 from transformers import pipeline, Wav2Vec2ProcessorWithLM
 from librosa import load, resample
+from rpunct import RestorePuncts
 # Model identifier; the same string is passed to both the processor and the pipeline below.
 asr_model = 'patrickvonplaten/wav2vec2-base-100h-with-lm'
 # Processor loaded for that identifier; its tokenizer, feature extractor and decoder are handed to the pipeline.
 processor = Wav2Vec2ProcessorWithLM.from_pretrained(asr_model)
 # Speech-recognition pipeline, built once at module import and called by transcribe().
 asr = pipeline('automatic-speech-recognition', model=asr_model, tokenizer=processor.tokenizer, feature_extractor=processor.feature_extractor, decoder=processor.decoder)
 # Punctuation restorer, built once at module import; transcribe() calls its punctuate() method.
+rpunct = RestorePuncts()
 def transcribe(filepath):
 	speech, sampling_rate = load(filepath)
 	if sampling_rate != 16000:
 		speech = resample(speech, sampling_rate, 16000)
 	text = asr(speech)['text']
+	text = rpunct.punctuate(text.lower())
 	return text
 # Gradio audio input component: microphone source, 'filepath' type, labelled 'Speech input', not optional.
 mic = gr.inputs.Audio(source='microphone', type='filepath', label='Speech input', optional=False)

requirements.txt CHANGED Viewed

@@ -3,3 +3,4 @@ transformers
 librosa
 pyctcdecode
 pypi-kenlm

 librosa
 pyctcdecode
 pypi-kenlm
+git+https://github.com/anuragshas/rpunct.git