Kevin676 committed on
Commit
38c3668
1 Parent(s): 116ce39

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -8
app.py CHANGED
@@ -8,12 +8,14 @@ from voicefixer import VoiceFixer
8
  voicefixer = VoiceFixer()
9
  import gradio as gr
10
  import openai
 
11
  import torchaudio
12
- from speechbrain.pretrained import WaveformEnhancement
13
- enhance_model = WaveformEnhancement.from_hparams(
14
- source="speechbrain/mtl-mimic-voicebank",
15
- savedir="pretrained_models/mtl-mimic-voicebank",
16
- run_opts={"device":"cuda"},
 
17
  )
18
 
19
  mes1 = [
@@ -78,10 +80,12 @@ def transcribe(apikey, upload, audio, choice1):
78
  cuda=True, # whether to use gpu acceleration
79
  mode = 0) # You can try out mode 0, 1, or 2 to find out the best result
80
 
81
- enhanced = enhance_model.enhance_file("audio1.wav")
 
 
82
 
83
- # Saving enhanced signal on disk
84
- torchaudio.save("enhanced.wav", enhanced.unsqueeze(0).cpu(), 16000)
85
 
86
  return [result.text, chat_response, "enhanced.wav"]
87
 
 
8
  voicefixer = VoiceFixer()
9
  import gradio as gr
10
  import openai
11
+ import torch
12
  import torchaudio
13
+ from speechbrain.pretrained import SpectralMaskEnhancement
14
+
15
+ enhance_model = SpectralMaskEnhancement.from_hparams(
16
+ source="speechbrain/metricgan-plus-voicebank",
17
+ savedir="pretrained_models/metricgan-plus-voicebank",
18
+ run_opts={"device":"cuda"},
19
  )
20
 
21
  mes1 = [
 
80
  cuda=True, # whether to use gpu acceleration
81
  mode = 0) # You can try out mode 0, 1, or 2 to find out the best result
82
 
83
+ noisy = enhance_model.load_audio(
84
+ "audio1.wav"
85
+ ).unsqueeze(0)
86
 
87
+ enhanced = enhance_model.enhance_batch(noisy, lengths=torch.tensor([1.]))
88
+ torchaudio.save("enhanced.wav", enhanced.cpu(), 16000)
89
 
90
  return [result.text, chat_response, "enhanced.wav"]
91