speech-to-speech-translation

Running

Marco-Cheung committed on Aug 19, 2023

Commit

5099504

•

1 Parent(s): ce5168c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import gradio as gr
 import numpy as np
 import torch
-from transformers import AutoProcessor, pipeline, BarkModel
 ASR_MODEL_NAME = "bofenghuang/whisper-large-v2-cv11-german"
 TTS_MODEL_NAME = "suno/bark-small"
@@ -10,11 +10,20 @@ voices = {
 "male" : "v2/de_speaker_0",
 "female" : "v2/de_speaker_3"
 }
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 # load speech translation checkpoint
 asr_pipe = pipeline("automatic-speech-recognition", model=ASR_MODEL_NAME, chunk_length_s=10,device=device)
 # load text-to-speech checkpoint
 processor = AutoProcessor.from_pretrained("suno/bark-small")
 model = BarkModel.from_pretrained("suno/bark-small").to(device)

 import gradio as gr
 import numpy as np
 import torch
+from transformers import AutoProcessor, pipeline, BarkModel, GenerationConfig
 ASR_MODEL_NAME = "bofenghuang/whisper-large-v2-cv11-german"
 TTS_MODEL_NAME = "suno/bark-small"
 "male" : "v2/de_speaker_0",
 "female" : "v2/de_speaker_3"
 }
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 # load speech translation checkpoint
 asr_pipe = pipeline("automatic-speech-recognition", model=ASR_MODEL_NAME, chunk_length_s=10,device=device)
+# update the generation config
+MULTILINGUAL = True  # set True for multilingual models, False for English-only
+generation_config = GenerationConfig.from_pretrained("openai/whisper-large-v2")
+#else:
+    #generation_config = GenerationConfig.from_pretrained("openai/whisper-medium.en")
+generation_config.push_to_hub(ASR_MODEL_NAME)
 # load text-to-speech checkpoint
 processor = AutoProcessor.from_pretrained("suno/bark-small")
 model = BarkModel.from_pretrained("suno/bark-small").to(device)