yerang committed on
Commit
4fb359e
1 Parent(s): 5ff5c15

Upload stf/test.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. stf/test.py +30 -0
stf/test.py ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Time a faster-whisper ``large-v3`` transcription of one dummy LibriSpeech clip.

The script loads the first sample of the ``hf-internal-testing/librispeech_asr_dummy``
validation split, transcribes it on CUDA in float16 with beam size 5, prints
every segment with its timestamps, and finally prints the elapsed wall-clock
seconds for the transcription.
"""
from time import time

from datasets import load_dataset
from faster_whisper import WhisperModel

# NOTE: an earlier variant of this script used transformers
# (WhisperProcessor / WhisperForConditionalGeneration, "openai/whisper-large-v3"
# on the "mps" device); it was already disabled and has been dropped here.

# Dataset and model files are both cached in the current working directory.
ds = load_dataset(
    "hf-internal-testing/librispeech_asr_dummy",
    "clean",
    split="validation",
    cache_dir=".",
)
model = WhisperModel(
    "large-v3",
    device="cuda",
    compute_type="float16",
    download_root=".",
)

audio_sample = ds[0]["audio"]
waveform = audio_sample["array"]
# NOTE(review): the raw array is passed to transcribe() without resampling;
# presumably faster-whisper expects 16 kHz input -- confirm that
# `sampling_rate` matches before using this with other datasets.
sampling_rate = audio_sample["sampling_rate"]

tic = time()
segments, info = model.transcribe(waveform, beam_size=5)
# transcribe() returns a lazy generator: decoding only happens while it is
# iterated. Materialise it here so the measured interval actually covers the
# transcription instead of just the call setup.
segments = list(segments)
toc = time()

for segment in segments:
    print(f"[{segment.start:.2f}s -> {segment.end:.2f}s] {segment.text}")
print(toc - tic)