kotoba-tech
/

kotoba-whisper-v1.0

Automatic Speech Recognition

hf-asr-leaderboard

Model card · Files and versions

asahi417 committed on May 8, 2024

Commit

c814d59

·

verified ·

1 Parent(s): 87ac8c4

Update benchmark.py

Files changed (1) hide show

benchmark.py +6 -3

benchmark.py CHANGED Viewed

@@ -4,16 +4,19 @@ from transformers import pipeline
 from datasets import load_dataset
 # config
-model_id = "kotoba-tech/kotoba-whisper-v1.0"
 generate_kwargs = {"language": "japanese", "task": "transcribe"}
 # load model
 pipe = pipeline(
     "automatic-speech-recognition",
     model=model_id,
-    chunk_length_s=15,
-    batch_size=64
 )
 test_audio = [
     "kotoba-whisper-eval/audio/long_interview_1.wav",
     "kotoba-whisper-eval/audio/manzai1.wav",

 from datasets import load_dataset
 # config
 generate_kwargs = {"language": "japanese", "task": "transcribe"}
+model_id = "kotoba-tech/kotoba-whisper-v1.0"
+torch_dtype = torch.float32
+device = "cpu"
 # load model
 pipe = pipeline(
     "automatic-speech-recognition",
     model=model_id,
+    torch_dtype=torch_dtype,
+    device=device,
 )
 test_audio = [
     "kotoba-whisper-eval/audio/long_interview_1.wav",
     "kotoba-whisper-eval/audio/manzai1.wav",