Spaces:
Build error
Build error
Commit
·
10536c6
1
Parent(s):
5c7281e
add nemo models
Browse files
model.py
CHANGED
|
@@ -987,6 +987,82 @@ def _get_french_pre_trained_model(
|
|
| 987 |
return recognizer
|
| 988 |
|
| 989 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 990 |
@lru_cache(maxsize=10)
|
| 991 |
def _get_sherpa_onnx_offline_zipformer_pre_trained_model(
|
| 992 |
repo_id: str,
|
|
@@ -1505,6 +1581,8 @@ english_models = {
|
|
| 1505 |
"whisper-tiny.en": _get_whisper_model,
|
| 1506 |
"whisper-base.en": _get_whisper_model,
|
| 1507 |
"whisper-small.en": _get_whisper_model,
|
|
|
|
|
|
|
| 1508 |
# "whisper-medium.en": _get_whisper_model,
|
| 1509 |
"csukuangfj/sherpa-onnx-zipformer-en-libriheavy-20230926-large": _get_sherpa_onnx_offline_zipformer_pre_trained_model,
|
| 1510 |
"csukuangfj/sherpa-onnx-zipformer-en-libriheavy-20230926-medium": _get_sherpa_onnx_offline_zipformer_pre_trained_model,
|
|
|
|
| 987 |
return recognizer
|
| 988 |
|
| 989 |
|
| 990 |
+
@lru_cache(maxsize=10)
def _get_sherpa_onnx_nemo_transducer_models(
    repo_id: str,
    decoding_method: str,
    num_active_paths: int,
) -> sherpa_onnx.OfflineRecognizer:
    """Create a non-streaming recognizer for a NeMo transducer model.

    The result is memoized by ``lru_cache`` on the
    ``(repo_id, decoding_method, num_active_paths)`` triple, so repeated
    requests with the same settings reuse one recognizer instance.

    Args:
      repo_id:
        Model repository identifier. Must be one of the repositories listed
        in the assertion below.
      decoding_method:
        Forwarded unchanged to the recognizer as ``decoding_method``.
      num_active_paths:
        Forwarded to the recognizer as ``max_active_paths``.

    Returns:
      A ``sherpa_onnx.OfflineRecognizer`` built from the encoder, decoder,
      joiner and token files of ``repo_id``.

    Raises:
      AssertionError: If ``repo_id`` is not a supported repository.
    """
    assert repo_id in [
        "csukuangfj/sherpa-onnx-nemo-parakeet_tdt_transducer_110m-en-36000",
    ], repo_id

    encoder_model = _get_nn_model_filename(
        repo_id=repo_id,
        filename="encoder.onnx",
        subfolder=".",
    )

    decoder_model = _get_nn_model_filename(
        repo_id=repo_id,
        filename="decoder.onnx",
        subfolder=".",
    )

    joiner_model = _get_nn_model_filename(
        repo_id=repo_id,
        filename="joiner.onnx",
        subfolder=".",
    )

    tokens = _get_token_filename(repo_id=repo_id, subfolder=".")

    # This model is registered alongside the other offline recognizers, so it
    # has to be created with the offline API; the streaming
    # ``OnlineRecognizer`` is the wrong class for it. ``model_type`` tells
    # sherpa-onnx to treat the files as a NeMo transducer export.
    recognizer = sherpa_onnx.OfflineRecognizer.from_transducer(
        tokens=tokens,
        encoder=encoder_model,
        decoder=decoder_model,
        joiner=joiner_model,
        num_threads=2,
        sample_rate=16000,
        feature_dim=80,
        model_type="nemo_transducer",
        decoding_method=decoding_method,
        max_active_paths=num_active_paths,
    )

    return recognizer
|
| 1033 |
+
|
| 1034 |
+
|
| 1035 |
+
@lru_cache(maxsize=10)
def _get_sherpa_onnx_nemo_ctc_models(
    repo_id: str,
    decoding_method: str,
    num_active_paths: int,
) -> sherpa_onnx.OfflineRecognizer:
    """Create a non-streaming recognizer for a NeMo CTC model.

    The result is memoized by ``lru_cache`` on the
    ``(repo_id, decoding_method, num_active_paths)`` triple.

    Args:
      repo_id:
        Model repository identifier. Must be one of the repositories listed
        in the assertion below.
      decoding_method:
        Forwarded unchanged to the recognizer as ``decoding_method``.
      num_active_paths:
        Not used by this factory. It is kept so that every model factory in
        the dispatch table can be called with the same three arguments.

    Returns:
      A ``sherpa_onnx.OfflineRecognizer`` built from ``model.onnx`` and the
      token file of ``repo_id``.

    Raises:
      AssertionError: If ``repo_id`` is not a supported repository.
    """
    assert repo_id in [
        "csukuangfj/sherpa-onnx-nemo-parakeet_tdt_ctc_110m-en-36000",
    ], repo_id

    model = _get_nn_model_filename(
        repo_id=repo_id,
        filename="model.onnx",
        subfolder=".",
    )

    tokens = _get_token_filename(repo_id=repo_id, subfolder=".")

    # ``from_nemo_ctc`` has no ``max_active_paths`` parameter, so passing it
    # would fail with ``TypeError`` before the recognizer is created.
    # NOTE(review): CTC decoding in sherpa-onnx presumably supports only
    # "greedy_search"; confirm whether ``decoding_method`` should be
    # forwarded at all.
    recognizer = sherpa_onnx.OfflineRecognizer.from_nemo_ctc(
        tokens=tokens,
        model=model,
        num_threads=2,
        sample_rate=16000,
        feature_dim=80,
        decoding_method=decoding_method,
    )

    return recognizer
|
| 1064 |
+
|
| 1065 |
+
|
| 1066 |
@lru_cache(maxsize=10)
|
| 1067 |
def _get_sherpa_onnx_offline_zipformer_pre_trained_model(
|
| 1068 |
repo_id: str,
|
|
|
|
| 1581 |
"whisper-tiny.en": _get_whisper_model,
|
| 1582 |
"whisper-base.en": _get_whisper_model,
|
| 1583 |
"whisper-small.en": _get_whisper_model,
|
| 1584 |
+
"csukuangfj/sherpa-onnx-nemo-parakeet_tdt_ctc_110m-en-36000": _get_sherpa_onnx_nemo_ctc_models,
|
| 1585 |
+
"csukuangfj/sherpa-onnx-nemo-parakeet_tdt_transducer_110m-en-36000": _get_sherpa_onnx_nemo_transducer_models,
|
| 1586 |
# "whisper-medium.en": _get_whisper_model,
|
| 1587 |
"csukuangfj/sherpa-onnx-zipformer-en-libriheavy-20230926-large": _get_sherpa_onnx_offline_zipformer_pre_trained_model,
|
| 1588 |
"csukuangfj/sherpa-onnx-zipformer-en-libriheavy-20230926-medium": _get_sherpa_onnx_offline_zipformer_pre_trained_model,
|