Spaces:

csukuangfj
/

test

Runtime error

App Files Community

csukuangfj committed on Jul 19, 2022

Commit

f1df253

•

1 Parent(s): 7459972

minor fixes

Browse files

Files changed (2) hide show

app.py +12 -1
model.py +8 -9

app.py CHANGED Viewed

@@ -159,8 +159,14 @@ def process(
     info = f"""
     Wave duration  : {duration: .3f} s <br/>
     Processing time: {end - start: .3f} s <br/>
-    RTF: {end - start: .3f}/{duration: .3f} = {(end - start)/duration:.3f} <br/>
     """
     logging.info(info)
     logging.info(f"hyp:\n{hyp}")
@@ -171,12 +177,17 @@ title = "# Automatic Speech Recognition with Next-gen Kaldi"
 description = """
 This space shows how to do automatic speech recognition with Next-gen Kaldi.
 See more information by visiting the following links:
 - <https://github.com/k2-fsa/icefall>
 - <https://github.com/k2-fsa/sherpa>
 - <https://github.com/k2-fsa/k2>
 - <https://github.com/lhotse-speech/lhotse>
 """
 # css style is copied from

     info = f"""
     Wave duration  : {duration: .3f} s <br/>
     Processing time: {end - start: .3f} s <br/>
+    RTF: {end - start: .3f}/{duration: .3f} = {rtf:.3f} <br/>
     """
+    if rtf > 1:
+        info += (
+            f"<br/>We are loading the model for the first run. "
+            "Please run again to measure the real RTF.<br/>"
+        )
     logging.info(info)
     logging.info(f"hyp:\n{hyp}")
 description = """
 This space shows how to do automatic speech recognition with Next-gen Kaldi.
+It is running on CPU within a docker container provided by Hugging Face.
 See more information by visiting the following links:
 - <https://github.com/k2-fsa/icefall>
 - <https://github.com/k2-fsa/sherpa>
 - <https://github.com/k2-fsa/k2>
 - <https://github.com/lhotse-speech/lhotse>
+If you want to deploy it locally, please see
+<https://k2-fsa.github.io/sherpa/>
 """
 # css style is copied from

model.py CHANGED Viewed

@@ -81,7 +81,7 @@ def _get_aishell2_pretrained_model(repo_id: str) -> OfflineAsr:
         "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12",  # noqa
         # context-size 2
         "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12",  # noqa
-    ]
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,
@@ -102,12 +102,11 @@ def _get_aishell2_pretrained_model(repo_id: str) -> OfflineAsr:
 def _get_gigaspeech_pre_trained_model(repo_id: str) -> OfflineAsr:
     assert repo_id in [
         "wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2",
-    ]
     nn_model_filename = _get_nn_model_filename(
-        # It is converted from https://huggingface.co/wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2  # noqa
-        repo_id="csukuangfj/icefall-asr-gigaspeech-pruned-transducer-stateless2",  # noqa
-        filename="cpu_jit-epoch-29-avg-11-torch-1.10.0.pt",
     )
     bpe_model_filename = _get_bpe_model_filename(repo_id=repo_id)
@@ -124,7 +123,7 @@ def _get_gigaspeech_pre_trained_model(repo_id: str) -> OfflineAsr:
 def _get_librispeech_pre_trained_model(repo_id: str) -> OfflineAsr:
     assert repo_id in [
         "csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13",  # noqa
-    ]
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,
@@ -145,7 +144,7 @@ def _get_librispeech_pre_trained_model(repo_id: str) -> OfflineAsr:
 def _get_wenetspeech_pre_trained_model(repo_id: str):
     assert repo_id in [
         "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
-    ]
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,
@@ -166,7 +165,7 @@ def _get_wenetspeech_pre_trained_model(repo_id: str):
 def _get_tal_csasr_pre_trained_model(repo_id: str):
     assert repo_id in [
         "luomingshuang/icefall_asr_tal-csasr_pruned_transducer_stateless5",
-    ]
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,
@@ -187,7 +186,7 @@ def _get_tal_csasr_pre_trained_model(repo_id: str):
 def _get_alimeeting_pre_trained_model(repo_id: str):
     assert repo_id in [
         "luomingshuang/icefall_asr_alimeeting_pruned_transducer_stateless2",
-    ]
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,

         "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12",  # noqa
         # context-size 2
         "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12",  # noqa
+    ], repo_id
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,
 def _get_gigaspeech_pre_trained_model(repo_id: str) -> OfflineAsr:
     assert repo_id in [
         "wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2",
+    ], repo_id
     nn_model_filename = _get_nn_model_filename(
+        repo_id=repo_id,
+        filename="cpu_jit-iter-3488000-avg-20.pt",
     )
     bpe_model_filename = _get_bpe_model_filename(repo_id=repo_id)
 def _get_librispeech_pre_trained_model(repo_id: str) -> OfflineAsr:
     assert repo_id in [
         "csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless3-2022-05-13",  # noqa
+    ], repo_id
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,
 def _get_wenetspeech_pre_trained_model(repo_id: str):
     assert repo_id in [
         "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
+    ], repo_id
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,
 def _get_tal_csasr_pre_trained_model(repo_id: str):
     assert repo_id in [
         "luomingshuang/icefall_asr_tal-csasr_pruned_transducer_stateless5",
+    ], repo_id
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,
 def _get_alimeeting_pre_trained_model(repo_id: str):
     assert repo_id in [
         "luomingshuang/icefall_asr_alimeeting_pruned_transducer_stateless2",
+    ], repo_id
     nn_model_filename = _get_nn_model_filename(
         repo_id=repo_id,