csukuangfj committed on
Commit
e491b4f
1 Parent(s): 0edfdd4

add alimeeting model

Browse files
examples.py CHANGED
@@ -58,6 +58,27 @@ examples = [
58
  4,
59
  "./test_wavs/tibetan/a_0_cacm-A70_31117.wav",
60
  ],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
61
  # librispeech
62
  # https://huggingface.co/csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless5-2022-05-13/tree/main/test_wavs
63
  [
 
58
  4,
59
  "./test_wavs/tibetan/a_0_cacm-A70_31117.wav",
60
  ],
61
+ [
62
+ "Chinese",
63
+ "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7",
64
+ "greedy_search",
65
+ 4,
66
+ "./test_wavs/alimeeting/R8003_M8001-8004-165.wav",
67
+ ],
68
+ [
69
+ "Chinese",
70
+ "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7",
71
+ "greedy_search",
72
+ 4,
73
+ "./test_wavs/alimeeting/R8008_M8013-8049-74.wav",
74
+ ],
75
+ [
76
+ "Chinese",
77
+ "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7",
78
+ "greedy_search",
79
+ 4,
80
+ "./test_wavs/alimeeting/R8009_M8020_N_SPK8026-8026-209.wav",
81
+ ],
82
  # librispeech
83
  # https://huggingface.co/csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless5-2022-05-13/tree/main/test_wavs
84
  [
model.py CHANGED
@@ -311,12 +311,18 @@ def _get_alimeeting_pre_trained_model(
311
  num_active_paths: int,
312
  ):
313
  assert repo_id in [
 
314
  "luomingshuang/icefall_asr_alimeeting_pruned_transducer_stateless2",
315
  ], repo_id
316
 
 
 
 
 
 
317
  nn_model = _get_nn_model_filename(
318
  repo_id=repo_id,
319
- filename="cpu_jit_torch_1.7.1.pt",
320
  )
321
  tokens = _get_token_filename(repo_id=repo_id)
322
 
@@ -532,6 +538,7 @@ def _get_german_pre_trained_model(
532
 
533
  chinese_models = {
534
  "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
 
535
  "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12": _get_aishell2_pretrained_model, # noqa
536
  "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12": _get_aishell2_pretrained_model, # noqa
537
  "luomingshuang/icefall_asr_aidatatang-200zh_pruned_transducer_stateless2": _get_aidatatang_200zh_pretrained_mode, # noqa
 
311
  num_active_paths: int,
312
  ):
313
  assert repo_id in [
314
+ "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7",
315
  "luomingshuang/icefall_asr_alimeeting_pruned_transducer_stateless2",
316
  ], repo_id
317
 
318
+ if repo_id == "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7":
319
+ filename = "cpu_jit.pt"
320
+ elif repo_id == "luomingshuang/icefall_asr_alimeeting_pruned_transducer_stateless2":
321
+ filename = "cpu_jit_torch_1.7.1.pt"
322
+
323
  nn_model = _get_nn_model_filename(
324
  repo_id=repo_id,
325
+ filename=filename,
326
  )
327
  tokens = _get_token_filename(repo_id=repo_id)
328
 
 
538
 
539
  chinese_models = {
540
  "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
541
+ "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7": _get_alimeeting_pre_trained_model,
542
  "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12": _get_aishell2_pretrained_model, # noqa
543
  "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12": _get_aishell2_pretrained_model, # noqa
544
  "luomingshuang/icefall_asr_aidatatang-200zh_pruned_transducer_stateless2": _get_aidatatang_200zh_pretrained_mode, # noqa
test_wavs/alimeeting/R8003_M8001-8004-165.wav ADDED
Binary file (525 kB). View file
 
test_wavs/alimeeting/R8008_M8013-8049-74.wav ADDED
Binary file (241 kB). View file
 
test_wavs/alimeeting/R8009_M8020_N_SPK8026-8026-209.wav ADDED
Binary file (309 kB). View file
 
test_wavs/alimeeting/trans.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ R8009_M8020_N_SPK8026-8026-209 并不是说一天的话就一定要对一个人进行一个了解这样的话
2
+ R8003_M8001-8004-165 如果他要是不愿意提供地址也不愿意接收礼物那么第二个这个分支可能就省省下了
3
+ R8008_M8013-8049-74 面试的话五月五号到五月十号吧面试