lewtun HF staff committed on
Commit
b4b1070
1 Parent(s): 11e5015

commit files to HF hub

Browse files
.gitattributes CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ datasets:
3
+ - superb
4
+ tags:
5
+ - library:s3prl
6
+ - benchmark:superb
7
+ - type:model
8
+ ---
9
+
10
+ # Fine-tuned s3prl model
11
+
12
+ Upstream Model: superb-test-org/test-submission-with-example-expert
13
+
14
+ ## Model description
15
+
16
+ [More information needed]
17
+
18
+ ## Intended uses & limitations
19
+
20
+ [More information needed]
21
+
22
+ ## How to use
23
+
24
+ [More information needed]
25
+
26
+ ## Limitations and bias
27
+
28
+ [More information needed]
29
+
30
+ ## Training data
31
+
32
+ [More information needed]
33
+
34
+ ## Training procedure
35
+
36
+ [More information needed]
37
+
38
+ ## Evaluation results
39
+
40
+ [More information needed]
41
+
asr/asr_lr01/README.md ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: superb
3
+ benchmark: superb
4
+ task: asr
5
+ datasets:
6
+ - superb
7
+ tags:
8
+ - automatic-speech-recognition
9
+ - ${upstream_model}
10
+ widget:
11
+ - label: Librispeech sample 1
12
+ src: https://cdn-media.huggingface.co/speech_samples/sample1.flac
13
+ ---
14
+
15
+ # Fine-tuned s3prl model for ASR
asr/asr_lr01/args_2021-09-24-18-59-50.yaml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ auto_resume: false
2
+ backend: nccl
3
+ cache_dir: null
4
+ config: ./downstream/asr/config.yaml
5
+ device: cuda
6
+ disable_cudnn: false
7
+ downstream: asr
8
+ downstream_variant: null
9
+ evaluate_split: test
10
+ expdir: result/downstream/asr_lr01
11
+ expname: asr_lr01
12
+ from_hf_hub: true
13
+ hf_hub_org: superb
14
+ hub: huggingface
15
+ init_ckpt: null
16
+ local_rank: null
17
+ mode: train
18
+ override: config.downstream_expert.datarc.libri_root='/data/lewis/superb/LibriSpeech',,config.downstream_expert.datarc.bucket_file='/data/lewis/superb/LibriSpeech/len_for_bucket',,config.runner.total_steps=10,,config.runner.save_step=5
19
+ past_exp: null
20
+ push_to_hf_hub: 'True'
21
+ seed: 1337
22
+ upstream: superb-test-org/test-submission-with-weights
23
+ upstream_ckpt: null
24
+ upstream_feature_selection: hidden_states
25
+ upstream_layer_selection: null
26
+ upstream_model_config: null
27
+ upstream_model_name: model.pt
28
+ upstream_refresh: false
29
+ upstream_trainable: false
30
+ verbose: false
asr/asr_lr01/args_2021-09-24-19-59-45.yaml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ auto_resume: false
2
+ backend: nccl
3
+ cache_dir: null
4
+ config: ./downstream/asr/config.yaml
5
+ device: cuda
6
+ disable_cudnn: false
7
+ downstream: asr
8
+ downstream_variant: null
9
+ evaluate_split: test
10
+ expdir: result/downstream/asr_lr01
11
+ expname: asr_lr01
12
+ from_hf_hub: true
13
+ hf_hub_org: superb
14
+ hub: huggingface
15
+ init_ckpt: null
16
+ local_rank: null
17
+ mode: train
18
+ override: config.downstream_expert.datarc.libri_root='/data/lewis/superb/LibriSpeech',,config.downstream_expert.datarc.bucket_file='/data/lewis/superb/LibriSpeech/len_for_bucket',,config.runner.total_steps=10,,config.runner.save_step=5
19
+ past_exp: null
20
+ push_to_hf_hub: 'True'
21
+ seed: 1337
22
+ upstream: superb-test-org/test-submission-with-example-expert
23
+ upstream_ckpt: null
24
+ upstream_feature_selection: hidden_states
25
+ upstream_layer_selection: null
26
+ upstream_model_config: null
27
+ upstream_model_name: model.pt
28
+ upstream_refresh: false
29
+ upstream_trainable: false
30
+ verbose: false
asr/asr_lr01/char.dict ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ | 1980202
2
+ E 1091870
3
+ T 789572
4
+ A 689048
5
+ O 647720
6
+ N 591778
7
+ I 585614
8
+ H 557204
9
+ S 545238
10
+ R 499568
11
+ D 380912
12
+ L 344952
13
+ U 242014
14
+ M 217730
15
+ C 210734
16
+ W 204598
17
+ F 195086
18
+ G 174098
19
+ Y 168548
20
+ P 146722
21
+ B 129608
22
+ V 81496
23
+ K 65070
24
+ ' 19660
25
+ X 12530
26
+ J 12062
27
+ Q 8164
28
+ Z 4916
asr/asr_lr01/config_2021-09-24-18-59-50.yaml ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ downstream_expert:
2
+ datarc:
3
+ batch_size: 32
4
+ bucket_file: /data/lewis/superb/LibriSpeech/len_for_bucket
5
+ decoder_args:
6
+ beam: 5
7
+ beam_threshold: 25
8
+ criterion: ctc
9
+ decoder_type: None
10
+ kenlm_model: /path/to/KenLM
11
+ lexicon: /path/to/4-gram.arpa
12
+ lm_weight: 2
13
+ nbest: 1
14
+ sil_weight: 0
15
+ unk_weight: -math.inf
16
+ word_score: -1
17
+ dev-clean:
18
+ - dev-clean
19
+ dev-other:
20
+ - dev-other
21
+ dict_path: ./downstream/asr/char.dict
22
+ eval_batch_size: 1
23
+ libri_root: /data/lewis/superb/LibriSpeech
24
+ num_workers: 12
25
+ test-clean:
26
+ - test-clean
27
+ test-other:
28
+ - test-other
29
+ train:
30
+ - train-clean-100
31
+ train_batch_size: 32
32
+ zero_infinity: true
33
+ modelrc:
34
+ RNNs:
35
+ bidirection: true
36
+ dim:
37
+ - 1024
38
+ - 1024
39
+ dropout:
40
+ - 0.2
41
+ - 0.2
42
+ layer_norm:
43
+ - false
44
+ - false
45
+ module: LSTM
46
+ proj:
47
+ - false
48
+ - false
49
+ sample_rate:
50
+ - 1
51
+ - 1
52
+ sample_style: concat
53
+ total_rate: -1
54
+ Wav2Letter:
55
+ total_rate: 320
56
+ project_dim: 1024
57
+ select: RNNs
58
+ optimizer:
59
+ lr: 0.0001
60
+ name: TorchOptim
61
+ torch_optim_name: Adam
62
+ runner:
63
+ eval_dataloaders:
64
+ - dev-clean
65
+ eval_step: 2000
66
+ gradient_accumulate_steps: 1
67
+ gradient_clipping: 1
68
+ log_step: 100
69
+ max_keep: 1
70
+ save_step: 5
71
+ total_steps: 10
72
+ specaug:
73
+ apply_freq_mask: true
74
+ apply_time_mask: true
75
+ apply_time_warp: true
76
+ freq_mask_width_range:
77
+ - 0
78
+ - 50
79
+ num_freq_mask: 4
80
+ num_time_mask: 2
81
+ time_mask_width_range:
82
+ - 0
83
+ - 40
84
+ time_warp_window: 5
asr/asr_lr01/config_2021-09-24-19-59-45.yaml ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ downstream_expert:
2
+ datarc:
3
+ batch_size: 32
4
+ bucket_file: /data/lewis/superb/LibriSpeech/len_for_bucket
5
+ decoder_args:
6
+ beam: 5
7
+ beam_threshold: 25
8
+ criterion: ctc
9
+ decoder_type: None
10
+ kenlm_model: /path/to/KenLM
11
+ lexicon: /path/to/4-gram.arpa
12
+ lm_weight: 2
13
+ nbest: 1
14
+ sil_weight: 0
15
+ unk_weight: -math.inf
16
+ word_score: -1
17
+ dev-clean:
18
+ - dev-clean
19
+ dev-other:
20
+ - dev-other
21
+ dict_path: ./downstream/asr/char.dict
22
+ eval_batch_size: 1
23
+ libri_root: /data/lewis/superb/LibriSpeech
24
+ num_workers: 12
25
+ test-clean:
26
+ - test-clean
27
+ test-other:
28
+ - test-other
29
+ train:
30
+ - train-clean-100
31
+ train_batch_size: 32
32
+ zero_infinity: true
33
+ modelrc:
34
+ RNNs:
35
+ bidirection: true
36
+ dim:
37
+ - 1024
38
+ - 1024
39
+ dropout:
40
+ - 0.2
41
+ - 0.2
42
+ layer_norm:
43
+ - false
44
+ - false
45
+ module: LSTM
46
+ proj:
47
+ - false
48
+ - false
49
+ sample_rate:
50
+ - 1
51
+ - 1
52
+ sample_style: concat
53
+ total_rate: -1
54
+ Wav2Letter:
55
+ total_rate: 320
56
+ project_dim: 1024
57
+ select: RNNs
58
+ optimizer:
59
+ lr: 0.0001
60
+ name: TorchOptim
61
+ torch_optim_name: Adam
62
+ runner:
63
+ eval_dataloaders:
64
+ - dev-clean
65
+ eval_step: 2000
66
+ gradient_accumulate_steps: 1
67
+ gradient_clipping: 1
68
+ log_step: 100
69
+ max_keep: 1
70
+ save_step: 5
71
+ total_steps: 10
72
+ specaug:
73
+ apply_freq_mask: true
74
+ apply_time_mask: true
75
+ apply_time_warp: true
76
+ freq_mask_width_range:
77
+ - 0
78
+ - 50
79
+ num_freq_mask: 4
80
+ num_time_mask: 2
81
+ time_mask_width_range:
82
+ - 0
83
+ - 40
84
+ time_warp_window: 5
asr/asr_lr01/events.out.tfevents.1632502799.vorace ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6a353ec80108ab9875ffb6037ba9ee749d688e38355ffbac51e617066ad53dd
3
+ size 40
asr/asr_lr01/events.out.tfevents.1632506421.vorace ADDED
File without changes
asr/asr_lr01/model.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92d9a9f55e0073badbe9464012212a5a48e8a9c24c0f9deda3157899b8736b0d
3
+ size 513965839
asr/asr_lr01/model.py ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from s3prl.downstream.runner import Runner
2
+ from typing import Dict
3
+ import torch
4
+ import os
5
+
6
+
7
class PreTrainedModel(Runner):
    """s3prl downstream ``Runner`` wrapper for ASR inference.

    Loads a fine-tuned checkpoint (``model.ckpt``) together with its
    character dictionary (``char.dict``) from *path*, and exposes a simple
    ``__call__`` API that maps a raw waveform to the transcribed text.
    """

    def __init__(self, path=""):
        """
        Initialize downstream model.

        Args:
            path: Directory containing ``model.ckpt`` and ``char.dict``.
        """
        ckp_file = os.path.join(path, "model.ckpt")
        # NOTE(review): torch.load unpickles arbitrary objects — only load
        # checkpoints from trusted sources.
        ckp = torch.load(ckp_file, map_location='cpu')
        # Rewire the saved args so the Runner restores this exact checkpoint
        # on CPU in inference mode.
        ckp["Args"].init_ckpt = ckp_file
        ckp["Args"].mode = "inference"
        ckp["Args"].device = "cpu"
        # The dict path stored in the checkpoint points at the training
        # machine; redirect it to the copy shipped next to the checkpoint.
        ckp["Config"]["downstream_expert"]["datarc"]["dict_path"] = os.path.join(path, 'char.dict')

        # Idiomatic super() call instead of explicit Runner.__init__(self, ...).
        super().__init__(ckp["Args"], ckp["Config"])

    def __call__(self, inputs) -> Dict[str, str]:
        """
        Args:
            inputs (:obj:`np.array`):
                The raw waveform of audio received. By default at 16KHz.
        Return:
            A :obj:`dict` like ``{"text": "XXX"}`` containing the detected
            text from the input audio.
        """
        # Put every sub-module (upstream, featurizer, downstream) in eval mode.
        for entry in self.all_entries:
            entry.model.eval()

        inputs = [torch.FloatTensor(inputs)]

        with torch.no_grad():
            features = self.upstream.model(inputs)
            features = self.featurizer.model(inputs, features)
            preds = self.downstream.model.inference(features, [])
        return {"text": preds[0]}