Spaces:

MERaLiON
/

AudioBench-Leaderboard

Running

App Files Community

zhuohan-7 committed on Aug 29

Commit

8a77d82

•

1 Parent(s): b2caef0

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +18 -0
examples/AC/AudioCaps-Test/data-00000-of-00001.arrow +3 -0
examples/AC/AudioCaps-Test/dataset_info.json +142 -0
examples/AC/AudioCaps-Test/sample_0.wav +0 -0
examples/AC/AudioCaps-Test/sample_1.wav +0 -0
examples/AC/AudioCaps-Test/sample_2.wav +0 -0
examples/AC/AudioCaps-Test/state.json +23 -0
examples/AC/WavCaps-Test/data-00000-of-00001.arrow +3 -0
examples/AC/WavCaps-Test/dataset_info.json +138 -0
examples/AC/WavCaps-Test/sample_0.wav +0 -0
examples/AC/WavCaps-Test/sample_1.wav +0 -0
examples/AC/WavCaps-Test/sample_2.wav +0 -0
examples/AC/WavCaps-Test/state.json +23 -0
examples/AR/VoxCeleb-Accent-Test/data-00000-of-00001.arrow +3 -0
examples/AR/VoxCeleb-Accent-Test/dataset_info.json +150 -0
examples/AR/VoxCeleb-Accent-Test/sample_0.wav +0 -0
examples/AR/VoxCeleb-Accent-Test/sample_1.wav +0 -0
examples/AR/VoxCeleb-Accent-Test/sample_2.wav +0 -0
examples/AR/VoxCeleb-Accent-Test/state.json +23 -0
examples/ASQA/AudioCaps-QA-Test/data-00000-of-00001.arrow +3 -0
examples/ASQA/AudioCaps-QA-Test/dataset_info.json +146 -0
examples/ASQA/AudioCaps-QA-Test/sample_0.wav +0 -0
examples/ASQA/AudioCaps-QA-Test/sample_1.wav +0 -0
examples/ASQA/AudioCaps-QA-Test/sample_2.wav +0 -0
examples/ASQA/AudioCaps-QA-Test/state.json +23 -0
examples/ASQA/Clotho-AQA-Test/data-00000-of-00001.arrow +3 -0
examples/ASQA/Clotho-AQA-Test/dataset_info.json +129 -0
examples/ASQA/Clotho-AQA-Test/sample_0.wav +0 -0
examples/ASQA/Clotho-AQA-Test/sample_1.wav +0 -0
examples/ASQA/Clotho-AQA-Test/sample_2.wav +0 -0
examples/ASQA/Clotho-AQA-Test/state.json +23 -0
examples/ASQA/WavCaps-QA-Test/data-00000-of-00001.arrow +3 -0
examples/ASQA/WavCaps-QA-Test/dataset_info.json +142 -0
examples/ASQA/WavCaps-QA-Test/sample_0.wav +0 -0
examples/ASQA/WavCaps-QA-Test/sample_1.wav +0 -0
examples/ASQA/WavCaps-QA-Test/sample_2.wav +0 -0
examples/ASQA/WavCaps-QA-Test/state.json +23 -0
examples/ASR/Common-Voice-15-En-Test/data-00000-of-00001.arrow +3 -0
examples/ASR/Common-Voice-15-En-Test/dataset_info.json +170 -0
examples/ASR/Common-Voice-15-En-Test/sample_0.wav +0 -0
examples/ASR/Common-Voice-15-En-Test/sample_1.wav +0 -0
examples/ASR/Common-Voice-15-En-Test/sample_2.wav +0 -0
examples/ASR/Common-Voice-15-En-Test/state.json +23 -0
examples/ASR/Earnings21-Test/data-00000-of-00001.arrow +3 -0
examples/ASR/Earnings21-Test/dataset_info.json +134 -0
examples/ASR/Earnings21-Test/sample_0.wav +3 -0
examples/ASR/Earnings21-Test/sample_1.wav +3 -0
examples/ASR/Earnings21-Test/sample_2.wav +3 -0
examples/ASR/Earnings21-Test/state.json +23 -0
examples/ASR/Earnings22-Test/data-00000-of-00001.arrow +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,21 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 scale-hf-logo.png filter=lfs diff=lfs merge=lfs -text

 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 scale-hf-logo.png filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Earnings21-Test/sample_0.wav filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Earnings21-Test/sample_1.wav filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Earnings21-Test/sample_2.wav filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Earnings22-Test/sample_0.wav filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Earnings22-Test/sample_1.wav filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Earnings22-Test/sample_2.wav filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Tedlium3-Longform-Test/sample_0.wav filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Tedlium3-Longform-Test/sample_1.wav filter=lfs diff=lfs merge=lfs -text
+examples/ASR/Tedlium3-Longform-Test/sample_2.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/DREAM-TTS-MCQ-Test/sample_0.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/Public-SG-Speech-QA-Test/sample_0.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/Public-SG-Speech-QA-Test/sample_1.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/SLUE-P2-SQA5-Test/sample_0.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/SLUE-P2-SQA5-Test/sample_1.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/SLUE-P2-SQA5-Test/sample_2.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/Spoken-Squad-v1/sample_0.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/Spoken-Squad-v1/sample_1.wav filter=lfs diff=lfs merge=lfs -text
+examples/SQA/Spoken-Squad-v1/sample_2.wav filter=lfs diff=lfs merge=lfs -text

examples/AC/AudioCaps-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff53d7bcff873fea97f02e971836f24adfbfba9ebdcfc7554423bf65cb110e1d
+size 970312

examples/AC/AudioCaps-Test/dataset_info.json ADDED Viewed

	@@ -0,0 +1,142 @@

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "context": {
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "audio": {
+        "sampling_rate": 16000,
+        "_type": "Audio"
+      }
+    },
+    "instruction": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "answer": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "other_attributes": {
+      "audiocap_id": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "start_time": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "youtube_id": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "salmonn_7b": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "wavllm_fairseq": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "Qwen2-Audio-7B-Instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "whisper_large_v3_with_llama_3_8b_instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "qwen_audio_chat": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

examples/AC/AudioCaps-Test/sample_0.wav ADDED Viewed

Binary file (320 kB). View file

examples/AC/AudioCaps-Test/sample_1.wav ADDED Viewed

Binary file (320 kB). View file

examples/AC/AudioCaps-Test/sample_2.wav ADDED Viewed

Binary file (320 kB). View file

examples/AC/AudioCaps-Test/state.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "0e301916c3676d35",
+  "_format_columns": [
+    "context",
+    "instruction",
+    "answer",
+    "other_attributes",
+    "salmonn_7b",
+    "wavllm_fairseq",
+    "Qwen2-Audio-7B-Instruct",
+    "whisper_large_v3_with_llama_3_8b_instruct",
+    "qwen_audio_chat"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

examples/AC/WavCaps-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c824145183da91da498c0338860b6daeaed94d7c619ec9ae22a041918c61c902
+size 985360

examples/AC/WavCaps-Test/dataset_info.json ADDED Viewed

	@@ -0,0 +1,138 @@

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "context": {
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "audio": {
+        "sampling_rate": 16000,
+        "_type": "Audio"
+      }
+    },
+    "instruction": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "answer": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "other_attributes": {
+      "audio_path": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "duration": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "salmonn_7b": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "wavllm_fairseq": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "Qwen2-Audio-7B-Instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "whisper_large_v3_with_llama_3_8b_instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "qwen_audio_chat": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

examples/AC/WavCaps-Test/sample_0.wav ADDED Viewed

Binary file (559 kB). View file

examples/AC/WavCaps-Test/sample_1.wav ADDED Viewed

Binary file (129 kB). View file

examples/AC/WavCaps-Test/sample_2.wav ADDED Viewed

Binary file (287 kB). View file

examples/AC/WavCaps-Test/state.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "1e570096603c2a32",
+  "_format_columns": [
+    "context",
+    "instruction",
+    "answer",
+    "other_attributes",
+    "salmonn_7b",
+    "wavllm_fairseq",
+    "Qwen2-Audio-7B-Instruct",
+    "whisper_large_v3_with_llama_3_8b_instruct",
+    "qwen_audio_chat"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

examples/AR/VoxCeleb-Accent-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1c07c0e241fb703dda0b7544925d0ca59bba57417daa5e08727a9edd9312e64
+size 578840

examples/AR/VoxCeleb-Accent-Test/dataset_info.json ADDED Viewed

	@@ -0,0 +1,150 @@

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "context": {
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "audio": {
+        "sampling_rate": 16000,
+        "_type": "Audio"
+      }
+    },
+    "instruction": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "answer": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "other_attributes": {
+      "Gender": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "Nationality": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "VGGFace1 ID": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "VoxCeleb1 ID": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "index": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "salmonn_7b": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "wavllm_fairseq": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "Qwen2-Audio-7B-Instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "whisper_large_v3_with_llama_3_8b_instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "qwen_audio_chat": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

examples/AR/VoxCeleb-Accent-Test/sample_0.wav ADDED Viewed

Binary file (209 kB). View file

examples/AR/VoxCeleb-Accent-Test/sample_1.wav ADDED Viewed

Binary file (227 kB). View file

examples/AR/VoxCeleb-Accent-Test/sample_2.wav ADDED Viewed

Binary file (134 kB). View file

examples/AR/VoxCeleb-Accent-Test/state.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "7017504c8eeb5d71",
+  "_format_columns": [
+    "context",
+    "instruction",
+    "answer",
+    "other_attributes",
+    "salmonn_7b",
+    "wavllm_fairseq",
+    "Qwen2-Audio-7B-Instruct",
+    "whisper_large_v3_with_llama_3_8b_instruct",
+    "qwen_audio_chat"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

examples/ASQA/AudioCaps-QA-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:42f33a60a23ffc8fce090307d530ef03b2b8cf9852fa70418e76ed6a1d5dd978
+size 954480

examples/ASQA/AudioCaps-QA-Test/dataset_info.json ADDED Viewed

	@@ -0,0 +1,146 @@

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "context": {
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "audio": {
+        "sampling_rate": 16000,
+        "_type": "Audio"
+      }
+    },
+    "instruction": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "answer": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "other_attributes": {
+      "audiocap_id": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "caption": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "start_time": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "youtube_id": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "salmonn_7b": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "wavllm_fairseq": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "Qwen2-Audio-7B-Instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "whisper_large_v3_with_llama_3_8b_instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "qwen_audio_chat": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

examples/ASQA/AudioCaps-QA-Test/sample_0.wav ADDED Viewed

Binary file (320 kB). View file

examples/ASQA/AudioCaps-QA-Test/sample_1.wav ADDED Viewed

Binary file (304 kB). View file

examples/ASQA/AudioCaps-QA-Test/sample_2.wav ADDED Viewed

Binary file (320 kB). View file

examples/ASQA/AudioCaps-QA-Test/state.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "b4d0bc420173574a",
+  "_format_columns": [
+    "context",
+    "instruction",
+    "answer",
+    "other_attributes",
+    "salmonn_7b",
+    "wavllm_fairseq",
+    "Qwen2-Audio-7B-Instruct",
+    "whisper_large_v3_with_llama_3_8b_instruct",
+    "qwen_audio_chat"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

examples/ASQA/Clotho-AQA-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a76c13e88e89bb39d6a4dedc9f3bb30e128cdaaa5f68d8c0e1d804d9af5cbf68
+size 2181384

examples/ASQA/Clotho-AQA-Test/dataset_info.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "context": {
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "audio": {
+        "sampling_rate": 16000,
+        "_type": "Audio"
+      }
+    },
+    "instruction": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "answer": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "other_attributes": {},
+    "salmonn_7b": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "wavllm_fairseq": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "Qwen2-Audio-7B-Instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "whisper_large_v3_with_llama_3_8b_instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "qwen_audio_chat": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

examples/ASQA/Clotho-AQA-Test/sample_0.wav ADDED Viewed

Binary file (868 kB). View file

examples/ASQA/Clotho-AQA-Test/sample_1.wav ADDED Viewed

Binary file (668 kB). View file

examples/ASQA/Clotho-AQA-Test/sample_2.wav ADDED Viewed

Binary file (636 kB). View file

examples/ASQA/Clotho-AQA-Test/state.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "3f05c76553bf311d",
+  "_format_columns": [
+    "context",
+    "instruction",
+    "answer",
+    "other_attributes",
+    "salmonn_7b",
+    "wavllm_fairseq",
+    "Qwen2-Audio-7B-Instruct",
+    "whisper_large_v3_with_llama_3_8b_instruct",
+    "qwen_audio_chat"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

examples/ASQA/WavCaps-QA-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:183517b37463c54c088f5e1011721003d14587380bc111e8ad7f7cfc60fcd9e5
+size 970376

examples/ASQA/WavCaps-QA-Test/dataset_info.json ADDED Viewed

	@@ -0,0 +1,142 @@

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "context": {
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "audio": {
+        "sampling_rate": 16000,
+        "_type": "Audio"
+      }
+    },
+    "instruction": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "answer": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "other_attributes": {
+      "audio_path": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "caption": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "duration": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "salmonn_7b": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "wavllm_fairseq": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "Qwen2-Audio-7B-Instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "whisper_large_v3_with_llama_3_8b_instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "qwen_audio_chat": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

examples/ASQA/WavCaps-QA-Test/sample_0.wav ADDED Viewed

Binary file (320 kB). View file

examples/ASQA/WavCaps-QA-Test/sample_1.wav ADDED Viewed

Binary file (320 kB). View file

examples/ASQA/WavCaps-QA-Test/sample_2.wav ADDED Viewed

Binary file (320 kB). View file

examples/ASQA/WavCaps-QA-Test/state.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "f88396310248e252",
+  "_format_columns": [
+    "context",
+    "instruction",
+    "answer",
+    "other_attributes",
+    "salmonn_7b",
+    "wavllm_fairseq",
+    "Qwen2-Audio-7B-Instruct",
+    "whisper_large_v3_with_llama_3_8b_instruct",
+    "qwen_audio_chat"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

examples/ASR/Common-Voice-15-En-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:44587f333a31075993f3cc8832f8946fd59605246769dd8bf86887dcf3bd889c
+size 543912

examples/ASR/Common-Voice-15-En-Test/dataset_info.json ADDED Viewed

	@@ -0,0 +1,170 @@

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "context": {
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "audio": {
+        "sampling_rate": 16000,
+        "_type": "Audio"
+      }
+    },
+    "instruction": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "answer": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "other_attributes": {
+      "accents": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "age": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "client_id": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "down_votes": {
+        "dtype": "int64",
+        "_type": "Value"
+      },
+      "gender": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "language": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "locale": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "segment": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "up_votes": {
+        "dtype": "int64",
+        "_type": "Value"
+      },
+      "variant": {
+        "dtype": "null",
+        "_type": "Value"
+      }
+    },
+    "salmonn_7b": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "wavllm_fairseq": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "Qwen2-Audio-7B-Instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "whisper_large_v3_with_llama_3_8b_instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "qwen_audio_chat": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

examples/ASR/Common-Voice-15-En-Test/sample_0.wav ADDED Viewed

Binary file (202 kB). View file

examples/ASR/Common-Voice-15-En-Test/sample_1.wav ADDED Viewed

Binary file (118 kB). View file

examples/ASR/Common-Voice-15-En-Test/sample_2.wav ADDED Viewed

Binary file (214 kB). View file

examples/ASR/Common-Voice-15-En-Test/state.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "30218d56801da2e8",
+  "_format_columns": [
+    "context",
+    "instruction",
+    "answer",
+    "other_attributes",
+    "salmonn_7b",
+    "wavllm_fairseq",
+    "Qwen2-Audio-7B-Instruct",
+    "whisper_large_v3_with_llama_3_8b_instruct",
+    "qwen_audio_chat"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

examples/ASR/Earnings21-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:33dce5920f131621276ca79ef824fc52d5d5bb043d7672458fdbe037c7fb60fd
+size 310572568

examples/ASR/Earnings21-Test/dataset_info.json ADDED Viewed

	@@ -0,0 +1,134 @@

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "context": {
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "audio": {
+        "sampling_rate": 16000,
+        "_type": "Audio"
+      }
+    },
+    "instruction": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "answer": {
+      "audio": {
+        "dtype": "null",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "other_attributes": {
+      "id": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "salmonn_7b": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "wavllm_fairseq": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "Qwen2-Audio-7B-Instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "whisper_large_v3_with_llama_3_8b_instruct": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    },
+    "qwen_audio_chat": {
+      "answer": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "model_prediction": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "task_type": {
+        "dtype": "string",
+        "_type": "Value"
+      },
+      "text": {
+        "dtype": "string",
+        "_type": "Value"
+      }
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

examples/ASR/Earnings21-Test/sample_0.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8e88eccc61c5e8a5e62867c52a8ccfc4e108a5f48459f7df0eb1e9ae7f16d4f
+size 139072236

examples/ASR/Earnings21-Test/sample_1.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dcd3ce7847b7fb0f600bb3faeca3cd2a8f4992fd1de17bd831ef6ccfb2623f33
+size 55065644

examples/ASR/Earnings21-Test/sample_2.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:607725d2a33f206a0f00668f1907f4d997fc7dbe7d1e1f9c82045496412bd8bd
+size 115039268

examples/ASR/Earnings21-Test/state.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "2e3dea299b387757",
+  "_format_columns": [
+    "context",
+    "instruction",
+    "answer",
+    "other_attributes",
+    "salmonn_7b",
+    "wavllm_fairseq",
+    "Qwen2-Audio-7B-Instruct",
+    "whisper_large_v3_with_llama_3_8b_instruct",
+    "qwen_audio_chat"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

examples/ASR/Earnings22-Test/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:51a45b6f2b6f1eaefc76f48f4778b5d5d46793e0a0fc846b1c2dd4b639dd173f
+size 299513312