Spaces:

aletrn
/

ai-pronunciation-trainer

Running

App Files Files Community

alessandro trinca tornidor committed on Nov 20, 2024

Commit

e2f3a00

1 Parent(s): 5105802

test: add/update tests

Browse files

Files changed (2) hide show

aip_trainer/lambdas/lambdaSpeechToScore.py +1 -1
tests/{test_GetAccuracyFromRecordedAudio.py → test_lambdaSpeechToScore.py} +162 -39

aip_trainer/lambdas/lambdaSpeechToScore.py CHANGED Viewed

@@ -58,7 +58,7 @@ def get_speech_to_score_dict(real_text: str, file_bytes_or_audiotmpfile: str | d
         raise ValueError(f"cannot read an empty/None text: '{real_text}'...")
     if language is None or len(language) == 0:
         raise NotImplementedError(f"Not tested/supported with '{language}' language...")
-    if file_bytes_or_audiotmpfile is None or len(file_bytes_or_audiotmpfile) == 0 or os.path.getsize(file_bytes_or_audiotmpfile) == 0:
         raise ValueError(f"cannot read an empty/None file: '{file_bytes_or_audiotmpfile}'...")
     start0 = time.time()

         raise ValueError(f"cannot read an empty/None text: '{real_text}'...")
     if language is None or len(language) == 0:
         raise NotImplementedError(f"Not tested/supported with '{language}' language...")
+    if not isinstance(file_bytes_or_audiotmpfile, (bytes, bytearray)) and (file_bytes_or_audiotmpfile is None or len(file_bytes_or_audiotmpfile) == 0 or os.path.getsize(file_bytes_or_audiotmpfile) == 0):
         raise ValueError(f"cannot read an empty/None file: '{file_bytes_or_audiotmpfile}'...")
     start0 = time.time()

tests/{test_GetAccuracyFromRecordedAudio.py → test_lambdaSpeechToScore.py} RENAMED Viewed

@@ -8,20 +8,62 @@ from aip_trainer.lambdas import lambdaSpeechToScore
 from tests import EVENTS_FOLDER
-text_dict = {
-    "de": "Ich bin Alex, wer bist du?",
-    "en": "Hi there, how are you?"
 }
-def check_output_by_field(output, key, match, expected_output):
     import re
-    assert len(output[key].strip()) > 0
-    for word in output[key].lstrip().rstrip().split(" "):
         word_check = re.findall(match, word.strip())
         assert len(word_check) == 1
         assert word_check[0] == word.strip()
     output[key] = expected_output[key]
     return output
@@ -73,13 +115,13 @@ class TestGetAccuracyFromRecordedAudio(unittest.TestCase):
         inputs = inputs_outputs["inputs"]
         outputs = inputs_outputs["outputs"]
         for event_name, event_content in inputs.items():
-            expected_output = outputs[event_name]
             output = lambdaSpeechToScore.lambda_handler(event_content, [])
             output = json.loads(output)
             app_logger.info(
-                f"output type:{type(output)}, expected_output type:{type(expected_output)}."
             )
-            check_output(self, output, expected_output)
     def test_get_speech_to_score_en_ok(self):
         from aip_trainer.lambdas import lambdaSpeechToScore
@@ -88,24 +130,29 @@ class TestGetAccuracyFromRecordedAudio(unittest.TestCase):
         path = EVENTS_FOLDER / f"test_{language}.wav"
         output = lambdaSpeechToScore.get_speech_to_score_dict(
             real_text=text_dict[language],
-            file_bytes_or_audiotmpfile=path,
             language=language,
             remove_random_file=False,
         )
-        expected_output = {
-            "real_transcript": text_dict[language],
-            "ipa_transcript": "ha\u026a ha\u028a \u0259r ju",
-            "pronunciation_accuracy": "69",
-            "real_transcripts": text_dict[language],
-            "matched_transcripts": "hi - how are you",
-            "real_transcripts_ipa": "ha\u026a \u00f0\u025br, ha\u028a \u0259r ju?",
-            "matched_transcripts_ipa": "ha\u026a  ha\u028a \u0259r ju",
-            "pair_accuracy_category": "0 2 0 0 0",
-            "start_time": "0.2245625 1.3228125 0.852125 1.04825 1.3228125",
-            "end_time": "0.559875 1.658125 1.14825 1.344375 1.658125",
-            "is_letter_correct_all_words": "11 000001 111 111 1111 ",
-        }
-        check_output(self, output, expected_output)
     def test_get_speech_to_score_de_ok(self):
         from aip_trainer.lambdas import lambdaSpeechToScore
@@ -114,24 +161,100 @@ class TestGetAccuracyFromRecordedAudio(unittest.TestCase):
         path = EVENTS_FOLDER / f"test_{language}.wav"
         output = lambdaSpeechToScore.get_speech_to_score_dict(
             real_text=text_dict[language],
-            file_bytes_or_audiotmpfile=path,
             language=language,
             remove_random_file=False,
         )
-        expected_output = {
-            "real_transcript": text_dict[language],
-            "ipa_transcript": "\u026a\u00e7 bi\u02d0n a\u02d0l\u025bksv\u025b\u02d0 b\u025bst\u025b\u02d0 du\u02d0",
-            "pronunciation_accuracy": "63",
-            "real_transcripts": text_dict[language],
-            "matched_transcripts": "ich bin alexwe - beste du",
-            "real_transcripts_ipa": "\u026a\u00e7 bi\u02d0n a\u02d0l\u025bks, v\u0250 b\u026ast du\u02d0?",
-            "matched_transcripts_ipa": "\u026a\u00e7 bi\u02d0n a\u02d0l\u025bksv\u0259 - b\u0259st\u0259 du\u02d0",
-            "pair_accuracy_category": "0 0 2 2 2 0",
-            "start_time": "0.0 0.3075 0.62525 2.1346875 1.5785625 2.1346875",
-            "end_time": "0.328 0.6458125 1.44025 2.4730625 2.15525 2.4730625",
-            "is_letter_correct_all_words": "111 111 11111 000 1011 111 ",
-        }
-        check_output(self, output, expected_output)
 if __name__ == "__main__":

 from tests import EVENTS_FOLDER
+# Reference sentence for each supported language code; the tests pass it as `real_text`.
+text_dict = {"de": "Ich bin Alex, wer bist du?", "en": "Hi there, how are you?"}
+# Expected result dictionaries, keyed by language code, that the tests hand to check_output().
+expected_output = {
+    "de": {
+        "real_transcript": text_dict["de"],
+        "ipa_transcript": "\u026a\u00e7 bi\u02d0n a\u02d0l\u025bksv\u025b\u02d0 b\u025bst\u025b\u02d0 du\u02d0",
+        "pronunciation_accuracy": "63",
+        "real_transcripts": text_dict["de"],
+        "matched_transcripts": "ich bin alexwe - beste du",
+        "real_transcripts_ipa": "\u026a\u00e7 bi\u02d0n a\u02d0l\u025bks, v\u0250 b\u026ast du\u02d0?",
+        "matched_transcripts_ipa": "\u026a\u00e7 bi\u02d0n a\u02d0l\u025bksv\u0259 - b\u0259st\u0259 du\u02d0",
+        "pair_accuracy_category": "0 0 2 2 2 0",
+        "start_time": "0.0 0.3075 0.62525 2.1346875 1.5785625 2.1346875",
+        "end_time": "0.328 0.6458125 1.44025 2.4730625 2.15525 2.4730625",
+        "is_letter_correct_all_words": "111 111 11111 000 1011 111 ",
+    },
+    "en": {
+        "real_transcript": text_dict["en"],
+        "ipa_transcript": "ha\u026a ha\u028a \u0259r ju",
+        "pronunciation_accuracy": "69",
+        "real_transcripts": text_dict["en"],
+        "matched_transcripts": "hi - how are you",
+        "real_transcripts_ipa": "ha\u026a \u00f0\u025br, ha\u028a \u0259r ju?",
+        "matched_transcripts_ipa": "ha\u026a  ha\u028a \u0259r ju",
+        "pair_accuracy_category": "0 2 0 0 0",
+        "start_time": "0.2245625 1.3228125 0.852125 1.04825 1.3228125",
+        "end_time": "0.559875 1.658125 1.14825 1.344375 1.658125",
+        "is_letter_correct_all_words": "11 000001 111 111 1111 ",
+    },
 }
+def assert_raises_get_speech_to_score_dict(self, real_text, file_bytes_or_audiotmpfile, language, exc, error_message):
+    """Assert that get_speech_to_score_dict() raises `exc` with exactly `error_message`.
+
+    Args:
+        self: the running unittest.TestCase, used for its assertion helpers.
+        real_text: reference text forwarded to get_speech_to_score_dict().
+        file_bytes_or_audiotmpfile: audio input forwarded to get_speech_to_score_dict().
+        language: language code forwarded to get_speech_to_score_dict().
+        exc: exception class the call is expected to raise.
+        error_message: expected value of str() applied to the raised exception.
+    """
+    from aip_trainer.lambdas import lambdaSpeechToScore
+    with self.assertRaises(exc) as raised:
+        lambdaSpeechToScore.get_speech_to_score_dict(
+            real_text, file_bytes_or_audiotmpfile, language, remove_random_file=False
+        )
+    # Compare the message only after leaving the assertRaises block: a failing
+    # assertEqual inside it raises AssertionError, which assertRaises would accept
+    # as the expected exception whenever `exc` is a base class of AssertionError.
+    self.assertEqual(str(raised.exception), error_message)
+def check_value_by_field(value, match):
+    """Assert that `value` is non-blank and that each space-separated word matches `match`.
+
+    `match` is a regular expression: re.findall() must return exactly one result
+    for every word, and that result must equal the whole (stripped) word.
+    """
     import re
+    assert len(value.strip()) > 0
+    for word in value.lstrip().rstrip().split(" "):
         word_check = re.findall(match, word.strip())
         assert len(word_check) == 1
         assert word_check[0] == word.strip()
+def check_output_by_field(output, key, match, expected_output):
+    """Validate the format of output[key], then overwrite it with expected_output[key].
+
+    The value is checked against the `match` regex through check_value_by_field();
+    `output` is modified in place and also returned.
+    """
+    check_value_by_field(output[key], match)
     output[key] = expected_output[key]
     return output
         inputs = inputs_outputs["inputs"]
         outputs = inputs_outputs["outputs"]
         for event_name, event_content in inputs.items():
+            current_expected_output = outputs[event_name]
             output = lambdaSpeechToScore.lambda_handler(event_content, [])
             output = json.loads(output)
             app_logger.info(
+                f"output type:{type(output)}, expected_output type:{type(current_expected_output)}."
             )
+            check_output(self, output, current_expected_output)
     def test_get_speech_to_score_en_ok(self):
         from aip_trainer.lambdas import lambdaSpeechToScore
         path = EVENTS_FOLDER / f"test_{language}.wav"
         output = lambdaSpeechToScore.get_speech_to_score_dict(
             real_text=text_dict[language],
+            file_bytes_or_audiotmpfile=str(path),
             language=language,
             remove_random_file=False,
         )
+        check_output(self, output, expected_output[language])
+    def test_get_speech_to_score_en_ok_remove_input_file(self):
+        """Score a copy of the English sample with remove_random_file=True.
+
+        The test expects the copied input file to be gone after the call and the
+        returned dictionary to match the expected English output.
+        """
+        import shutil
+        from aip_trainer.lambdas import lambdaSpeechToScore
+        language = "en"
+        path = EVENTS_FOLDER / f"test_{language}.wav"
+        path2 = EVENTS_FOLDER / f"test2_{language}.wav"
+        shutil.copy(path, path2)
+        # Always remove the copy, so a failure in the call under test does not
+        # leave a stray wav file in the events folder.
+        self.addCleanup(path2.unlink, missing_ok=True)
+        self.assertTrue(path2.is_file())
+        output = lambdaSpeechToScore.get_speech_to_score_dict(
+            real_text=text_dict[language],
+            file_bytes_or_audiotmpfile=str(path2),
+            language=language,
+            remove_random_file=True,
+        )
+        self.assertFalse(path2.exists())
+        check_output(self, output, expected_output[language])
     def test_get_speech_to_score_de_ok(self):
         from aip_trainer.lambdas import lambdaSpeechToScore
         path = EVENTS_FOLDER / f"test_{language}.wav"
         output = lambdaSpeechToScore.get_speech_to_score_dict(
             real_text=text_dict[language],
+            file_bytes_or_audiotmpfile=str(path),
+            language=language,
+            remove_random_file=False,
+        )
+        check_output(self, output, expected_output[language])
+    def test_get_speech_to_score_de_ok_remove_input_file(self):
+        """Score a copy of the German sample with remove_random_file=True.
+
+        The test expects the copied input file to be gone after the call and the
+        returned dictionary to match the expected German output.
+        """
+        import shutil
+        from aip_trainer.lambdas import lambdaSpeechToScore
+        language = "de"
+        path = EVENTS_FOLDER / f"test_{language}.wav"
+        path2 = EVENTS_FOLDER / f"test2_{language}.wav"
+        shutil.copy(path, path2)
+        # Always remove the copy, so a failure in the call under test does not
+        # leave a stray wav file in the events folder.
+        self.addCleanup(path2.unlink, missing_ok=True)
+        self.assertTrue(path2.is_file())
+        output = lambdaSpeechToScore.get_speech_to_score_dict(
+            real_text=text_dict[language],
+            file_bytes_or_audiotmpfile=str(path2),
+            language=language,
+            remove_random_file=True,
+        )
+        self.assertFalse(path2.exists())
+        check_output(self, output, expected_output[language])
+    def test_get_speech_to_score_tuple_de_ok(self):
+        """Check get_speech_to_score_tuple() on the German sample recording.
+
+        The six returned values are checked one by one; the last one is decoded
+        from JSON and compared with the expected German output.
+        """
+        from aip_trainer.lambdas import lambdaSpeechToScore
+        language = "de"
+        path = EVENTS_FOLDER / f"test_{language}.wav"
+        (
+            real_transcripts,
+            is_letter_correct_all_words,
+            pronunciation_accuracy,
+            ipa_transcript,
+            real_transcripts_ipa,
+            dumped,
+        ) = lambdaSpeechToScore.get_speech_to_score_tuple(
+            real_text=text_dict[language],
+            file_bytes_or_audiotmpfile=str(path),
             language=language,
             remove_random_file=False,
         )
+        assert real_transcripts == text_dict[language]
+        check_value_by_field(is_letter_correct_all_words, r"[01]+")
+        # Raw string: "\d" in a plain literal is an invalid escape sequence and
+        # triggers a warning on recent Python versions.
+        check_value_by_field(pronunciation_accuracy, r"\d+")
+        assert len(ipa_transcript.strip()) > 0
+        assert len(real_transcripts_ipa.strip()) > 0
+        check_output(self, json.loads(dumped), expected_output[language])
+    def test_get_speech_to_score_tuple_en_ok(self):
+        """Check get_speech_to_score_tuple() on the English sample recording.
+
+        The six returned values are checked one by one; the last one is decoded
+        from JSON and compared with the expected English output.
+        """
+        from aip_trainer.lambdas import lambdaSpeechToScore
+        language = "en"
+        path = EVENTS_FOLDER / f"test_{language}.wav"
+        (
+            real_transcripts,
+            is_letter_correct_all_words,
+            pronunciation_accuracy,
+            ipa_transcript,
+            real_transcripts_ipa,
+            dumped,
+        ) = lambdaSpeechToScore.get_speech_to_score_tuple(
+            real_text=text_dict[language],
+            file_bytes_or_audiotmpfile=str(path),
+            language=language,
+            remove_random_file=False,
+        )
+        assert real_transcripts == text_dict[language]
+        check_value_by_field(is_letter_correct_all_words, r"[01]+")
+        # Raw string: "\d" in a plain literal is an invalid escape sequence and
+        # triggers a warning on recent Python versions.
+        check_value_by_field(pronunciation_accuracy, r"\d+")
+        assert len(ipa_transcript.strip()) > 0
+        assert len(real_transcripts_ipa.strip()) > 0
+        check_output(self, json.loads(dumped), expected_output[language])
+    def test_get_speech_to_score_dict__de_empty_input_text(self):
+        """An empty reference text with the German sample path must raise ValueError."""
+        lang_code = "de"
+        audio_path = EVENTS_FOLDER / f"test_{lang_code}.wav"
+        assert_raises_get_speech_to_score_dict(
+            self,
+            real_text="",
+            file_bytes_or_audiotmpfile=str(audio_path),
+            language=lang_code,
+            exc=ValueError,
+            error_message="cannot read an empty/None text: ''...",
+        )
+    def test_get_speech_to_score_dict__en_empty_input_text(self):
+        """An empty reference text with the English sample path must raise ValueError."""
+        lang_code = "en"
+        audio_path = EVENTS_FOLDER / f"test_{lang_code}.wav"
+        assert_raises_get_speech_to_score_dict(
+            self,
+            real_text="",
+            file_bytes_or_audiotmpfile=str(audio_path),
+            language=lang_code,
+            exc=ValueError,
+            error_message="cannot read an empty/None text: ''...",
+        )
+    def test_get_speech_to_score_dict__de_empty_input_file(self):
+        """An empty audio path with the German language code must raise ValueError."""
+        assert_raises_get_speech_to_score_dict(
+            self,
+            real_text="text fake",
+            file_bytes_or_audiotmpfile="",
+            language="de",
+            exc=ValueError,
+            error_message="cannot read an empty/None file: ''...",
+        )
+    def test_get_speech_to_score_dict__en_empty_input_file(self):
+        """An empty audio path with the English language code must raise ValueError."""
+        assert_raises_get_speech_to_score_dict(
+            self,
+            real_text="text fake",
+            file_bytes_or_audiotmpfile="",
+            language="en",
+            exc=ValueError,
+            error_message="cannot read an empty/None file: ''...",
+        )
+    def test_get_speech_to_score_dict__empty_language(self):
+        """An empty language code must raise NotImplementedError."""
+        assert_raises_get_speech_to_score_dict(
+            self,
+            real_text="text fake",
+            file_bytes_or_audiotmpfile="fake_file",
+            language="",
+            exc=NotImplementedError,
+            error_message="Not tested/supported with '' language...",
+        )
 if __name__ == "__main__":