Spaces:

aletrn
/

ai-pronunciation-trainer

Running

alessandro trinca tornidor committed on Nov 21, 2024

Commit

bafb40b

1 Parent(s): 6e31dbd

feat: prepare a separate function to get a random phrase from the phrase dataset

Files changed (1) hide show

aip_trainer/lambdas/lambdaGetSample.py CHANGED Viewed

@@ -63,10 +63,7 @@ def lambda_handler(event, context):
     try:
         current_transcript = str(body["transcript"])
     except KeyError:
-        lambda_df_lang = lambda_database[language]
-        current_transcript = lambda_df_lang.get_random_sample_from_df(language, category)
-    app_logger.info(f"category={category}, language={language}, current_transcript={current_transcript}.")
-    # sentence_category = getSentenceCategory(current_transcript[0])
     current_transcript = current_transcript if isinstance(current_transcript, str) else current_transcript[0]
     current_ipa = lambda_ipa_converter[language].convertToPhonem(current_transcript)
@@ -80,6 +77,13 @@ def lambda_handler(event, context):
     return json.dumps(result)
 def getSentenceCategory(sentence) -> int:
     number_of_words = len(sentence.split())
     categories_word_limits = [0, 8, 20, 100000]

     try:
         current_transcript = str(body["transcript"])
     except KeyError:
+        current_transcript = get_random_selection(language, category, is_gradio_output=False)
     current_transcript = current_transcript if isinstance(current_transcript, str) else current_transcript[0]
     current_ipa = lambda_ipa_converter[language].convertToPhonem(current_transcript)
     return json.dumps(result)
+def get_random_selection(language: str, category: int, is_gradio_output=True):
+    lambda_df_lang = lambda_database[language]
+    current_transcript = lambda_df_lang.get_random_sample_from_df(language, category)
+    app_logger.info(f"category={category}, language={language}, current_transcript={current_transcript}.")
+    return current_transcript[0] if is_gradio_output else current_transcript
 def getSentenceCategory(sentence) -> int:
     number_of_words = len(sentence.split())
     categories_word_limits = [0, 8, 20, 100000]