Spaces:

openpecha
/

tibetan-stt-whisper-sm

Runtime error

TenzinGayche committed on Sep 21, 2023

Commit

81d612f

•

1 Parent(s): 4eff596

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,31 +4,30 @@ import pyewts
 converter = pyewts.pyewts()
-def remove_repeated_words(text):
-    # Tokenize the input text into words
-    words = text.split()
-    # Create a dictionary to count word occurrences
-    word_count = {}
-    # Create a list to store the final words
-    new_words = []
-    for word in words:
-        # Check if the word is in the dictionary
-        if word in word_count:
-            # If it has occurred once before, add it to the list with a count of 2
-            if word_count[word] == 1:
-                new_words.append(word)
-                word_count[word] = 2
-        else:
-            # If it has not occurred before, add it to the dictionary with a count of 1
-            word_count[word] = 1
-            new_words.append(word)
-    # Join the modified words back into a string
-    result = ' '.join(new_words)
-    return result
 # Example usage
@@ -44,7 +43,7 @@ def transcribe(microphone, upload):
     text = pipe(audio)["text"]
-    text = remove_repeated_words(text)
     state = converter.toUnicode(text)
     return state

 converter = pyewts.pyewts()
+# def remove_repeated_words(text):
+#     # Tokenize the input text into words
+#     words = text.split()
+#     # Create a dictionary to count word occurrences
+#     word_count = {}
+#     # Create a list to store the final words
+#     new_words = []
+#     for word in words:
+#         # Check if the word is in the dictionary
+#         if word in word_count:
+#             # If it has occurred once before, add it to the list with a count of 2
+#             if word_count[word] == 1:
+#                 new_words.append(word)
+#                 word_count[word] = 2
+#         else:
+#             # If it has not occurred before, add it to the dictionary with a count of 1
+#             word_count[word] = 1
+#             new_words.append(word)
+#     result = ' '.join(new_words)
+#     return result
 # Example usage
     text = pipe(audio)["text"]
+    # text = remove_repeated_words(text)
     state = converter.toUnicode(text)
     return state