Spaces:

ginigen
/

Sign-language

Building

App Files Community

ginipick committed on Jan 26

Commit

fada645

verified ·

1 Parent(s): c8c948e

Update src/main.py

Browse files

Files changed (1) hide show

src/main.py +55 -60

src/main.py CHANGED Viewed

@@ -29,32 +29,7 @@ def is_korean(text):
     """한글이 포함되어 있는지 확인"""
     return bool(re.search('[가-힣]', text))
-def normalize_quotes(text):
-    """따옴표 형식을 정규화하는 함수"""
-    # 연속된 따옴표 제거
-    text = re.sub(r"'+", "'", text)
-    # 불필요한 공백 제거
-    text = re.sub(r'\s+', ' ', text).strip()
-    if is_korean(text):
-        # 한글 문장의 경우
-        words = text.split()
-        if words:
-            # 첫 번째 단어에서 따옴표 제거 후 다시 추가
-            first_word = words[0].replace("'", "")
-            words[0] = f"'{first_word}'"
-            # 나머지 단어들에서 따옴표 제거
-            words[1:] = [w.replace("'", "") for w in words[1:]]
-            return ' '.join(words)
-    else:
-        # 영어 문장의 경우, 첫 단어만 따옴표로 처리
-        words = text.split()
-        if words:
-            # 첫 번째 단어에서 따옴표 제거 후 다시 추가
-            first_word = words[0].replace("'", "")
-            words[0] = f"'{first_word}'"
-            return ' '.join(words)
-    return text
 def find_quoted_words(text):
     """작은따옴표로 묶인 단어들을 찾는 함수"""
@@ -64,16 +39,6 @@ def spell_out_word(word):
     """단어를 개별 알파벳으로 분리하는 함수"""
     return ' '.join(list(word.lower()))
-def is_english(text):
-    """텍스트가 영어인지 확인하는 함수"""
-    # 따옴표와 기본 문장부호를 제거하고 영어 알파벳과 공백만 남김
-    cleaned_text = re.sub(r'[^A-Za-z\s]', '', text)
-    # 알파벳이 하나라도 있는지 확인
-    has_letters = bool(re.search('[A-Za-z]', cleaned_text))
-    # 알파벳과 공백 외의 문자가 없는지 확인
-    is_only_english = bool(re.match(r'^[A-Za-z\s]*$', cleaned_text))
-    return has_letters and is_only_english
 def translate_korean_to_english(text):
     """전체 텍스트 번역 함수"""
     try:
@@ -82,42 +47,72 @@ def translate_korean_to_english(text):
         # 영어 입력 확인
         if is_english(text):
             return text
         # 한글 입력 처리
-        # 따옴표로 묶인 단어 찾기
-        quoted_word = re.findall(r"'([^']*)'", text)[0]
-        # 따옴표로 묶인 단어 먼저 번역
-        url = "https://translate.googleapis.com/translate_a/single"
-        params = {
-            "client": "gtx",
-            "sl": "ko",
-            "tl": "en",
-            "dt": "t",
-            "q": quoted_word
-        }
-        response = requests.get(url, params=params)
-        if response.status_code == 200:
-            translated_word = response.json()[0][0][0].upper()
-            # 원본 텍스트에서 따옴표로 묶인 부분을 임시 마커로 대체
-            text = text.replace(f"'{quoted_word}'", "QUOTED_WORD_MARKER")
-            # 나머지 문장 번역
-            params["q"] = text
             response = requests.get(url, params=params)
             if response.status_code == 200:
-                translated_text = ' '.join(item[0] for item in response.json()[0] if item[0])
-                # 마커를 번역된 단어로 대체
-                translated_text = translated_text.replace("QUOTED_WORD_MARKER", f"'{translated_word}'")
-                return translated_text
         return text
     except Exception as e:
         print(f"Translation error: {e}")
         return text
 @app.route('/')
 def index():
     return render_template('index.html', title=app.config['TITLE'])

     """한글이 포함되어 있는지 확인"""
     return bool(re.search('[가-힣]', text))
 def find_quoted_words(text):
     """작은따옴표로 묶인 단어들을 찾는 함수"""
     """단어를 개별 알파벳으로 분리하는 함수"""
     return ' '.join(list(word.lower()))
 def translate_korean_to_english(text):
     """전체 텍스트 번역 함수"""
     try:
         # 영어 입력 확인
         if is_english(text):
+            # 영어 입력의 경우 따옴표 처리만 하고 그대로 반환
+            quoted_match = re.search(r"'([^']*)'", text)
+            if quoted_match:
+                quoted_word = quoted_match.group(1).upper()
+                text = re.sub(r"'[^']*'", f"'{quoted_word}'", text, 1)
             return text
         # 한글 입력 처리
+        quoted_match = re.search(r"'([^']*)'", text)
+        if quoted_match:
+            quoted_word = quoted_match.group(1)
+            # 따옴표로 묶인 단어 먼저 번역
+            url = "https://translate.googleapis.com/translate_a/single"
+            params = {
+                "client": "gtx",
+                "sl": "ko",
+                "tl": "en",
+                "dt": "t",
+                "q": quoted_word
+            }
             response = requests.get(url, params=params)
             if response.status_code == 200:
+                translated_word = response.json()[0][0][0].upper()
+                # 원본 텍스트에서 따옴표로 묶인 부분을 임시 마커로 대체
+                text = text.replace(f"'{quoted_word}'", "QUOTED_WORD_MARKER")
+                # 나머지 문장 번역
+                params["q"] = text
+                response = requests.get(url, params=params)
+                if response.status_code == 200:
+                    translated_text = ' '.join(item[0] for item in response.json()[0] if item[0])
+                    # 마커를 번역된 단어로 대체
+                    translated_text = translated_text.replace("QUOTED_WORD_MARKER", f"'{translated_word}'")
+                    return translated_text
         return text
     except Exception as e:
         print(f"Translation error: {e}")
         return text
+def is_english(text):
+    """텍스트가 영어인지 확인하는 함수"""
+    # 따옴표와 공백을 제외한 나머지 텍스트 확인
+    text_without_quotes = re.sub(r"'[^']*'|\s", "", text)
+    # 영어 알파벳과 기본 문장부호만 포함되어 있는지 확인
+    return bool(re.match(r'^[A-Za-z.,!?-]*$', text_without_quotes))
+def normalize_quotes(text):
+    """따옴표 형식을 정규화하는 함수"""
+    # 연속된 따옴표 제거
+    text = re.sub(r"'+", "'", text)
+    # 불필요한 공백 제거
+    text = re.sub(r'\s+', ' ', text).strip()
+    # 첫 번째 단어에만 따옴표 처리
+    words = text.split()
+    if words:
+        # 모든 따옴표 제거 후 첫 단어에만 따옴표 추가
+        first_word = words[0].replace("'", "")
+        words[0] = f"'{first_word}'"
+        words[1:] = [w.replace("'", "") for w in words[1:]]
+        return ' '.join(words)
+    return text
 @app.route('/')
 def index():
     return render_template('index.html', title=app.config['TITLE'])