Spaces:

braindeck
/

Lucy_5

Running on Zero

aaron committed 17 days ago

Commit

771366a

1 Parent(s): d9f37c5

UI 텍스트를 영어로 변경 (국제화)

- 메인 제목 및 설명을 영어로 번역
- TTS 설정 섹션 라벨 영어화
- 음성 변환 설정 섹션 라벨 영어화
- 버튼 및 출력 라벨 영어화
- 처리 과정 및 팁 설명 영어화
- 기본 텍스트 예시를 영어로 변경
- 국제 사용자 접근성 향상

Files changed (1) hide show

app.py +36 -36

app.py CHANGED Viewed

@@ -811,98 +811,98 @@ except Exception as e:
 # Create Gradio interface
 with gr.Blocks(title="Integrated TTS + Voice Conversion", analytics_enabled=False) as demo:
     gr.Markdown("""
-    # **Integrated TTS + Voice Conversion** — 텍스트를 음성으로 변환 후 음성 변환
-    텍스트를 입력하고 참조 음성을 업로드하면, 먼저 텍스트가 음성으로 변환된 후 참조 음성의 스타일로 변환됩니다.
-    **사용법:**
-    1. 변환할 텍스트를 입력하세요
-    2. 참조 음성을 업로드하세요 (3-10초 권장)
-    3. 기본 음성 스타일과 속도를 선택하세요
-    4. 음성 변환 파라미터를 조정하세요
-    5. "통합 변환" 버튼을 클릭하세요
     """)
     with gr.Row():
         with gr.Column(scale=6):
             # TTS Parameters
-            gr.Markdown("### 🎤 텍스트-음성 변환 설정")
             text_input = gr.Textbox(
-                label="변환할 텍스트",
-                value="안녕하세요! 이것은 통합 TTS와 음성 변환 데모입니다.",
                 lines=3
             )
             style_input = gr.Dropdown(
-                label="기본 음성 스타일",
                 choices=styles,
                 value=styles[0]
             )
             speed_input = gr.Slider(
                 0.6, 1.4, value=1.0, step=0.05,
-                label="음성 속도 (×)"
             )
             reference_audio_input = gr.Audio(
-                label="참조 음성",
                 sources=["upload", "microphone"],
                 type="filepath"
             )
             # Voice Conversion Parameters
-            gr.Markdown("### 🔄 음성 변환 설정")
             with gr.Row():
                 vc_diffusion_steps = gr.Slider(
                     minimum=1, maximum=200, value=25, step=1,
-                    label="확산 단계",
-                    info="25 기본값, 50~100 최고 품질"
                 )
                 vc_length_adjust = gr.Slider(
                     minimum=0.5, maximum=2.0, step=0.1, value=1.0,
-                    label="길이 조정",
-                    info="<1.0 빠르게, >1.0 느리게"
                 )
             with gr.Row():
                 vc_inference_cfg_rate = gr.Slider(
                     minimum=0.0, maximum=1.0, step=0.1, value=0.7,
-                    label="CFG 비율",
-                    info="미묘한 영향"
                 )
                 vc_pitch_shift = gr.Slider(
                     minimum=-24, maximum=24, step=1, value=0,
-                    label="피치 시프트",
-                    info="반음 단위"
                 )
             with gr.Row():
                 vc_f0_condition = gr.Checkbox(
-                    label="F0 조건부 모델 사용",
                     value=False,
-                    info="노래 음성 변환에 필요"
                 )
                 vc_auto_f0_adjust = gr.Checkbox(
-                    label="자동 F0 조정",
                     value=True,
-                    info="대상 음성에 맞게 F0 조정"
                 )
-            convert_btn = gr.Button("통합 변환", variant="primary", size="lg")
         with gr.Column(scale=6):
             output_audio = gr.Audio(
-                label="최종 변환된 음성",
                 autoplay=True,
                 format="wav"
             )
             gr.Markdown("""
-            ### 📋 처리 과정:
-            1. **텍스트 → 음성**: 입력된 텍스트가 참조 음성의 톤으로 변환됩니다
-            2. **음성 변환**: 생성된 음성이 참조 음성의 스타일로 최종 변환됩니다
-            ### 💡 팁:
-            - 참조 음성은 3-10초 길이의 깨끗한 음성을 사용하세요
-            - 노래 음성 변환을 원한다면 "F0 조건부 모델 사용"을 체크하세요
-            - 품질을 높이려면 확산 단계를 50-100으로 설정하세요
             """)
     # Connect the button click to the processing function

 # Create Gradio interface
 with gr.Blocks(title="Integrated TTS + Voice Conversion", analytics_enabled=False) as demo:
     gr.Markdown("""
+    # **Integrated TTS + Voice Conversion** — Convert text to speech and then apply voice conversion
+    Enter text and upload a reference audio to first convert text to speech, then apply voice conversion to match the reference style.
+    **How to use:**
+    1. Enter the text you want to convert
+    2. Upload a reference audio (3-10 seconds recommended)
+    3. Select the base voice style and speed
+    4. Adjust voice conversion parameters
+    5. Click the "Convert" button
     """)
     with gr.Row():
         with gr.Column(scale=6):
             # TTS Parameters
+            gr.Markdown("### 🎤 Text-to-Speech Settings")
             text_input = gr.Textbox(
+                label="Text to Convert",
+                value="Hello! This is an integrated TTS and voice conversion demo.",
                 lines=3
             )
             style_input = gr.Dropdown(
+                label="Base Voice Style",
                 choices=styles,
                 value=styles[0]
             )
             speed_input = gr.Slider(
                 0.6, 1.4, value=1.0, step=0.05,
+                label="Speech Speed (×)"
             )
             reference_audio_input = gr.Audio(
+                label="Reference Audio",
                 sources=["upload", "microphone"],
                 type="filepath"
             )
             # Voice Conversion Parameters
+            gr.Markdown("### 🔄 Voice Conversion Settings")
             with gr.Row():
                 vc_diffusion_steps = gr.Slider(
                     minimum=1, maximum=200, value=25, step=1,
+                    label="Diffusion Steps",
+                    info="25 default, 50~100 for best quality"
                 )
                 vc_length_adjust = gr.Slider(
                     minimum=0.5, maximum=2.0, step=0.1, value=1.0,
+                    label="Length Adjustment",
+                    info="<1.0 faster, >1.0 slower"
                 )
             with gr.Row():
                 vc_inference_cfg_rate = gr.Slider(
                     minimum=0.0, maximum=1.0, step=0.1, value=0.7,
+                    label="CFG Rate",
+                    info="Subtle influence"
                 )
                 vc_pitch_shift = gr.Slider(
                     minimum=-24, maximum=24, step=1, value=0,
+                    label="Pitch Shift",
+                    info="In semitones"
                 )
             with gr.Row():
                 vc_f0_condition = gr.Checkbox(
+                    label="Use F0 Conditioned Model",
                     value=False,
+                    info="Required for singing voice conversion"
                 )
                 vc_auto_f0_adjust = gr.Checkbox(
+                    label="Auto F0 Adjustment",
                     value=True,
+                    info="Adjust F0 to match target voice"
                 )
+            convert_btn = gr.Button("Convert", variant="primary", size="lg")
         with gr.Column(scale=6):
             output_audio = gr.Audio(
+                label="Final Converted Audio",
                 autoplay=True,
                 format="wav"
             )
             gr.Markdown("""
+            ### 📋 Processing Steps:
+            1. **Text → Speech**: Input text is converted to speech with the reference voice tone
+            2. **Voice Conversion**: Generated speech is converted to match the reference voice style
+            ### 💡 Tips:
+            - Use clean reference audio of 3-10 seconds length
+            - Check "Use F0 Conditioned Model" for singing voice conversion
+            - Set diffusion steps to 50-100 for higher quality
             """)
     # Connect the button click to the processing function