Spaces:

englissi
/

engdialogue

Running

App Files Community

englissi committed 3 days ago

Commit

1a4473d

verified ·

1 Parent(s): 9e130e4

Update app.py

Browse files

Files changed (1) hide show

app.py +79 -57

app.py CHANGED Viewed

@@ -3,36 +3,45 @@ from gtts import gTTS
 from pydub import AudioSegment
 from io import BytesIO
-def multilingual_tts(
-    korean_text,
-    british_text,
-    american_text,
-    british_text_add1,
-    british_text_add2,
-    australian_text_add1,
-    australian_text_add2,
-    american_text_add1,
-    additional_english_text_9,
-    additional_english_text_10
 ):
-    # 각 음성에 대해 (언어 코드, tld, 텍스트) 튜플을 리스트에 저장합니다.
-    voices = [
-        ("ko", "com", korean_text),                      # 한국어
-        ("en", "co.uk", british_text),                   # 기존 영국식
-        ("en", "com", american_text),                    # 기존 미국식
-        ("en", "co.uk", british_text_add1),              # 추가 영국식 1
-        ("en", "co.uk", british_text_add2),              # 추가 영국식 2
-        ("en", "com.au", australian_text_add1),          # 추가 호주식 1
-        ("en", "com.au", australian_text_add2),          # 추가 호주식 2
-        ("en", "com", american_text_add1),               # 추가 미국식 1
-        ("en", "com", additional_english_text_9),        # 추가 영어 9
-        ("en", "com", additional_english_text_10)        # 추가 영어 10
     ]
-    combined_audio = AudioSegment.silent(duration=0)  # 빈 오디오
-    for lang, tld, text in voices:
-        if text.strip():  # 텍스트가 입력되어 있을 때만 처리
             tts = gTTS(text, lang=lang, tld=tld)
             audio_file = BytesIO()
             tts.write_to_fp(audio_file)
@@ -44,57 +53,70 @@ def multilingual_tts(
     # 최종 결합된 오디오를 mp3 파일로 저장
     output_file = "combined_output.mp3"
     combined_audio.export(output_file, format="mp3")
     return output_file
 with gr.Blocks() as demo:
-    gr.Markdown("## Multilingual TTS: Generate a Single Audio File (총 10개 음성)")
-    # 한국어 입력란
-    korean_input = gr.Textbox(label="Enter Korean Text:", placeholder="안녕하세요")
-    # 기존 영어 입력란 (영국식, 미국식)
     with gr.Row():
-        british_input = gr.Textbox(label="Enter British English Text:", placeholder="Hello (British)")
-        american_input = gr.Textbox(label="Enter American English Text:", placeholder="Hello (American)")
-    # 추가 영어 입력란 (추가 영국식)
     with gr.Row():
-        british_input_add1 = gr.Textbox(label="Enter Additional British English Text 1:", placeholder="Hi there (British)")
-        british_input_add2 = gr.Textbox(label="Enter Additional British English Text 2:", placeholder="Good day (British)")
-    # 추가 영어 입력란 (추가 호주식)
     with gr.Row():
-        australian_input_add1 = gr.Textbox(label="Enter Additional Australian English Text 1:", placeholder="G'day (Australian)")
-        australian_input_add2 = gr.Textbox(label="Enter Additional Australian English Text 2:", placeholder="How ya going? (Australian)")
-    # 추가 영어 입력란 (추가 미국식 및 추가 영어)
     with gr.Row():
-        american_input_add1 = gr.Textbox(label="Enter Additional American English Text 1:", placeholder="Hey (American)")
-        additional_english_input_9 = gr.Textbox(label="Enter Additional English Text 9:", placeholder="Additional dialogue 9 (English)")
-    # 마지막 추가 영어 입력란
-    additional_english_input_10 = gr.Textbox(label="Enter Additional English Text 10:", placeholder="Additional dialogue 10 (English)")
     output_audio = gr.Audio(label="Generated Speech", type="filepath")
     generate_button = gr.Button("Generate Speech")
     generate_button.click(
-        multilingual_tts,
         inputs=[
-            korean_input,
-            british_input,
-            american_input,
-            british_input_add1,
-            british_input_add2,
-            australian_input_add1,
-            australian_input_add2,
-            american_input_add1,
-            additional_english_input_9,
-            additional_english_input_10
-        ],
         outputs=output_audio
     )
 if __name__ == "__main__":
-    demo.launch()

 from pydub import AudioSegment
 from io import BytesIO
+def custom_tts(
+    text1, accent1,
+    text2, accent2,
+    text3, accent3,
+    text4, accent4,
+    text5, accent5,
+    text6, accent6,
+    text7, accent7,
+    text8, accent8,
+    text9, accent9,
+    text10, accent10
 ):
+    # 각 악센트에 따른 언어 코드와 tld 설정
+    accent_mapping = {
+        "British": ("en", "co.uk"),
+        "American": ("en", "com"),
+        "Australian": ("en", "com.au")
+    }
+    # 10개의 대화문과 선택된 악센트를 튜플 리스트로 구성합니다.
+    dialogues = [
+        (text1, accent1),
+        (text2, accent2),
+        (text3, accent3),
+        (text4, accent4),
+        (text5, accent5),
+        (text6, accent6),
+        (text7, accent7),
+        (text8, accent8),
+        (text9, accent9),
+        (text10, accent10)
     ]
+    combined_audio = AudioSegment.silent(duration=0)  # 초기 빈 오디오
+    # 각 대화문에 대해 음성 생성 후 결합
+    for text, accent in dialogues:
+        if text.strip():  # 텍스트가 비어있지 않은 경우에만 처리
+            lang, tld = accent_mapping.get(accent, ("en", "com"))
             tts = gTTS(text, lang=lang, tld=tld)
             audio_file = BytesIO()
             tts.write_to_fp(audio_file)
     # 최종 결합된 오디오를 mp3 파일로 저장
     output_file = "combined_output.mp3"
     combined_audio.export(output_file, format="mp3")
     return output_file
 with gr.Blocks() as demo:
+    gr.Markdown("## Custom TTS: 10개의 대화문 입력란에서 악센트를 선택하여 음성 생성하기")
+    with gr.Row():
+        text1 = gr.Textbox(label="Dialogue 1", placeholder="Enter text for Dialogue 1")
+        accent1 = gr.Dropdown(label="Accent for Dialogue 1", choices=["British", "American", "Australian"], value="British")
+    with gr.Row():
+        text2 = gr.Textbox(label="Dialogue 2", placeholder="Enter text for Dialogue 2")
+        accent2 = gr.Dropdown(label="Accent for Dialogue 2", choices=["British", "American", "Australian"], value="British")
+    with gr.Row():
+        text3 = gr.Textbox(label="Dialogue 3", placeholder="Enter text for Dialogue 3")
+        accent3 = gr.Dropdown(label="Accent for Dialogue 3", choices=["British", "American", "Australian"], value="British")
+    with gr.Row():
+        text4 = gr.Textbox(label="Dialogue 4", placeholder="Enter text for Dialogue 4")
+        accent4 = gr.Dropdown(label="Accent for Dialogue 4", choices=["British", "American", "Australian"], value="British")
     with gr.Row():
+        text5 = gr.Textbox(label="Dialogue 5", placeholder="Enter text for Dialogue 5")
+        accent5 = gr.Dropdown(label="Accent for Dialogue 5", choices=["British", "American", "Australian"], value="British")
     with gr.Row():
+        text6 = gr.Textbox(label="Dialogue 6", placeholder="Enter text for Dialogue 6")
+        accent6 = gr.Dropdown(label="Accent for Dialogue 6", choices=["British", "American", "Australian"], value="British")
     with gr.Row():
+        text7 = gr.Textbox(label="Dialogue 7", placeholder="Enter text for Dialogue 7")
+        accent7 = gr.Dropdown(label="Accent for Dialogue 7", choices=["British", "American", "Australian"], value="British")
     with gr.Row():
+        text8 = gr.Textbox(label="Dialogue 8", placeholder="Enter text for Dialogue 8")
+        accent8 = gr.Dropdown(label="Accent for Dialogue 8", choices=["British", "American", "Australian"], value="British")
+    with gr.Row():
+        text9 = gr.Textbox(label="Dialogue 9", placeholder="Enter text for Dialogue 9")
+        accent9 = gr.Dropdown(label="Accent for Dialogue 9", choices=["British", "American", "Australian"], value="British")
+    with gr.Row():
+        text10 = gr.Textbox(label="Dialogue 10", placeholder="Enter text for Dialogue 10")
+        accent10 = gr.Dropdown(label="Accent for Dialogue 10", choices=["British", "American", "Australian"], value="British")
     output_audio = gr.Audio(label="Generated Speech", type="filepath")
     generate_button = gr.Button("Generate Speech")
     generate_button.click(
+        custom_tts,
         inputs=[
+            text1, accent1,
+            text2, accent2,
+            text3, accent3,
+            text4, accent4,
+            text5, accent5,
+            text6, accent6,
+            text7, accent7,
+            text8, accent8,
+            text9, accent9,
+            text10, accent10
+        ],
         outputs=output_audio
     )
 if __name__ == "__main__":
+    demo.launch()