Spaces:

ayousanz
/

piper-plus-demo

Running

App Files Community

ayousanz committed on Aug 21

Commit

4956922

verified ·

1 Parent(s): 9ff78c7

Update from GitHub Actions - 2025-08-21 14:44:46

Browse files

Files changed (1) hide show

app.py +67 -84

app.py CHANGED Viewed

@@ -300,9 +300,8 @@ def synthesize_speech(
 def create_interface():
     """Create Gradio interface"""
-    try:
-        with gr.Blocks(title="Piper TTS Demo") as interface:
-            gr.Markdown("""
             # 🎙️ Piper TTS Demo
             High-quality text-to-speech synthesis supporting Japanese and English.
@@ -310,64 +309,64 @@ def create_interface():
             This demo uses ONNX models for fast CPU inference.
             """)
-            with gr.Row():
-                with gr.Column(scale=2):
-                    model_dropdown = gr.Dropdown(
-                        choices=list(MODELS.keys()),
-                        label="Select Model",
-                        value=list(MODELS.keys())[0],
-                    )
-                    text_input = gr.Textbox(
-                        label="Text to synthesize",
-                        placeholder="Enter text here...",
-                        lines=3,
-                    )
-                    # Advanced Settings without Accordion (flattened)
-                    gr.Markdown("### Advanced Settings")
-                    speaker_id = gr.Number(
-                        label="Speaker ID (for multi-speaker models)",
-                        value=0,
-                        minimum=0,
-                        maximum=10,
-                    )
-                    length_scale = gr.Slider(
-                        label="Speed (Lower = faster speech)",
-                        minimum=0.5,
-                        maximum=2.0,
-                        value=1.0,
-                        step=0.1,
-                    )
-                    noise_scale = gr.Slider(
-                        label="Expressiveness",
-                        minimum=0.0,
-                        maximum=1.0,
-                        value=0.667,
-                        step=0.01,
-                    )
-                    noise_w = gr.Slider(
-                        label="Phoneme Duration Variance",
-                        minimum=0.0,
-                        maximum=1.0,
-                        value=0.8,
-                        step=0.01,
-                    )
-                synthesize_btn = gr.Button("Generate Speech", variant="primary")
-            with gr.Column(scale=1):
-                audio_output = gr.Audio(
-                    label="Generated Speech",
-                    type="numpy",
-                    autoplay=True,
                 )
-                gr.Markdown("""
                 ### Tips:
                 - Japanese model expects hiragana/kanji text
                 - English model works with standard text
@@ -406,17 +405,13 @@ def create_interface():
             outputs=audio_output,
         )
-        return interface
-    except Exception as e:
-        logger.error(f"Failed to create main interface: {e}")
-        # Fallback to minimal interface
-        return create_minimal_interface()
 def create_minimal_interface():
     """Create a minimal fallback interface if main interface fails"""
-    with gr.Blocks(title="Piper TTS Demo - Minimal") as interface:
-        gr.Markdown("# Piper TTS Demo (Minimal Mode)")
         text_input = gr.Textbox(
             label="Text to synthesize",
@@ -451,22 +446,10 @@ def create_minimal_interface():
 interface = None
 if __name__ == "__main__":
-    # Create interface inside main block
     interface = create_interface()
-    try:
-        # Launch with settings for Gradio 5.x
-        interface.launch(
-            server_name="0.0.0.0",
-            server_port=7860,
-            show_api=False,  # Disable API documentation for cleaner UI
-        )
-    except Exception as e:
-        logger.error(f"Failed to launch interface: {e}")
-        # Try minimal launch
-        minimal_interface = create_minimal_interface()
-        minimal_interface.launch(
-            server_name="0.0.0.0",
-            server_port=7860,
-            show_api=False,
-        )

 def create_interface():
     """Create Gradio interface"""
+    with gr.Blocks(title="Piper TTS Demo") as interface:
+        gr.Markdown("""
             # 🎙️ Piper TTS Demo
             High-quality text-to-speech synthesis supporting Japanese and English.
             This demo uses ONNX models for fast CPU inference.
             """)
+        with gr.Row():
+            with gr.Column(scale=2):
+                model_dropdown = gr.Dropdown(
+                    choices=list(MODELS.keys()),
+                    label="Select Model",
+                    value=list(MODELS.keys())[0],
+                )
+                text_input = gr.Textbox(
+                    label="Text to synthesize",
+                    placeholder="Enter text here...",
+                    lines=3,
+                )
+                # Advanced Settings without Accordion (flattened)
+                gr.Markdown("### Advanced Settings")
+                speaker_id = gr.Number(
+                    label="Speaker ID (for multi-speaker models)",
+                    value=0,
+                    minimum=0,
+                    maximum=10,
+                )
+                length_scale = gr.Slider(
+                    label="Speed (Lower = faster speech)",
+                    minimum=0.5,
+                    maximum=2.0,
+                    value=1.0,
+                    step=0.1,
                 )
+                noise_scale = gr.Slider(
+                    label="Expressiveness",
+                    minimum=0.0,
+                    maximum=1.0,
+                    value=0.667,
+                    step=0.01,
+                )
+                noise_w = gr.Slider(
+                    label="Phoneme Duration Variance",
+                    minimum=0.0,
+                    maximum=1.0,
+                    value=0.8,
+                    step=0.01,
+                )
+            synthesize_btn = gr.Button("Generate Speech", variant="primary")
+        with gr.Column(scale=1):
+            audio_output = gr.Audio(
+                label="Generated Speech",
+                type="numpy",
+                autoplay=True,
+            )
+            gr.Markdown("""
                 ### Tips:
                 - Japanese model expects hiragana/kanji text
                 - English model works with standard text
             outputs=audio_output,
         )
+    return interface
 def create_minimal_interface():
     """Create a minimal fallback interface if main interface fails"""
+    with gr.Blocks(title="Piper TTS Demo") as interface:
+        gr.Markdown("# 🎙️ Piper TTS Demo")
         text_input = gr.Textbox(
             label="Text to synthesize",
 interface = None
 if __name__ == "__main__":
+    # Create and launch interface
     interface = create_interface()
+    interface.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        show_api=False,  # Disable API documentation for cleaner UI
+    )