Spaces:

ayousanz
/

piper-plus-demo

Running

App Files Community

ayousanz committed on Aug 21

Commit

9ff78c7

verified ·

1 Parent(s): aca1362

Update from GitHub Actions - 2025-08-21 11:46:08

Browse files

Files changed (3) hide show

README.md +2 -2
app.py +79 -11
requirements.txt +2 -3

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ emoji: 🎙️
 colorFrom: blue
 colorTo: purple
 sdk: gradio
-sdk_version: 3.50.2
 app_file: app.py
 pinned: false
 license: mit
@@ -67,4 +67,4 @@ python app.py
 This project is licensed under the MIT License. See the original [Piper repository](https://github.com/rhasspy/piper) for more details.
 ---
-_Last updated: 2025-01-21 - Cache rebuild for Gradio 3.50.2_

 colorFrom: blue
 colorTo: purple
 sdk: gradio
+sdk_version: 5.0.0
 app_file: app.py
 pinned: false
 license: mit
 This project is licensed under the MIT License. See the original [Piper repository](https://github.com/rhasspy/piper) for more details.
 ---
+_Last updated: 2025-01-21 - Upgraded to Gradio 5.0.0 for security fixes_

app.py CHANGED Viewed

@@ -45,6 +45,57 @@ MODELS = {
     },
 }
 # Japanese multi-character phoneme to Unicode PUA mapping
 # This mapping must match the C++ implementation and training data
 PHONEME_TO_PUA = {
@@ -113,7 +164,7 @@ def text_to_phonemes(text: str, language: str) -> list[str]:
             # Add sentence markers
             phonemes = ["^"] + phonemes + ["$"]
             # Convert multi-character phonemes to Unicode PUA
             phonemes = map_phonemes(phonemes)
         else:
@@ -127,10 +178,28 @@ def text_to_phonemes(text: str, language: str) -> list[str]:
         # Convert phoneme string to list
         phonemes = ["^"] + list(phoneme_str.replace(" ", "")) + ["$"]
     else:
-        logger.warning("espeak_phonemizer not available, using character fallback")
-        # Character-based fallback - filter non-alphabetic characters
-        cleaned_text = "".join(c.lower() for c in text if c.isalpha() or c.isspace())
-        phonemes = ["^"] + list(cleaned_text) + ["$"]
     return phonemes
@@ -261,7 +330,8 @@ def create_interface():
                     speaker_id = gr.Number(
                         label="Speaker ID (for multi-speaker models)",
                         value=0,
-                        precision=0,
                     )
                     length_scale = gr.Slider(
@@ -383,15 +453,13 @@ interface = None
 if __name__ == "__main__":
     # Create interface inside main block
     interface = create_interface()
     try:
-        # Launch with minimal settings for Gradio 3.x
         interface.launch(
             server_name="0.0.0.0",
             server_port=7860,
-            show_api=False,  # Disable API documentation
-            show_error=True,
-            quiet=False,
         )
     except Exception as e:
         logger.error(f"Failed to launch interface: {e}")

     },
 }
+# Basic English word to IPA mapping for common words
+# This is a simplified fallback when espeak-ng is not available
+ENGLISH_IPA_MAP = {
+    "hello": "hɛloʊ",
+    "world": "wɜrld",
+    "this": "ðɪs",
+    "is": "ɪz",
+    "a": "ə",
+    "test": "tɛst",
+    "text": "tɛkst",
+    "to": "tu",
+    "speech": "spitʃ",
+    "demo": "dɛmoʊ",
+    "welcome": "wɛlkəm",
+    "piper": "paɪpər",
+    "tts": "titiɛs",
+    "enjoy": "ɛndʒɔɪ",
+    "high": "haɪ",
+    "quality": "kwɑləti",
+    "synthesis": "sɪnθəsɪs",
+    "the": "ðə",
+    "and": "ænd",
+    "for": "fɔr",
+    "with": "wɪð",
+    "you": "ju",
+    "can": "kæn",
+    "it": "ɪt",
+    "that": "ðæt",
+    "have": "hæv",
+    "from": "frʌm",
+    "or": "ɔr",
+    "which": "wɪtʃ",
+    "one": "wʌn",
+    "would": "wʊd",
+    "all": "ɔl",
+    "will": "wɪl",
+    "there": "ðɛr",
+    "say": "seɪ",
+    "who": "hu",
+    "make": "meɪk",
+    "when": "wɛn",
+    "time": "taɪm",
+    "if": "ɪf",
+    "no": "noʊ",
+    "way": "weɪ",
+    "has": "hæz",
+    "yes": "jɛs",
+    "good": "gʊd",
+    "very": "vɛri",
+}
 # Japanese multi-character phoneme to Unicode PUA mapping
 # This mapping must match the C++ implementation and training data
 PHONEME_TO_PUA = {
             # Add sentence markers
             phonemes = ["^"] + phonemes + ["$"]
             # Convert multi-character phonemes to Unicode PUA
             phonemes = map_phonemes(phonemes)
         else:
         # Convert phoneme string to list
         phonemes = ["^"] + list(phoneme_str.replace(" ", "")) + ["$"]
     else:
+        logger.warning("espeak_phonemizer not available, using IPA fallback")
+        # IPA-based fallback for better English pronunciation
+        words = text.lower().split()
+        phonemes = ["^"]
+        for i, word in enumerate(words):
+            # Add space between words
+            if i > 0:
+                phonemes.append(" ")
+            # Remove punctuation from word
+            clean_word = "".join(c for c in word if c.isalpha())
+            if clean_word in ENGLISH_IPA_MAP:
+                # Use IPA mapping if available
+                ipa = ENGLISH_IPA_MAP[clean_word]
+                phonemes.extend(list(ipa))
+            else:
+                # Fall back to character-by-character for unknown words
+                phonemes.extend(list(clean_word))
+        phonemes.append("$")
     return phonemes
                     speaker_id = gr.Number(
                         label="Speaker ID (for multi-speaker models)",
                         value=0,
+                        minimum=0,
+                        maximum=10,
                     )
                     length_scale = gr.Slider(
 if __name__ == "__main__":
     # Create interface inside main block
     interface = create_interface()
     try:
+        # Launch with settings for Gradio 5.x
         interface.launch(
             server_name="0.0.0.0",
             server_port=7860,
+            show_api=False,  # Disable API documentation for cleaner UI
         )
     except Exception as e:
         logger.error(f"Failed to launch interface: {e}")

requirements.txt CHANGED Viewed

@@ -1,9 +1,8 @@
 # Piper TTS Demo Requirements
-gradio==3.50.2  # Stable Gradio 3.x version to avoid TypeError
-pydantic==1.10.18  # Compatible with Gradio 3.x
 numpy>=1.24.0,<3.0
 onnxruntime>=1.16.0
 pyopenjtalk>=0.3.0
 onnx>=1.14.0
 # Note: espeak-phonemizer requires system espeak-ng library
-# For simplified deployment, using character-based fallback for English

 # Piper TTS Demo Requirements
+gradio>=5.0.0  # Latest Gradio 5.x with security fixes
 numpy>=1.24.0,<3.0
 onnxruntime>=1.16.0
 pyopenjtalk>=0.3.0
 onnx>=1.14.0
 # Note: espeak-phonemizer requires system espeak-ng library
+# For simplified deployment, using IPA-based fallback for English