Spaces:

tsuching
/

Tibetan-tts

Running

App Files Community

tsuching committed 17 days ago

Commit

f340b44

verified ·

1 Parent(s): 6e312f5

Update app.py

Browse files

Files changed (1) hide show

app.py +47 -5

app.py CHANGED Viewed

@@ -288,17 +288,37 @@ def get_all_phonetics_schemes(text):
 # Tibetan TTS function
-def run_task_tts(text):
     # Always return: [audio_numpy, audio_filepath, text_output]
     # 1) Generate speech via MMS-TTS
-    speech = tts_tibetan(text)
     # 2) Clip, cast, flatten for Gradio (browser playback expects float32 in [-1, 1])
     audio = speech["audio"]
     sr = int(speech["sampling_rate"])
     audio = np.clip(audio.astype(np.float32), -1.0, 1.0).flatten()
-    # 3) Write a WAV file for download/Flutter using PCM_16 to avoid pydub header errors
     tmpfile = tempfile.NamedTemporaryFile(delete=False, suffix=".wav")
     sf.write(tmpfile.name, audio, sr, subtype="PCM_16")
     # 4) Return both audio forms + a status message
     return (sr, audio), tmpfile.name, "Tibetan audio generated successfully!"
@@ -567,15 +587,36 @@ def generate_tts_file(text: str) -> str:
     _, file_path, _ = run_task_tts(text)  # unpack tuple
     return file_path
 @api.post("/api/tts")
 async def api_tts(request: gr.Request):
     body = await request.json()
     text = body.get("text", "")
-    if not text:
         return {"error": "No text provided"}
-    output_path = generate_tts_file(text)
     return FileResponse(
         output_path,
@@ -584,6 +625,7 @@ async def api_tts(request: gr.Request):
     )
 #############################################
 # 🔥 Attach your existing Gradio UI
 #############################################

 # Tibetan TTS function
+#def run_task_tts(text):
     # Always return: [audio_numpy, audio_filepath, text_output]
     # 1) Generate speech via MMS-TTS
+#    speech = tts_tibetan(text)
+    # 2) Clip, cast, flatten for Gradio (browser playback expects float32 in [-1, 1])
+#    audio = speech["audio"]
+#    sr = int(speech["sampling_rate"])
+#    audio = np.clip(audio.astype(np.float32), -1.0, 1.0).flatten()
+    # 3) Write a WAV file for download/Flutter using PCM_16 to avoid pydub header errors
+#    tmpfile = tempfile.NamedTemporaryFile(delete=False, suffix=".wav")
+#    sf.write(tmpfile.name, audio, sr, subtype="PCM_16")
+    # 4) Return both audio forms + a status message
+#    return (sr, audio), tmpfile.name, "Tibetan audio generated successfully!"
+def run_task_tts(text: str):
+    # Ensure input is a string
+    if not isinstance(text, str):
+        text = str(text)
+    # 1) Generate speech via MMS-TTS
+    speech = tts_tibetan(text)  # pipeline expects plain string
     # 2) Clip, cast, flatten for Gradio (browser playback expects float32 in [-1, 1])
     audio = speech["audio"]
     sr = int(speech["sampling_rate"])
     audio = np.clip(audio.astype(np.float32), -1.0, 1.0).flatten()
+    # 3) Write a WAV file for download/Flutter using PCM_16
     tmpfile = tempfile.NamedTemporaryFile(delete=False, suffix=".wav")
     sf.write(tmpfile.name, audio, sr, subtype="PCM_16")
     # 4) Return both audio forms + a status message
     return (sr, audio), tmpfile.name, "Tibetan audio generated successfully!"
     _, file_path, _ = run_task_tts(text)  # unpack tuple
     return file_path
+#@api.post("/api/tts")
+#async def api_tts(request: gr.Request):
+#    body = await request.json()
+#    text = body.get("text", "")
+#    if not text:
+#        return {"error": "No text provided"}
+#    output_path = generate_tts_file(text)
+#    return FileResponse(
+#        output_path,
+#        media_type="audio/wav",
+#        filename="tts.wav"
+#    )
 @api.post("/api/tts")
 async def api_tts(request: gr.Request):
     body = await request.json()
     text = body.get("text", "")
+    # ✅ Ensure text is always a string
+    if not isinstance(text, str):
+        text = str(text)
+    if not text.strip():
         return {"error": "No text provided"}
+    # Call your wrapper
+    _, output_path, status = run_task_tts(text)
     return FileResponse(
         output_path,
     )
 #############################################
 # 🔥 Attach your existing Gradio UI
 #############################################