Spaces:

Mynameisju
/

Aceh-tts

Sleeping

Mynameisju committed on Jun 13

Commit

ebf2718

verified ·

1 Parent(s): 37eaa38

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,9 +1,8 @@
 import torch
 import gradio as gr
-import torchaudio
 from transformers import VitsModel, VitsTokenizer
-from numToAce import convert_number_to_aceh
 model_id = "facebook/mms-tts-ace"
 tokenizer = VitsTokenizer.from_pretrained(model_id)
 model = VitsModel.from_pretrained(model_id)
@@ -11,23 +10,27 @@ model = VitsModel.from_pretrained(model_id)
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model.to(device)
 def tts_aceh(text):
-    text = convert_number_to_aceh(text)
     inputs = tokenizer(text, return_tensors="pt").to(device)
     with torch.no_grad():
-        outputs = model(**inputs)
-    waveform = outputs.waveform.squeeze().cpu()
     sample_rate = model.config.sampling_rate
     return (sample_rate, waveform)
 demo = gr.Interface(
     fn=tts_aceh,
-    inputs=gr.Textbox(label="Nhập văn bản tiếng Aceh"),
-    outputs=gr.Audio(label="Giọng đọc tiếng Aceh"),
-    title="TTS tiếng Aceh (MMS-VITS)",
-    description="Mô hình VITS từ Meta AI, hoạt động trực tiếp với Gradio"
 )
 if __name__ == "__main__":

 import torch
 import gradio as gr
 from transformers import VitsModel, VitsTokenizer
+# Load the TTS model and tokenizer for Acehnese
 model_id = "facebook/mms-tts-ace"
 tokenizer = VitsTokenizer.from_pretrained(model_id)
 model = VitsModel.from_pretrained(model_id)
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model.to(device)
+# TTS function
 def tts_aceh(text):
     inputs = tokenizer(text, return_tensors="pt").to(device)
     with torch.no_grad():
+        output = model(**inputs)
+    waveform = output.waveform[0].cpu().numpy()
     sample_rate = model.config.sampling_rate
     return (sample_rate, waveform)
+# Gradio UI
 demo = gr.Interface(
     fn=tts_aceh,
+    inputs=gr.Textbox(label="Enter Acehnese text"),
+    outputs=gr.Audio(type="numpy", label="Generated Speech"),
+    title="Acehnese TTS (Text-to-Speech)",
+    description=(
+        "This is a text-to-speech tool for the Acehnese language using Meta's MMS model. "
+        "To use: 1) Enter text in Acehnese, 2) Click Submit to hear it spoken aloud.\n\n"
+        "Note: Reuse, redistribution, or derivative use is not allowed unless you ask for permission. "
+        "Enjoy responsibly, and feel free to share feedback or support!"
+    )
 )
 if __name__ == "__main__":