Spaces:

ovieyra21
/

tts-fair-spa

Runtime error

App Files Community

ovieyra21 committed on Jun 25

Commit

70a7607

•

1 Parent(s): 60fcc9c

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -15

app.py CHANGED Viewed

@@ -4,7 +4,6 @@ import torch
 from fairseq.checkpoint_utils import load_model_ensemble_and_task_from_hf_hub
 from huggingface_hub import login
 # Obtener el token desde las variables de entorno
 hf_token = os.getenv("HF_TOKEN")
 if hf_token is None:
@@ -14,9 +13,14 @@ if hf_token is None:
 login(hf_token)
 # Intentar cargar el modelo
 try:
-    models, cfg, task = load_model_ensemble_and_task_from_hf_hub("gitgato/speecht5_tts_mabama_es"
-    )
     if not models:
         raise RuntimeError("No se pudo cargar el modelo. Asegúrate de que el nombre del modelo es correcto y que está disponible en Hugging Face Hub.")
     model = models[0]
@@ -25,24 +29,28 @@ except Exception as e:
 # Función para generar la salida de texto a voz
 def text_to_speech(text):
-    # Preprocesamiento del texto
-    tokens = task.source_dictionary.encode_line(text, add_if_not_exist=False)
-    # Generar salida de audio
-    with torch.no_grad():
-        sample = {"net_input": {"src_tokens": tokens.unsqueeze(0).long()}}
-        generator = task.build_generator([model], cfg.generation)
-        audio = task.inference_step(generator, [model], sample)
-    return audio[0][0].numpy()
 # Crear interfaz de Gradio
 iface = gr.Interface(
     fn=text_to_speech,
     inputs=gr.inputs.Textbox(lines=2, placeholder="Ingrese el texto aquí..."),
-    outputs=gr.outputs.Audio(type="numpy", label="Output Audio")
 )
 if __name__ == "__main__":
     iface.launch()
-add_to_git_credential=True

 from fairseq.checkpoint_utils import load_model_ensemble_and_task_from_hf_hub
 from huggingface_hub import login
 # Obtener el token desde las variables de entorno
 hf_token = os.getenv("HF_TOKEN")
 if hf_token is None:
 login(hf_token)
 # Intentar cargar el modelo
+# Load model directly
+processor = AutoProcessor.from_pretrained("ovieyra21/es_speecht5_tts_mabama")
+model = AutoModelForTextToSpectrogram.from_pretrained("ovieyra21/es_speecht5_tts_mabama")
 try:
+    models, cfg, task = load_model_ensemble_and_task_from_hf_hub("ovieyra21/es_speecht5_tts_mabama")
     if not models:
         raise RuntimeError("No se pudo cargar el modelo. Asegúrate de que el nombre del modelo es correcto y que está disponible en Hugging Face Hub.")
     model = models[0]
 # Función para generar la salida de texto a voz
 def text_to_speech(text):
+    try:
+        # Preprocesamiento del texto
+        tokens = task.source_dictionary.encode_line(text, add_if_not_exist=False)
+        # Generar salida de audio
+        with torch.no_grad():
+            sample = {"net_input": {"src_tokens": tokens.unsqueeze(0).long()}}
+            generator = task.build_generator([model], cfg.generation)
+            audio = task.inference_step(generator, [model], sample)
+        return audio[0][0].numpy()
+    except Exception as e:
+        return f"Error en la generación de audio: {e}"
 # Crear interfaz de Gradio
 iface = gr.Interface(
     fn=text_to_speech,
     inputs=gr.inputs.Textbox(lines=2, placeholder="Ingrese el texto aquí..."),
+    outputs=gr.outputs.Audio(type="numpy", label="Output Audio"),
+    title="Conversor de Texto a Voz",
+    description="Ingrese texto para convertirlo a voz utilizando el modelo speecht5_tts_mabama_es."
 )
 if __name__ == "__main__":
     iface.launch()