Spaces:

gnosticdev
/

INVIDEO_BASIC

Sleeping

App Files Community

gnosticdev committed 6 days ago

Commit

b0e58a6

verified ·

1 Parent(s): ebafac2

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -66

app.py CHANGED Viewed

@@ -9,7 +9,6 @@ import torch
 from transformers import GPT2Tokenizer, GPT2LMHeadModel
 from keybert import KeyBERT
 from TTS.api import TTS
-# Importación correcta: Solo 'concatenate_videoclips'
 from moviepy.editor import VideoFileClip, concatenate_videoclips, AudioFileClip, CompositeAudioClip, concatenate_audioclips, AudioClip
 import re
 import math
@@ -133,9 +132,9 @@ def generate_script(prompt, max_length=150):
         cleaned_text = text.strip()
         try:
-            instruction_end_idx = text.find(instruction_phrase)
             if instruction_end_idx != -1:
-                cleaned_text = text[instruction_end_idx + len(instruction_phrase):].strip()
                 logger.debug("Instrucción inicial encontrada y eliminada del guión generado.")
             else:
                  instruction_start_idx = text.find(instruction_phrase_start)
@@ -178,8 +177,6 @@ def generate_script(prompt, max_length=150):
         logger.warning("Usando prompt original como guion debido al error de generación.")
         return prompt.strip()
-from TTS.api import TTS
 def text_to_speech(text, output_path, voice=None):
     logger.info(f"Convirtiendo texto a voz con Coqui TTS | Caracteres: {len(text)} | Salida: {output_path}")
     if not text or not text.strip():
@@ -191,6 +188,7 @@ def text_to_speech(text, output_path, voice=None):
         tts = TTS(model_name="tts_models/es/css10/vits", progress_bar=False, gpu=False)
         # Limpiar y truncar texto
         text = re.sub(r'[^\w\s.,!?áéíóúñÁÉÍÓÚÑ]', '', text)
         if len(text) > 500:
             logger.warning("Texto demasiado largo, truncando a 500 caracteres")
@@ -210,8 +208,6 @@ def text_to_speech(text, output_path, voice=None):
     except Exception as e:
         logger.error(f"Error TTS: {str(e)}", exc_info=True)
         return False
-        #FIN DE ESTA MIERDA
 def download_video_file(url, temp_dir):
     if not url:
@@ -305,7 +301,6 @@ def loop_audio_to_length(audio_clip, target_duration):
             try: looped_audio.close()
             except: pass
 def extract_visual_keywords_from_script(script_text):
     logger.info("Extrayendo palabras clave del guion")
     if not script_text or not script_text.strip():
@@ -392,40 +387,23 @@ def crear_video(prompt_type, input_text, musica_file=None):
             logger.error("El guion resultante está vacío o solo contiene espacios.")
             raise ValueError("El guion está vacío.")
         temp_dir_intermediate = tempfile.mkdtemp(prefix="video_gen_intermediate_")
         logger.info(f"Directorio temporal intermedio creado: {temp_dir_intermediate}")
         temp_intermediate_files = []
-        # 2. Generar audio de voz con reintentos y voz de respaldo
         logger.info("Generando audio de voz...")
         voz_path = os.path.join(temp_dir_intermediate, "voz.mp3")
-        primary_voice = "es-ES-JuanNeural"
-        fallback_voice = "es-ES-ElviraNeural" # Otra voz en español
-        tts_success = False
-        retries = 3
-        for attempt in range(retries):
-            current_voice = primary_voice if attempt == 0 else fallback_voice
-            if attempt > 0: logger.warning(f"Reintentando TTS ({attempt+1}/{retries})...")
-            logger.info(f"Intentando TTS con voz: {current_voice}")
-            try:
-                tts_success = asyncio.run(text_to_speech(guion, voz_path, voice=current_voice))
-                if tts_success:
-                    logger.info(f"TTS exitoso en intento {attempt + 1} con voz {current_voice}.")
-                    break
-            except Exception as e:
-                 pass
-            if not tts_success and attempt == 0 and primary_voice != fallback_voice:
-                 logger.warning(f"Fallo con voz {primary_voice}, intentando voz de respaldo: {fallback_voice}")
-            elif not tts_success and attempt < retries - 1:
-                 logger.warning(f"Fallo con voz {current_voice}, reintentando...")
-        if not tts_success or not os.path.exists(voz_path) or os.path.getsize(voz_path) <= 100:
-             logger.error(f"Fallo en la generación de voz después de {retries} intentos. Archivo de audio no creado o es muy pequeño.")
-             raise ValueError("Error generando voz a partir del guion (fallo de TTS).")
         temp_intermediate_files.append(voz_path)
@@ -655,7 +633,6 @@ def crear_video(prompt_type, input_text, musica_file=None):
                                    try: clip.close()
                                    except: pass
         if final_video_base.duration > audio_duration:
              logger.info(f"Recortando video base ({final_video_base.duration:.2f}s) para que coincida con la duración del audio ({audio_duration:.2f}s).")
              trimmed_video_base = None
@@ -675,7 +652,6 @@ def crear_video(prompt_type, input_text, musica_file=None):
                 logger.critical(f"Error durante el recorte: {str(e)}", exc_info=True)
                 raise ValueError("Fallo durante el recorte de video.")
         if final_video_base is None or final_video_base.duration is None or final_video_base.duration <= 0:
              logger.critical("Video base final es inválido antes de audio/escritura (None o duración cero).")
              raise ValueError("Video base final es inválido.")
@@ -718,7 +694,6 @@ def crear_video(prompt_type, input_text, musica_file=None):
                           except: pass
                           musica_audio_looped = None
                 if musica_audio_looped:
                     composite_audio = CompositeAudioClip([
                         musica_audio_looped.volumex(0.2), # Volumen 20% para música
@@ -741,7 +716,6 @@ def crear_video(prompt_type, input_text, musica_file=None):
                 musica_audio = None
                 logger.warning("Usando solo audio de voz debido a un error con la música.")
         if final_audio.duration is not None and abs(final_audio.duration - video_base.duration) > 0.2:
             logger.warning(f"Duración del audio final ({final_audio.duration:.2f}s) difiere significativamente del video base ({video_base.duration:.2f}s). Intentando recorte.")
             try:
@@ -773,7 +747,6 @@ def crear_video(prompt_type, input_text, musica_file=None):
         logger.info(f"Escribiendo video final a: {output_path}")
         video_final.write_videofile(
-            output_path,
             fps=24,
             threads=4,
             codec="libx264",
@@ -858,8 +831,6 @@ def crear_video(prompt_type, input_text, musica_file=None):
              logger.info(f"Directorio temporal intermedio {temp_dir_intermediate} persistirá para que Gradio lea el video final.")
-# La función run_app ahora recibe todos los inputs de texto y el archivo de música
 def run_app(prompt_type, prompt_ia, prompt_manual, musica_file):
     logger.info("="*80)
     logger.info("SOLICITUD RECIBIDA EN INTERFAZ")
@@ -873,7 +844,6 @@ def run_app(prompt_type, prompt_ia, prompt_manual, musica_file):
     if not input_text or not input_text.strip():
         logger.warning("Texto de entrada vacío.")
-        # Retornar None para video y archivo, actualizar estado con mensaje de error
         return None, None, gr.update(value="⚠️ Por favor, ingresa texto para el guion o el tema.", interactive=False)
     logger.info(f"Tipo de entrada: {prompt_type}")
@@ -885,14 +855,13 @@ def run_app(prompt_type, prompt_ia, prompt_manual, musica_file):
     try:
         logger.info("Llamando a crear_video...")
-        # Pasar el input_text elegido y el archivo de música a crear_video
         video_path = crear_video(prompt_type, input_text, musica_file)
         if video_path and os.path.exists(video_path):
             logger.info(f"crear_video retornó path: {video_path}")
             logger.info(f"Tamaño del archivo de video retornado: {os.path.getsize(video_path)} bytes")
-            output_video = video_path # Establecer valor del componente de video
-            output_file = video_path   # Establecer valor del componente de archivo para descarga
             status_msg = gr.update(value="✅ Video generado exitosamente.", interactive=False)
         else:
             logger.error(f"crear_video no retornó un path válido o el archivo no existe: {video_path}")
@@ -906,10 +875,8 @@ def run_app(prompt_type, prompt_ia, prompt_manual, musica_file):
         status_msg = gr.update(value=f"❌ Error inesperado: {str(e)}", interactive=False)
     finally:
         logger.info("Fin del handler run_app.")
-        # Retornar las tres salidas esperadas por el evento click
         return output_video, output_file, status_msg
 # Interfaz de Gradio
 with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft(), css="""
     .gradio-container {max-width: 800px; margin: auto;}
@@ -927,8 +894,6 @@ with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft(), css="
                 value="Generar Guion con IA"
             )
-            # Contenedores para los campos de texto para controlar la visibilidad
-            # Nombrados para que coincidan con los outputs del evento change
             with gr.Column(visible=True) as ia_guion_column:
                 prompt_ia = gr.Textbox(
                     label="Tema para IA",
@@ -965,7 +930,7 @@ with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft(), css="
             file_output = gr.File(
                 label="Descargar Archivo de Video",
                 interactive=False,
-                visible=False # Ocultar inicialmente
             )
             status_output = gr.Textbox(
                 label="Estado",
@@ -975,42 +940,27 @@ with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft(), css="
                 value="Esperando entrada..."
             )
-    # Evento para mostrar/ocultar los campos de texto según el tipo de prompt
-    # Apuntar a los componentes Column padre para controlar la visibilidad
     prompt_type.change(
         lambda x: (gr.update(visible=x == "Generar Guion con IA"),
                    gr.update(visible=x == "Usar Mi Guion")),
         inputs=prompt_type,
-        # Pasar los componentes Column
         outputs=[ia_guion_column, manual_guion_column]
     )
-    # Evento click del botón de generar video
     generate_btn.click(
-        # Acción 1 (síncrona): Resetear salidas y establecer estado a procesando
-        # Retorna None para los 3 outputs iniciales
         lambda: (None, None, gr.update(value="⏳ Procesando... Esto puede tomar varios minutos.", interactive=False)),
         outputs=[video_output, file_output, status_output],
-        queue=True, # Usar la cola de Gradio para tareas largas
     ).then(
-        # Acción 2 (asíncrona): Llamar a la función principal de procesamiento
         run_app,
-        # PASAR TODOS LOS INPUTS DE LA INTERFAZ que run_app espera
         inputs=[prompt_type, prompt_ia, prompt_manual, musica_input],
-        # run_app retornará los 3 outputs esperados aquí
         outputs=[video_output, file_output, status_output]
     ).then(
-        # Acción 3 (síncrona): Hacer visible el enlace de descarga si se retornó un archivo
-        # Esta función recibe las salidas de la Acción 2 (video_path, file_path, status_msg)
-        # Solo necesitamos video_path o file_path para decidir si mostrar el enlace
         lambda video_path, file_path, status_msg: gr.update(visible=file_path is not None),
-        # Inputs son las salidas de la función .then() anterior
         inputs=[video_output, file_output, status_output],
-        # Actualizamos la visibilidad del componente file_output
         outputs=[file_output]
     )
     gr.Markdown("### Instrucciones:")
     gr.Markdown("""
     1.  **Clave API de Pexels:** Asegúrate de haber configurado la variable de entorno `PEXELS_API_KEY` con tu clave.

 from transformers import GPT2Tokenizer, GPT2LMHeadModel
 from keybert import KeyBERT
 from TTS.api import TTS
 from moviepy.editor import VideoFileClip, concatenate_videoclips, AudioFileClip, CompositeAudioClip, concatenate_audioclips, AudioClip
 import re
 import math
         cleaned_text = text.strip()
         try:
+            instruction_end_idx = text.find(instruction_phrase_start)
             if instruction_end_idx != -1:
+                cleaned_text = text[instruction_end_idx + len(instruction_phrase_start):].strip()
                 logger.debug("Instrucción inicial encontrada y eliminada del guión generado.")
             else:
                  instruction_start_idx = text.find(instruction_phrase_start)
         logger.warning("Usando prompt original como guion debido al error de generación.")
         return prompt.strip()
 def text_to_speech(text, output_path, voice=None):
     logger.info(f"Convirtiendo texto a voz con Coqui TTS | Caracteres: {len(text)} | Salida: {output_path}")
     if not text or not text.strip():
         tts = TTS(model_name="tts_models/es/css10/vits", progress_bar=False, gpu=False)
         # Limpiar y truncar texto
+        text = text.replace("na hora", "A la hora")
         text = re.sub(r'[^\w\s.,!?áéíóúñÁÉÍÓÚÑ]', '', text)
         if len(text) > 500:
             logger.warning("Texto demasiado largo, truncando a 500 caracteres")
     except Exception as e:
         logger.error(f"Error TTS: {str(e)}", exc_info=True)
         return False
 def download_video_file(url, temp_dir):
     if not url:
             try: looped_audio.close()
             except: pass
 def extract_visual_keywords_from_script(script_text):
     logger.info("Extrayendo palabras clave del guion")
     if not script_text or not script_text.strip():
             logger.error("El guion resultante está vacío o solo contiene espacios.")
             raise ValueError("El guion está vacío.")
+        # Corregir error tipográfico en el guion
+        guion = guion.replace("na hora", "A la hora")
         temp_dir_intermediate = tempfile.mkdtemp(prefix="video_gen_intermediate_")
         logger.info(f"Directorio temporal intermedio creado: {temp_dir_intermediate}")
         temp_intermediate_files = []
+        # 2. Generar audio de voz
         logger.info("Generando audio de voz...")
         voz_path = os.path.join(temp_dir_intermediate, "voz.mp3")
+        # Llamar a text_to_speech directamente
+        tts_success = text_to_speech(guion, voz_path)
+        if not tts_success or not os.path.exists(voz_path) or os.path.getsize(voz_path) <= 1000:
+            logger.error(f"Fallo en la generación de voz. Archivo de audio no creado o es muy pequeño: {voz_path}")
+            raise ValueError("Error generando voz a partir del guion (fallo de TTS).")
         temp_intermediate_files.append(voz_path)
                                    try: clip.close()
                                    except: pass
         if final_video_base.duration > audio_duration:
              logger.info(f"Recortando video base ({final_video_base.duration:.2f}s) para que coincida con la duración del audio ({audio_duration:.2f}s).")
              trimmed_video_base = None
                 logger.critical(f"Error durante el recorte: {str(e)}", exc_info=True)
                 raise ValueError("Fallo durante el recorte de video.")
         if final_video_base is None or final_video_base.duration is None or final_video_base.duration <= 0:
              logger.critical("Video base final es inválido antes de audio/escritura (None o duración cero).")
              raise ValueError("Video base final es inválido.")
                           except: pass
                           musica_audio_looped = None
                 if musica_audio_looped:
                     composite_audio = CompositeAudioClip([
                         musica_audio_looped.volumex(0.2), # Volumen 20% para música
                 musica_audio = None
                 logger.warning("Usando solo audio de voz debido a un error con la música.")
         if final_audio.duration is not None and abs(final_audio.duration - video_base.duration) > 0.2:
             logger.warning(f"Duración del audio final ({final_audio.duration:.2f}s) difiere significativamente del video base ({video_base.duration:.2f}s). Intentando recorte.")
             try:
         logger.info(f"Escribiendo video final a: {output_path}")
         video_final.write_videofile(
             fps=24,
             threads=4,
             codec="libx264",
              logger.info(f"Directorio temporal intermedio {temp_dir_intermediate} persistirá para que Gradio lea el video final.")
 def run_app(prompt_type, prompt_ia, prompt_manual, musica_file):
     logger.info("="*80)
     logger.info("SOLICITUD RECIBIDA EN INTERFAZ")
     if not input_text or not input_text.strip():
         logger.warning("Texto de entrada vacío.")
         return None, None, gr.update(value="⚠️ Por favor, ingresa texto para el guion o el tema.", interactive=False)
     logger.info(f"Tipo de entrada: {prompt_type}")
     try:
         logger.info("Llamando a crear_video...")
         video_path = crear_video(prompt_type, input_text, musica_file)
         if video_path and os.path.exists(video_path):
             logger.info(f"crear_video retornó path: {video_path}")
             logger.info(f"Tamaño del archivo de video retornado: {os.path.getsize(video_path)} bytes")
+            output_video = video_path
+            output_file = video_path
             status_msg = gr.update(value="✅ Video generado exitosamente.", interactive=False)
         else:
             logger.error(f"crear_video no retornó un path válido o el archivo no existe: {video_path}")
         status_msg = gr.update(value=f"❌ Error inesperado: {str(e)}", interactive=False)
     finally:
         logger.info("Fin del handler run_app.")
         return output_video, output_file, status_msg
 # Interfaz de Gradio
 with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft(), css="""
     .gradio-container {max-width: 800px; margin: auto;}
                 value="Generar Guion con IA"
             )
             with gr.Column(visible=True) as ia_guion_column:
                 prompt_ia = gr.Textbox(
                     label="Tema para IA",
             file_output = gr.File(
                 label="Descargar Archivo de Video",
                 interactive=False,
+                visible=False
             )
             status_output = gr.Textbox(
                 label="Estado",
                 value="Esperando entrada..."
             )
     prompt_type.change(
         lambda x: (gr.update(visible=x == "Generar Guion con IA"),
                    gr.update(visible=x == "Usar Mi Guion")),
         inputs=prompt_type,
         outputs=[ia_guion_column, manual_guion_column]
     )
     generate_btn.click(
         lambda: (None, None, gr.update(value="⏳ Procesando... Esto puede tomar varios minutos.", interactive=False)),
         outputs=[video_output, file_output, status_output],
+        queue=True,
     ).then(
         run_app,
         inputs=[prompt_type, prompt_ia, prompt_manual, musica_input],
         outputs=[video_output, file_output, status_output]
     ).then(
         lambda video_path, file_path, status_msg: gr.update(visible=file_path is not None),
         inputs=[video_output, file_output, status_output],
         outputs=[file_output]
     )
     gr.Markdown("### Instrucciones:")
     gr.Markdown("""
     1.  **Clave API de Pexels:** Asegúrate de haber configurado la variable de entorno `PEXELS_API_KEY` con tu clave.