Spaces:

VeuReu
/

demo

Sleeping

App Files Files Community

VeuReu committed on Oct 14, 2025

Commit

9167d9a

1 Parent(s): b6cdefa

Upload 93 files

Browse files

Files changed (4) hide show

app.py +42 -41
utils.py +141 -0
videos/curtmetratge_4/MoE/une_ad.srt +11 -11
videos/curtmetratge_4/Salamandra/une_ad.srt +4 -4

app.py CHANGED Viewed

@@ -12,10 +12,15 @@ except ModuleNotFoundError:  # Py<3.11
 import streamlit as st
 from moviepy.editor import VideoFileClip
 from database import set_db_path, init_schema, get_user, create_video, update_video_status, list_videos, get_video, get_all_users, upsert_result, get_results, add_feedback, get_feedback_for_video, get_feedback_stats
 from api_client import APIClient
 from utils import ensure_dirs, save_bytes, save_text, human_size
 # -- Move DB ---
 os.environ["STREAMLIT_DATA_DIRECTORY"] = "/tmp/.streamlit"
@@ -98,7 +103,7 @@ with st.sidebar:
             st.session_state.user = None
             st.rerun()
     if st.session_state.user:
-        page = st.radio("Navegació", ["Analitzar video-transcripcions","Processar vídeo nou","Estadístiques"], index=0)
     else:
         page = None
@@ -245,9 +250,9 @@ if page == "Processar vídeo nou":
             if st.session_state.characters_saved:
                 st.button("Generar Audiodescripció")
-elif page == "Analitzar video-transcripcions":
     require_login()
-    st.header("Analitzar video-transcripcions")
     base_dir = Path("/tmp/data/videos")
     if not base_dir.exists():
@@ -321,39 +326,28 @@ elif page == "Analitzar video-transcripcions":
         c1, c2 = st.columns(2)
         with c1:
             if st.button("Reconstruir àudio amb narració lliure", use_container_width=True, key="rebuild_free_ad"):
-                if subcarpeta_seleccio:
-                    free_ad_path = vid_dir / subcarpeta_seleccio / "free_ad.txt"
-                    if free_ad_path.exists():
-                        with st.spinner("Generant àudio de la narració lliure..."):
-                            text_content = free_ad_path.read_text(encoding="utf-8")
-                            voice = "central/grau" # Voz fijada
-                            response = api.tts_matxa(text=text_content, voice=voice)
-                            if "mp3_bytes" in response:
-                                output_path = vid_dir / subcarpeta_seleccio / "free_ad.mp3"
-                                save_bytes(output_path, response["mp3_bytes"])
-                                st.success(f"Àudio generat i desat a: {output_path}")
-                            else:
-                                st.error(f"Error en la generació de l'àudio: {response.get('error', 'Desconegut')}")
-                    else:
-                        st.warning("No s'ha trobat el fitxer 'free_ad.txt' en aquesta versió.")
         with c2:
             if st.button("Reconstruir vídeo amb audiodescripció", use_container_width=True, key="rebuild_video_ad"):
-                if subcarpeta_seleccio and mp4s:
-                    une_srt_path = vid_dir / subcarpeta_seleccio / "une_ad.srt"
-                    video_original_path = mp4s[0]
-                    if une_srt_path.exists():
-                        with st.spinner("Reconstruint el vídeo amb l'audiodescripció... Aquesta operació pot trigar una estona."):
-                            response = api.rebuild_video_with_ad(video_path=str(video_original_path), srt_path=str(une_srt_path))
-                            if "video_bytes" in response:
-                                output_path = vid_dir / subcarpeta_seleccio / "video_ad_rebuilt.mp4"
-                                save_bytes(output_path, response["video_bytes"])
-                                st.success(f"Vídeo reconstruït i desat a: {output_path}")
-                                st.info("Pots visualitzar-lo activant la casella 'Afegir audiodescripció' i seleccionant el nou fitxer si cal.")
-                            else:
-                                st.error(f"Error en la reconstrucció del vídeo: {response.get('error', 'Desconegut')}")
-                    else:
-                        st.warning("No s'ha trobat el fitxer 'une_ad.srt' en aquesta versió.")
     # --- Columna Derecha (Editor de texto y guardado) ---
@@ -376,24 +370,31 @@ elif page == "Analitzar video-transcripcions":
             else:
                 st.info(f"No s'ha trobat el fitxer **{ad_filename}**.")
         else:
-            st.warning("Selecciona una versió per veure els fitxers.")
         # Área de texto para edición
         new_text = st.text_area(f"Contingut de {tipus_ad_seleccio}", value=text_content, height=500, key=f"editor_{seleccio}_{subcarpeta_seleccio}_{ad_filename}")
-        # Controles de reproducción de narración (selector de voz eliminado)
-        if st.button("▶️ Reproduir narració", use_container_width=True, disabled=not new_text.strip(), key="play_button_editor"):
-            with st.spinner("Generant àudio..."):
-                # Lógica de TTS con el texto del área
-                pass # Implementación de la llamada a la API TTS
         # Botón de guardado
         if st.button("Desar canvis", use_container_width=True, type="primary"):
             if ad_path:
                 try:
-                    ad_path.write_text(new_text, encoding="utf-8")
                     st.success(f"Fitxer **{ad_filename}** desat correctament.")
-                    st.rerun()
                 except Exception as e:
                     st.error(f"No s'ha pogut desar el fitxer: {e}")
             else:

 import streamlit as st
 from moviepy.editor import VideoFileClip
+import sys
 from database import set_db_path, init_schema, get_user, create_video, update_video_status, list_videos, get_video, get_all_users, upsert_result, get_results, add_feedback, get_feedback_for_video, get_feedback_stats
 from api_client import APIClient
 from utils import ensure_dirs, save_bytes, save_text, human_size
+# Añadir la carpeta de scripts al path para poder importar el cliente
+sys.path.append(str(Path(__file__).parent / "scripts"))
+from client_generate_av import generate_free_ad_mp3, generate_une_ad_video
 # -- Move DB ---
 os.environ["STREAMLIT_DATA_DIRECTORY"] = "/tmp/.streamlit"
             st.session_state.user = None
             st.rerun()
     if st.session_state.user:
+        page = st.radio("Navegació", ["Analitzar audio-descripcions","Processar vídeo nou","Estadístiques"], index=0)
     else:
         page = None
             if st.session_state.characters_saved:
                 st.button("Generar Audiodescripció")
+elif page == "Analitzar audio-descripcions":
     require_login()
+    st.header("Analitzar audio-descripcions")
     base_dir = Path("/tmp/data/videos")
     if not base_dir.exists():
         c1, c2 = st.columns(2)
         with c1:
             if st.button("Reconstruir àudio amb narració lliure", use_container_width=True, key="rebuild_free_ad"):
+                if seleccio and subcarpeta_seleccio:
+                    with st.spinner("Generant àudio de la narració lliure..."):
+                        result = generate_free_ad_mp3(seleccio, subcarpeta_seleccio, api)
+                        if result.get("status") == "success":
+                            st.success(f"Àudio generat amb èxit: {result.get('path')}")
+                        else:
+                            st.error(f"Error: {result.get('reason', 'Desconegut')}")
+                else:
+                    st.warning("Selecciona un vídeo i una versió.")
         with c2:
             if st.button("Reconstruir vídeo amb audiodescripció", use_container_width=True, key="rebuild_video_ad"):
+                if seleccio and subcarpeta_seleccio:
+                    with st.spinner("Reconstruint el vídeo... Aquesta operació pot trigar."):
+                        result = generate_une_ad_video(seleccio, subcarpeta_seleccio, api)
+                        if result.get("status") == "success":
+                            st.success(f"Vídeo generat amb èxit: {result.get('path')}")
+                            st.info("Pots visualitzar-lo activant la casella 'Afegir audiodescripció'.")
+                        else:
+                            st.error(f"Error: {result.get('reason', 'Desconegut')}")
+                else:
+                    st.warning("Selecciona un vídeo i una versió.")
     # --- Columna Derecha (Editor de texto y guardado) ---
             else:
                 st.info(f"No s'ha trobat el fitxer **{ad_filename}**.")
         else:
+            # Eliminada la nota de advertencia
+            pass
         # Área de texto para edición
         new_text = st.text_area(f"Contingut de {tipus_ad_seleccio}", value=text_content, height=500, key=f"editor_{seleccio}_{subcarpeta_seleccio}_{ad_filename}")
+        # Controles de reproducción de narración
+        free_ad_mp3_path = vid_dir / subcarpeta_seleccio / "free_ad.mp3" if seleccio and subcarpeta_seleccio else None
+        can_play_free_ad = free_ad_mp3_path is not None and free_ad_mp3_path.exists()
+        if st.button("▶️ Reproduir narració lliure", use_container_width=True, disabled=not can_play_free_ad, key="play_button_editor"):
+            if can_play_free_ad:
+                st.audio(str(free_ad_mp3_path), format="audio/mp3")
+            else:
+                st.warning("No s'ha trobat el fitxer 'free_ad.mp3'. Reconstrueix l'àudio primer.")
         # Botón de guardado
         if st.button("Desar canvis", use_container_width=True, type="primary"):
             if ad_path:
                 try:
+                    save_text(ad_path, new_text)
                     st.success(f"Fitxer **{ad_filename}** desat correctament.")
+                    # Forzar la recarga del contenido en el text_area
+                    st.session_state[f"editor_{seleccio}_{subcarpeta_seleccio}_{ad_filename}"] = new_text
+                    st.rerun() # Opcional, si quieres recargar toda la UI
                 except Exception as e:
                     st.error(f"No s'ha pogut desar el fitxer: {e}")
             else:

utils.py CHANGED Viewed

@@ -5,6 +5,11 @@ import subprocess
 from pathlib import Path
 from dataclasses import dataclass
 import shlex # Para manejar argumentos de línea de comandos de forma segura
 def incrustar_subtitulos_ffmpeg(
@@ -152,6 +157,142 @@ def recortar_video(input_path: str, output_path: str, duracion_segundos: int = 2
     subprocess.run(cmd, check=True)
 #----------------------------
 if __name__ == "__main__":

 from pathlib import Path
 from dataclasses import dataclass
 import shlex # Para manejar argumentos de línea de comandos de forma segura
+from __future__ import annotations
+from dataclasses import dataclass
+from typing import List, Optional, Callable
+import re
+import xml.etree.ElementTree as ET
 def incrustar_subtitulos_ffmpeg(
     subprocess.run(cmd, check=True)
# ---- Core: SRT -> ESF (XML string) ----

# One SRT timing line, e.g. "00:00:01,000 --> 00:00:02,500".  Both "," and "."
# are accepted as the millisecond separator.
TIME_RE = re.compile(
    r"(?P<start>\d{2}:\d{2}:\d{2}[,\.]\d{3})\s*-->\s*(?P<end>\d{2}:\d{2}:\d{2}[,\.]\d{3})"
)


@dataclass
class Cue:
    """A single cue (timed text entry) parsed from an SRT document."""

    index: int  # 1-based position of the cue in the parsed document
    start: str  # "HH:MM:SS.mmm"
    end: str    # "HH:MM:SS.mmm"
    text: str   # cue body; multi-line text is joined with "\n"


def _norm_ts(ts: str) -> str:
    """Convert '01:02:03,456' into '01:02:03.456'."""
    return ts.replace(",", ".")


def _parse_srt(srt_text: str) -> List[Cue]:
    """Parse SRT text into a list of normalized cues.

    Blocks are separated by blank lines. Each block may start with a numeric
    index line; the timing line is searched for in the first three lines that
    follow it (or in the first three lines of the block when there is no
    index). Everything after the timing line is the cue text.

    The indices found in the file are not preserved: cues are numbered
    1..N in the order they appear.

    Args:
        srt_text: Full content of the .srt file.

    Returns:
        The parsed cues, with timestamps using "." as millisecond separator.

    Raises:
        ValueError: If a block contains no valid timing line.
    """
    normalized = srt_text.replace("\r\n", "\n").replace("\r", "\n")
    # str.strip() does not treat the BOM as whitespace, so remove it explicitly;
    # otherwise it would stay glued to the first index line.
    normalized = normalized.lstrip("\ufeff")
    blocks = [b.strip() for b in re.split(r"\n\s*\n", normalized) if b.strip()]

    cues: List[Cue] = []
    for block in blocks:
        lines = block.split("\n")
        first = lines[0].strip()
        # isdecimal() rather than isdigit(): isdigit() also accepts characters
        # such as "²" that int() rejects, which would crash on the conversion.
        if first.isdecimal():
            idx = int(first)  # only used to label the error message below
            time_candidates = lines[1:]
        else:
            idx = len(cues) + 1
            time_candidates = lines

        match = None
        time_line_idx = 0
        # Tolerate a couple of stray lines before the timing line.
        for i, line in enumerate(time_candidates[:3]):
            match = TIME_RE.search(line)
            if match:
                time_line_idx = i
                break
        if match is None:
            raise ValueError(f"Bloque SRT sin tiempos válidos (índice {idx}):\n{block}")

        text = "\n".join(time_candidates[time_line_idx + 1:]).strip()
        cues.append(
            Cue(
                # Positional numbering: indices in the file may be missing,
                # repeated or out of order.
                index=len(cues) + 1,
                start=_norm_ts(match.group("start")),
                end=_norm_ts(match.group("end")),
                text=text,
            )
        )
    return cues
def _build_esf_tree(
    cues: List["Cue"],
    language: str = "es",
    voice_db: float = -6.0,
    original_db: float = -3.0,
    audio_lookup: Optional[Callable[[int], Optional[str]]] = None,
) -> ET.ElementTree:
    """Build the ESF XML tree for a list of cues.

    The tree has an ``esef`` root (version "1.0") with a ``header`` holding the
    language and the mix levels, and an ``ad`` element holding one ``cue``
    child per input cue (``in``/``out`` attributes, cue text as content).

    Args:
        cues: Cues to serialize, in output order.
        language: Value written to ``header/language``.
        voice_db: Level written to ``header/mix/voice`` as "<value>dB".
        original_db: Level written to ``header/mix/original`` as "<value>dB".
        audio_lookup: Optional function mapping a cue index to a file name
            (e.g. ``lambda i: f"{i:03d}.wav"``). A truthy result is stored in
            the cue's ``file`` attribute; a falsy one adds nothing.

    Returns:
        The assembled element tree.
    """
    esef = ET.Element("esef", {"version": "1.0"})

    header = ET.SubElement(esef, "header")
    language_el = ET.SubElement(header, "language")
    language_el.text = language
    mix = ET.SubElement(header, "mix")
    for tag, level in (("voice", voice_db), ("original", original_db)):
        ET.SubElement(mix, tag, {"level": f"{level}dB"})

    ad = ET.SubElement(esef, "ad")
    for cue in cues:
        cue_attrs = {"in": cue.start, "out": cue.end}
        audio_file = audio_lookup(cue.index) if audio_lookup else None
        if audio_file:
            cue_attrs["file"] = audio_file
        ET.SubElement(ad, "cue", cue_attrs).text = cue.text

    return ET.ElementTree(esef)
def _xml_pretty_string(tree: ET.ElementTree) -> str:
    """Serialize *tree* as indented XML with an XML declaration.

    Indentation (two spaces per level) is written into the ``text``/``tail``
    of the tree's own elements, so the tree passed in is modified in place.
    Only whitespace-only or missing ``text``/``tail`` values are overwritten;
    real text content is left untouched.
    """

    def _is_blank(value):
        return not value or not value.strip()

    def _indent(node, depth=0):
        pad = "\n" + "  " * depth
        children = list(node)
        if children:
            # Open the node onto a new line, one level deeper.
            if _is_blank(node.text):
                node.text = pad + "  "
            for child in children:
                _indent(child, depth + 1)
            # The last child dedents back to the parent's level so that the
            # parent's closing tag lines up with its opening tag.
            last_child = children[-1]
            if _is_blank(last_child.tail):
                last_child.tail = pad
        if depth and _is_blank(node.tail):
            node.tail = pad

    root = tree.getroot()
    _indent(root)
    raw = ET.tostring(root, encoding="utf-8", xml_declaration=True)
    return raw.decode("utf-8")
def srt_to_esf(
    srt_text: str,
    *,
    language: str = "es",
    voice_db: float = -6.0,
    original_db: float = -3.0,
    audio_lookup: Optional[Callable[[int], Optional[str]]] = None,
) -> str:
    """Convert SRT text into an ESF (XML) document returned as a string.

    Args:
        srt_text: Content of the .srt file.
        language: Language code written to the ESF header (default 'es').
        voice_db: Level of the audio-description voice, in dB.
        original_db: Level of the original audio, in dB.
        audio_lookup: Optional index -> filename function used to attach a
            recorded narration file to each cue.

    Returns:
        The ESF document as an indented XML string.
    """
    # Parse, build the tree, then serialize.
    esf_options = {
        "language": language,
        "voice_db": voice_db,
        "original_db": original_db,
        "audio_lookup": audio_lookup,
    }
    parsed_cues = _parse_srt(srt_text)
    esf_tree = _build_esf_tree(parsed_cues, **esf_options)
    return _xml_pretty_string(esf_tree)
 #----------------------------
 if __name__ == "__main__":

videos/curtmetratge_4/MoE/une_ad.srt CHANGED Viewed

@@ -1,26 +1,26 @@
 1
-00:00:00,000 --> 00:00:10,480
-(AD): "Neus es troba en un sofà, amb la llum apagada, concentrada en la pantalla del seu telèfon mòbil, reflexionant."
 2
-00:00:10,480 --> 00:00:11,134
-(AD): ""
 3
 00:00:11,134 --> 00:00:12,044
 [Sento]: bon dia neus
-4
 00:00:12,044 --> 00:00:12,653
 [Neus]: bon dia gràcies
-5
-00:00:12,653 --> 00:00:15,919
-(AD): "Neus, amb una samarreta, llegeix un diari."
 6
-00:00:15,919 --> 00:00:16,568
-(AD): ""
 7
 00:00:16,568 --> 00:00:18,777

 1
+00:00:00,000 --> 00:00:01,020
+(AD): "Títol: No puc."
 2
+00:00:01,020 --> 00:00:04,121
+(AD): "Títol: No puc."
 3
+00:00:04,121 --> 00:00:11,134
+(AD): "Neus es troba en un sofà, amb la llum apagada, concentrada en la pantalla del seu telèfon mòbil, reflexionant."
+4
 00:00:11,134 --> 00:00:12,044
 [Sento]: bon dia neus
+5
 00:00:12,044 --> 00:00:12,653
 [Neus]: bon dia gràcies
 6
+00:00:12,653 --> 00:00:16,568
+(AD): "Neus, amb una samarreta, llegeix un diari."
 7
 00:00:16,568 --> 00:00:18,777

videos/curtmetratge_4/Salamandra/une_ad.srt CHANGED Viewed

@@ -1,10 +1,10 @@
 1
-00:00:00,000 --> 00:00:10,480
-(AD): Una dona amb el llum apagat, asseguda en un sofà, mirant el seu telèfon.
 2
-00:00:10,480 --> 00:00:11,134
-(AD): Una noia amb una samarreta de l'americana està llegint un diari en un restaurant.
 3
 00:00:11,134 --> 00:00:12,044

 1
+00:00:01,000 --> 00:00:03,000
+(AD): "No puc."
 2
+00:00:03,000 --> 00:00:11,134
+(AD): "Una dona amb el llum apagat, asseguda en un sofà, mirant el seu telèfon."
 3
 00:00:11,134 --> 00:00:12,044