Aduc-sdr-2_5

Paused

App Files Community

carlex3321 committed on Sep 29

Commit

0834a4b

verified ·

1 Parent(s): b11811b

Upload 6 files

Browse files

Files changed (4) hide show

Dockerfile +12 -0
app_vince.py +110 -40
builder.sh +74 -54
start.sh +63 -31

Dockerfile CHANGED Viewed

@@ -130,6 +130,18 @@ RUN useradd -m -u 1000 -s /bin/bash appuser && \
 USER appuser
 RUN df -h
 # Mostra uso de disco por volume (procure /app ou o filesystem raiz).

 USER appuser
+# Declara volume persistente para HF Spaces
+VOLUME /data
+# Env vars para caches em /data
+ENV HF_HOME=/data/.cache/huggingface
+ENV TORCH_HOME=/data/.cache/torch
+ENV HF_DATASETS_CACHE=/data/.cache/datasets
+ENV TRANSFORMERS_CACHE=/data/.cache/transformers
+ENV DIFFUSERS_CACHE=/data/.cache/diffusers
 RUN df -h
 # Mostra uso de disco por volume (procure /app ou o filesystem raiz).

app_vince.py CHANGED Viewed

@@ -3,11 +3,24 @@ import os
 from pathlib import Path
 from typing import List, Tuple, Optional
 import gradio as gr
 from services.vincie import VincieService
 svc = VincieService()
-DEFAULT_NEGATIVE_PROMPT = "Worst quality, Normal quality, Low quality, Low res, Blurry, Jpeg artifacts, Grainy, text, logo, watermark, banner, extra digits, signature, subtitling, Bad anatomy, Bad proportions, Deformed, Disconnected limbs, Disfigured, Extra arms, Extra limbs, Extra hands, Fused fingers, Gross proportions, Long neck, Malformed limbs, Mutated, Mutated hands, Mutated limbs, Missing arms, Missing fingers, Poorly drawn hands, Poorly drawn face, Nsfw, Uncensored, Cleavage, Nude, Nipples, Overexposed, Plain background, Grainy, Underexposed, Deformed structures"
 def setup_auto() -> str:
     try:
@@ -21,9 +34,18 @@ def setup_auto() -> str:
 def _list_media(out_dir: Path, max_images: int = 24) -> Tuple[List[str], Optional[str]]:
     img_globs = ("*.png", "*.jpg", "*.jpeg", "*.webp")
-    images = sorted([p for pat in img_globs for p in out_dir.rglob(pat)], key=lambda p: p.stat().st_mtime)
     image_paths = [str(p) for p in images[-max_images:]]
-    videos = sorted(out_dir.rglob("*.mp4"), key=lambda p: p.stat().st_mtime)
     video_path = str(videos[-1]) if videos else None
     return image_paths, video_path
@@ -34,7 +56,18 @@ def ui_multi_turn(input_image, turns_text, negative_prompt, seed, steps, cfg_sca
         return [], None, "Por favor, forneça as instruções de edição (uma por linha)."
     turns = [ln.strip() for ln in turns_text.splitlines() if ln.strip()]
     try:
-        out_dir = svc.multi_turn_edit(input_image, turns, negative_prompt=negative_prompt, seed=int(seed), steps=int(steps), cfg_scale=float(cfg_scale), resolution=int(resolution), use_vae_slicing=use_vae_slicing, num_gpus=int(num_gpus), batch_size=int(batch_size))
         imgs, vid = _list_media(Path(out_dir))
         return imgs, vid, f"Saídas salvas em: {out_dir}"
     except Exception as e:
@@ -48,7 +81,19 @@ def ui_text_to_video(input_image, prompt, negative_prompt, seed, steps, cfg_scal
     if not prompt or not prompt.strip():
         return None, "Por favor, forneça um prompt para o vídeo."
     try:
-        out_dir = svc.text_to_video(input_image, prompt, negative_prompt=negative_prompt, seed=int(seed), steps=int(steps), cfg_scale=float(cfg_scale), resolution=int(resolution), fps=int(fps), use_vae_slicing=use_vae_slicing, num_gpus=int(num_gpus), batch_size=int(batch_size))
         _, vid = _list_media(Path(out_dir))
         return vid, f"Vídeo salvo em: {out_dir}"
     except Exception as e:
@@ -57,11 +102,15 @@ def ui_text_to_video(input_image, prompt, negative_prompt, seed, steps, cfg_scal
         return None, f"Erro na geração: {e}"
 def ui_multi_concept(files, descs_text, final_prompt):
-    if not files: return [], None, "Por favor, faça o upload das imagens de conceito."
-    if not descs_text: return [], None, "Por favor, forneça as descrições (uma por linha)."
-    if not final_prompt: return [], None, "Por favor, forneça um prompt final."
     descs = [ln.strip() for ln in descs_text.splitlines() if ln.strip()]
-    if len(descs) != len(files): return [], None, f"O número de descrições ({len(descs)}) deve ser igual ao de imagens ({len(files)})."
     try:
         out_dir = svc.multi_concept_compose(files, descs, final_prompt)
         imgs, vid = _list_media(Path(out_dir))
@@ -73,62 +122,83 @@ def ui_multi_concept(files, descs_text, final_prompt):
 with gr.Blocks(title="VINCIE Service", theme=gr.themes.Soft()) as demo:
     gr.Markdown("# VINCIE Service — Geração Distribuída com Controles Avançados")
-    gr.Markdown("- **Interface por:** Carlex ([email protected] | GitHub: carlex22)")
     with gr.Row():
         setup_out = gr.Textbox(label="Status da Configuração", interactive=False)
     with gr.Tab("Edição Multi-Turno"):
         with gr.Row():
             img_mt = gr.Image(type="filepath", label="Imagem de Entrada")
             with gr.Column():
-                turns_mt = gr.Textbox(lines=5, label="Instruções de Edição (uma por linha)", placeholder="Ex: adicione um chapéu azul\nagora, mude o fundo para uma praia")
-                with gr.Accordion("Configurações Avançadas e de Desempenho", open=True):
-                    with gr.Row():
-                        num_gpus_mt = gr.Slider(label="Número de GPUs", minimum=1, maximum=8, step=1, value=8, info="Use >1 para acelerar a geração com torchrun.")
-                        batch_size_mt = gr.Number(label="Batch Size por GPU", value=1, precision=0, info="Para Multi-GPU, o lote total será (GPUs x Batch Size).")
-                    resolution_mt = gr.Slider(label="Resolução", minimum=256, maximum=1024, step=128, value=512, info="Maior resolução exige mais VRAM e tempo.")
-                    use_vae_slicing_mt = gr.Checkbox(label="Usar VAE Slicing (Economiza VRAM)", value=True)
-                    neg_prompt_mt = gr.Textbox(lines=3, label="Prompt Negativo", value=DEFAULT_NEGATIVE_PROMPT)
-                    seed_mt = gr.Number(label="Seed (Semente)", value=1, precision=0)
-                    steps_mt = gr.Slider(label="Passos de Inferência", minimum=10, maximum=100, step=1, value=50, info="Menos passos = mais rápido.")
-                    cfg_mt = gr.Slider(label="Escala de Orientação (CFG)", minimum=1.0, maximum=20.0, step=0.5, value=7.5, info="Quão forte o modelo segue o prompt.")
-                run_mt = gr.Button("Executar Edição Multi-Turno", variant="primary")
         gallery_mt = gr.Gallery(label="Imagens Geradas", columns=4, height="auto")
         video_mt = gr.Video(label="Vídeo da Sequência (se disponível)")
         status_mt = gr.Textbox(label="Status da Saída", interactive=False)
-        run_mt.click(ui_multi_turn, inputs=[img_mt, turns_mt, neg_prompt_mt, seed_mt, steps_mt, cfg_mt, resolution_mt, use_vae_slicing_mt, num_gpus_mt, batch_size_mt], outputs=[gallery_mt, video_mt, status_mt])
     with gr.Tab("Texto-para-Vídeo"):
         with gr.Row():
             img_vid = gr.Image(type="filepath", label="Frame Inicial")
             with gr.Column():
                 prompt_vid = gr.Textbox(lines=2, label="Prompt do Vídeo", placeholder="Ex: um gato andando pela sala")
-                with gr.Accordion("Configurações Avançadas e de Desempenho", open=True):
-                    with gr.Row():
-                        num_gpus_vid = gr.Slider(label="Número de GPUs", minimum=1, maximum=8, step=1, value=8, info="Use >1 para acelerar a geração com torchrun.")
-                        batch_size_vid = gr.Number(label="Batch Size por GPU", value=1, precision=0, info="Para Multi-GPU, o lote total será (GPUs x Batch Size).")
-                    resolution_vid = gr.Slider(label="Resolução", minimum=256, maximum=1024, step=128, value=512)
-                    fps_vid = gr.Slider(label="Frames por Segundo (FPS)", minimum=1, maximum=24, step=1, value=2)
-                    use_vae_slicing_vid = gr.Checkbox(label="Usar VAE Slicing (Economiza VRAM)", value=True)
-                    neg_prompt_vid = gr.Textbox(lines=3, label="Prompt Negativo", value=DEFAULT_NEGATIVE_PROMPT)
-                    seed_vid = gr.Number(label="Seed (Semente)", value=1, precision=0)
-                    steps_vid = gr.Slider(label="Passos de Inferência", minimum=10, maximum=100, step=1, value=50)
-                    cfg_vid = gr.Slider(label="Escala de Orientação (CFG)", minimum=1.0, maximum=20.0, step=0.5, value=7.5)
-                run_vid = gr.Button("Gerar Vídeo", variant="primary")
         video_vid = gr.Video(label="Vídeo Gerado")
         status_vid = gr.Textbox(label="Status da Saída", interactive=False)
-        run_vid.click(ui_text_to_video, inputs=[img_vid, prompt_vid, neg_prompt_vid, seed_vid, steps_vid, cfg_vid, resolution_vid, fps_vid, use_vae_slicing_vid, num_gpus_vid, batch_size_vid], outputs=[video_vid, status_vid])
     with gr.Tab("Composição Multi-Conceito"):
         gr.Markdown("Nota: A composição multi-conceito está atualmente configurada para rodar em uma única GPU para garantir estabilidade.")
         with gr.Row():
             with gr.Column(scale=1):
                 files_mc = gr.File(file_count="multiple", type="filepath", label="1. Imagens de Conceito")
             with gr.Column(scale=2):
-                descs_mc = gr.Textbox(lines=5, label="2. Descrições (uma por linha, na mesma ordem)", placeholder="Ex: : uma foto de um pai\n: uma foto de uma mãe...")
-                final_prompt_mc = gr.Textbox(lines=3, label="3. Prompt Final de Composição", placeholder="Ex: Baseado em , ..., uma família sorrindo em um retrato...")
-            run_mc = gr.Button("Executar Composição", variant="primary")
         gallery_mc = gr.Gallery(label="Imagens Geradas", columns=4, height="auto")
         video_mc = gr.Video(label="Vídeo da Sequência (se disponível)")
         status_mc = gr.Textbox(label="Status da Saída", interactive=False)
-        run_mc.click(ui_multi_concept, inputs=[files_mc, descs_mc, final_prompt_mc], outputs=[gallery_mc, video_mc, status_mc])
     demo.load(fn=setup_auto, outputs=setup_out)
 if __name__ == "__main__":

 from pathlib import Path
 from typing import List, Tuple, Optional
 import gradio as gr
+# Importa o serviço
 from services.vincie import VincieService
+# Instancia e normaliza caminhos (defensivo contra imports alternativos)
 svc = VincieService()
+svc.repo_dir = Path(svc.repo_dir)
+svc.ckpt_dir = Path(svc.ckpt_dir)
+DEFAULT_NEGATIVE_PROMPT = (
+    "Worst quality, Normal quality, Low quality, Low res, Blurry, Jpeg artifacts, Grainy, "
+    "text, logo, watermark, banner, extra digits, signature, subtitling, Bad anatomy, "
+    "Bad proportions, Deformed, Disconnected limbs, Disfigured, Extra arms, Extra limbs, "
+    "Extra hands, Fused fingers, Gross proportions, Long neck, Malformed limbs, Mutated, "
+    "Mutated hands, Mutated limbs, Missing arms, Missing fingers, Poorly drawn hands, "
+    "Poorly drawn face, Nsfw, Uncensored, Cleavage, Nude, Nipples, Overexposed, "
+    "Plain background, Grainy, Underexposed, Deformed structures"
+)
 def setup_auto() -> str:
     try:
 def _list_media(out_dir: Path, max_images: int = 24) -> Tuple[List[str], Optional[str]]:
     img_globs = ("*.png", "*.jpg", "*.jpeg", "*.webp")
+    try:
+        images = sorted(
+            [p for pat in img_globs for p in out_dir.rglob(pat)],
+            key=lambda p: p.stat().st_mtime
+        )
+    except FileNotFoundError:
+        images = []
     image_paths = [str(p) for p in images[-max_images:]]
+    try:
+        videos = sorted(out_dir.rglob("*.mp4"), key=lambda p: p.stat().st_mtime)
+    except FileNotFoundError:
+        videos = []
     video_path = str(videos[-1]) if videos else None
     return image_paths, video_path
         return [], None, "Por favor, forneça as instruções de edição (uma por linha)."
     turns = [ln.strip() for ln in turns_text.splitlines() if ln.strip()]
     try:
+        out_dir = svc.multi_turn_edit(
+            input_image,
+            turns,
+            negative_prompt=negative_prompt,
+            seed=int(seed),
+            steps=int(steps),
+            cfg_scale=float(cfg_scale),
+            resolution=int(resolution),
+            use_vae_slicing=use_vae_slicing,
+            num_gpus=int(num_gpus),
+            batch_size=int(batch_size),
+        )
         imgs, vid = _list_media(Path(out_dir))
         return imgs, vid, f"Saídas salvas em: {out_dir}"
     except Exception as e:
     if not prompt or not prompt.strip():
         return None, "Por favor, forneça um prompt para o vídeo."
     try:
+        out_dir = svc.text_to_video(
+            input_image,
+            prompt,
+            negative_prompt=negative_prompt,
+            seed=int(seed),
+            steps=int(steps),
+            cfg_scale=float(cfg_scale),
+            resolution=int(resolution),
+            fps=int(fps),
+            use_vae_slicing=use_vae_slicing,
+            num_gpus=int(num_gpus),
+            batch_size=int(batch_size),
+        )
         _, vid = _list_media(Path(out_dir))
         return vid, f"Vídeo salvo em: {out_dir}"
     except Exception as e:
         return None, f"Erro na geração: {e}"
 def ui_multi_concept(files, descs_text, final_prompt):
+    if not files:
+        return [], None, "Por favor, faça o upload das imagens de conceito."
+    if not descs_text:
+        return [], None, "Por favor, forneça as descrições (uma por linha)."
+    if not final_prompt:
+        return [], None, "Por favor, forneça um prompt final."
     descs = [ln.strip() for ln in descs_text.splitlines() if ln.strip()]
+    if len(descs) != len(files):
+        return [], None, f"O número de descrições ({len(descs)}) deve ser igual ao de imagens ({len(files)})."
     try:
         out_dir = svc.multi_concept_compose(files, descs, final_prompt)
         imgs, vid = _list_media(Path(out_dir))
 with gr.Blocks(title="VINCIE Service", theme=gr.themes.Soft()) as demo:
     gr.Markdown("# VINCIE Service — Geração Distribuída com Controles Avançados")
+    gr.Markdown("- Interface por: Carlex ([email protected] | GitHub: carlex22)")
     with gr.Row():
         setup_out = gr.Textbox(label="Status da Configuração", interactive=False)
     with gr.Tab("Edição Multi-Turno"):
         with gr.Row():
             img_mt = gr.Image(type="filepath", label="Imagem de Entrada")
             with gr.Column():
+                turns_mt = gr.Textbox(
+                    lines=5,
+                    label="Instruções de Edição (uma por linha)",
+                    placeholder="Ex: adicione um chapéu azul\nagora, mude o fundo para uma praia"
+                )
+        with gr.Accordion("Configurações Avançadas e de Desempenho", open=True):
+            with gr.Row():
+                num_gpus_mt = gr.Slider(label="Número de GPUs", minimum=1, maximum=8, step=1, value=8, info="Use >1 para acelerar a geração com torchrun.")
+                batch_size_mt = gr.Number(label="Batch Size por GPU", value=1, precision=0, info="Para Multi-GPU, o lote total será (GPUs x Batch Size).")
+                resolution_mt = gr.Slider(label="Resolução", minimum=256, maximum=1024, step=128, value=512, info="Maior resolução exige mais VRAM e tempo.")
+                use_vae_slicing_mt = gr.Checkbox(label="Usar VAE Slicing (Economiza VRAM)", value=True)
+                neg_prompt_mt = gr.Textbox(lines=3, label="Prompt Negativo", value=DEFAULT_NEGATIVE_PROMPT)
+                seed_mt = gr.Number(label="Seed (Semente)", value=1, precision=0)
+                steps_mt = gr.Slider(label="Passos de Inferência", minimum=10, maximum=100, step=1, value=50, info="Menos passos = mais rápido.")
+                cfg_mt = gr.Slider(label="Escala de Orientação (CFG)", minimum=1.0, maximum=20.0, step=0.5, value=7.5, info="Quão forte o modelo segue o prompt.")
+            run_mt = gr.Button("Executar Edição Multi-Turno", variant="primary")
         gallery_mt = gr.Gallery(label="Imagens Geradas", columns=4, height="auto")
         video_mt = gr.Video(label="Vídeo da Sequência (se disponível)")
         status_mt = gr.Textbox(label="Status da Saída", interactive=False)
+        run_mt.click(
+            ui_multi_turn,
+            inputs=[img_mt, turns_mt, neg_prompt_mt, seed_mt, steps_mt, cfg_mt, resolution_mt, use_vae_slicing_mt, num_gpus_mt, batch_size_mt],
+            outputs=[gallery_mt, video_mt, status_mt]
+        )
     with gr.Tab("Texto-para-Vídeo"):
         with gr.Row():
             img_vid = gr.Image(type="filepath", label="Frame Inicial")
             with gr.Column():
                 prompt_vid = gr.Textbox(lines=2, label="Prompt do Vídeo", placeholder="Ex: um gato andando pela sala")
+        with gr.Accordion("Configurações Avançadas e de Desempenho", open=True):
+            with gr.Row():
+                num_gpus_vid = gr.Slider(label="Número de GPUs", minimum=1, maximum=8, step=1, value=8, info="Use >1 para acelerar a geração com torchrun.")
+                batch_size_vid = gr.Number(label="Batch Size por GPU", value=1, precision=0, info="Para Multi-GPU, o lote total será (GPUs x Batch Size).")
+                resolution_vid = gr.Slider(label="Resolução", minimum=256, maximum=1024, step=128, value=512)
+                fps_vid = gr.Slider(label="Frames por Segundo (FPS)", minimum=1, maximum=24, step=1, value=2)
+                use_vae_slicing_vid = gr.Checkbox(label="Usar VAE Slicing (Economiza VRAM)", value=True)
+                neg_prompt_vid = gr.Textbox(lines=3, label="Prompt Negativo", value=DEFAULT_NEGATIVE_PROMPT)
+                seed_vid = gr.Number(label="Seed (Semente)", value=1, precision=0)
+                steps_vid = gr.Slider(label="Passos de Inferência", minimum=10, maximum=100, step=1, value=50)
+                cfg_vid = gr.Slider(label="Escala de Orientação (CFG)", minimum=1.0, maximum=20.0, step=0.5, value=7.5)
+            run_vid = gr.Button("Gerar Vídeo", variant="primary")
         video_vid = gr.Video(label="Vídeo Gerado")
         status_vid = gr.Textbox(label="Status da Saída", interactive=False)
+        run_vid.click(
+            ui_text_to_video,
+            inputs=[img_vid, prompt_vid, neg_prompt_vid, seed_vid, steps_vid, cfg_vid, resolution_vid, fps_vid, use_vae_slicing_vid, num_gpus_vid, batch_size_vid],
+            outputs=[video_vid, status_vid]
+        )
     with gr.Tab("Composição Multi-Conceito"):
         gr.Markdown("Nota: A composição multi-conceito está atualmente configurada para rodar em uma única GPU para garantir estabilidade.")
         with gr.Row():
             with gr.Column(scale=1):
                 files_mc = gr.File(file_count="multiple", type="filepath", label="1. Imagens de Conceito")
             with gr.Column(scale=2):
+                descs_mc = gr.Textbox(lines=5, label="2. Descrições (uma por linha, na mesma ordem)", placeholder="Ex: <ref1>: uma foto de um pai\n<ref2>: uma foto de uma mãe...")
+                final_prompt_mc = gr.Textbox(lines=3, label="3. Prompt Final de Composição", placeholder="Ex: Baseado em <ref1>, <ref2>, ..., uma família sorrindo em um retrato...")
+        run_mc = gr.Button("Executar Composição", variant="primary")
         gallery_mc = gr.Gallery(label="Imagens Geradas", columns=4, height="auto")
         video_mc = gr.Video(label="Vídeo da Sequência (se disponível)")
         status_mc = gr.Textbox(label="Status da Saída", interactive=False)
+        run_mc.click(
+            ui_multi_concept,
+            inputs=[files_mc, descs_mc, final_prompt_mc],
+            outputs=[gallery_mc, video_mc, status_mc]
+        )
     demo.load(fn=setup_auto, outputs=setup_out)
 if __name__ == "__main__":

builder.sh CHANGED Viewed

@@ -1,45 +1,62 @@
 #!/usr/bin/env bash
 set -euo pipefail
-echo "🚀 Builder (Apex + Q8) — roda em runtime com GPU visível"
-# ===== Config e diretórios =====
-export SELF_HF_REPO_ID="${SELF_HF_REPO_ID:-carlex3321/aduc-sdr}"   # Model repo no HF com wheels
-export HF_HOME="${HF_HOME:-/app/model_cache}"
 export HF_HUB_CACHE="${HF_HUB_CACHE:-$HF_HOME/hub}"
-export TORCH_HOME="${TORCH_HOME:-$HF_HOME/torch}"
 export HF_HUB_ENABLE_HF_TRANSFER="${HF_HUB_ENABLE_HF_TRANSFER:-1}"
-export PATH="$HOME/.local/bin:$PATH"
-mkdir -p /app/wheels /app/cuda_cache "$HF_HOME" "$TORCH_HOME" /app/wheels/src
 chmod -R 777 /app/wheels || true
 export CUDA_CACHE_PATH="/app/cuda_cache"
 if [ -f "/NGC-DL-CONTAINER-LICENSE" ]; then
   cp -f /NGC-DL-CONTAINER-LICENSE /app/wheels/NGC-DL-CONTAINER-LICENSE || true
 fi
-# ===== Dependências mínimas =====
 python -m pip install -v -U pip build setuptools wheel hatchling hatch-vcs scikit-build-core cmake ninja packaging "huggingface_hub[hf_transfer]" || true
 # ===== Tags de ambiente (Python/CUDA/Torch) =====
 PY_TAG="$(python -c 'import sys; print(f"cp{sys.version_info[0]}{sys.version_info[1]}")' 2>/dev/null || echo cp310)"
 TORCH_VER="$(python - <<'PY'
 try:
-    import torch, re
-    v = torch.__version__
-    print(re.sub(r'\+.*$', '', v))
 except Exception:
-    print("unknown")
 PY
 )"
 CU_TAG="$(python - <<'PY'
 try:
-    import torch
-    cu = getattr(torch.version, "cuda", None)
-    print("cu"+cu.replace(".","")) if cu else print("")
 except Exception:
-    print("")
 PY
 )"
 echo "[env] PY_TAG=${PY_TAG} TORCH_VER=${TORCH_VER} CU_TAG=${CU_TAG}"
@@ -48,11 +65,11 @@ echo "[env] PY_TAG=${PY_TAG} TORCH_VER=${TORCH_VER} CU_TAG=${CU_TAG}"
 check_apex() {
 python - <<'PY'
 try:
-    from apex.normalization import FusedLayerNorm, FusedRMSNorm
-    import importlib; importlib.import_module("fused_layer_norm_cuda")
-    ok = True
 except Exception:
-    ok = False
 raise SystemExit(0 if ok else 1)
 PY
 }
@@ -65,10 +82,10 @@ raise SystemExit(0 if spec else 1)
 PY
 }
-# ===== Download do Hub =====
 install_from_hf () {
-  local PKG="$1"    # 'apex' ou 'q8_kernels'
-  echo "[hub] Verificando wheel de ${PKG} no repositório ${SELF_HF_REPO_ID}"
   python - "$PKG" "$PY_TAG" "$CU_TAG" <<'PY' || exit 0
 import os, sys
 from huggingface_hub import HfApi, hf_hub_download, HfFolder
@@ -76,16 +93,16 @@ from huggingface_hub import HfApi, hf_hub_download, HfFolder
 pkg, py_tag, cu_tag = sys.argv[1], sys.argv[2], sys.argv[3]
 repo = os.environ.get("SELF_HF_REPO_ID","carlex3321/aduc-sdr")
 api = HfApi(token=os.getenv("HF_TOKEN") or HfFolder.get_token())
 try:
-    files = api.list_repo_files(repo_id=repo, repo_type="model")
 except Exception:
-    raise SystemExit(0)
 cands = [f for f in files if f.endswith(".whl") and f.rsplit("/",1)[-1].startswith(pkg+"-") and py_tag in f]
-pref  = [f for f in cands if cu_tag and cu_tag in f] or cands
 if not pref:
-    raise SystemExit(0)
 target = sorted(pref, reverse=True)[0]
 print(target)
 path = hf_hub_download(repo_id=repo, filename=target, repo_type="model", local_dir="/app/wheels")
@@ -96,7 +113,7 @@ PY
 # ===== Builders =====
 build_apex () {
   local SRC="/app/wheels/src/apex"
-  echo "[build] Preparando fonte Apex em ${SRC}"
   if [ -d "$SRC/.git" ]; then
     git -C "$SRC" fetch --all -p || true
     git -C "$SRC" reset --hard HEAD || true
@@ -105,16 +122,18 @@ build_apex () {
     rm -rf "$SRC"
     git clone --depth 1 https://github.com/NVIDIA/apex "$SRC"
   fi
   echo "[build] Compilando Apex -> wheel"
   export APEX_CPP_EXT=1 APEX_CUDA_EXT=1 APEX_ALL_CONTRIB_EXT=0
-  python -m pip wheel --no-build-isolation --no-deps "$SRC" -w /app/wheels || true
   local W="$(ls -t /app/wheels/apex-*.whl 2>/dev/null | head -n1 || true)"
   if [ -n "${W}" ]; then
-    python -m pip install -U --no-deps "${W}" || true
-    echo "[build] Apex instalado da wheel recém-compilada: ${W}"
   else
-    echo "[build] Nenhuma wheel Apex gerada; instalando do source (pode falhar)"
-    python -m pip install --no-build-isolation "$SRC" || true
   fi
 }
@@ -126,25 +145,27 @@ build_q8 () {
   git clone --filter=blob:none "$Q8_REPO" "$SRC"
   git -C "$SRC" checkout "$Q8_COMMIT"
   git -C "$SRC" submodule update --init --recursive
   echo "[build] Compilando Q8 Kernels -> wheel"
-  python -m pip wheel --no-build-isolation "$SRC" -w /app/wheels || true
   local W="$(ls -t /app/wheels/q8_kernels-*.whl 2>/dev/null | head -n1 || true)"
   if [ -n "${W}" ]; then
-    python -m pip install -U --no-deps "${W}" || true
-    echo "[build] Q8 instalado da wheel recém-compilada: ${W}"
   else
-    echo "[build] Nenhuma wheel q8_kernels gerada; instalando do source (pode falhar)"
-    python -m pip install --no-build-isolation "$SRC" || true
   fi
 }
 # ===== Pipeline genérico =====
 ensure_pkg () {
-  local PKG="$1"      # apex | q8_kernels
-  local CHECK_FN="$2" # check_apex | check_q8
-  local BUILD_FN="$3" # build_apex | build_q8
   echo "[flow] === ${PKG} ==="
   if ${CHECK_FN}; then
     echo "[flow] ${PKG}: já instalado (import OK)"
     return 0
@@ -155,7 +176,7 @@ ensure_pkg () {
   if [ -n "${HF_OUT:-}" ]; then
     WHEEL_PATH="$(printf "%s\n" "${HF_OUT}" | tail -n1)"
     echo "[hub] Baixado: ${WHEEL_PATH}"
-    python -m pip install -U --no-build-isolation "${WHEEL_PATH}" || true
     if ${CHECK_FN}; then
       echo "[flow] ${PKG}: sucesso via Hub (${WHEEL_PATH})"
       return 0
@@ -173,7 +194,7 @@ ensure_pkg () {
     return 0
   fi
-  echo "[flow] ${PKG}: falhou após build; registrando logs e seguindo"
   return 1
 }
@@ -181,25 +202,24 @@ ensure_pkg () {
 ensure_pkg "apex" check_apex build_apex || true
 ensure_pkg "q8_kernels" check_q8 build_q8 || true
 python - <<'PY'
 import os
 from huggingface_hub import HfApi, HfFolder
 repo=os.environ.get("SELF_HF_REPO_ID","carlex3321/aduc-sdr")
 token=os.getenv("HF_TOKEN") or HfFolder.get_token()
 if not token:
-    raise SystemExit("HF_TOKEN ausente; upload desabilitado")
 api=HfApi(token=token)
 api.upload_folder(
-    folder_path="/app/wheels",
-    repo_id=repo,
-    repo_type="model",
-    allow_patterns=["*.whl","NGC-DL-CONTAINER-LICENSE"],
-    ignore_patterns=["**/src/**","**/*.log","**/logs/**",".git/**"],
 )
 print("Upload concluído (wheels + licença).")
 PY
 chmod -R 777 /app/wheels || true
 echo "✅ Builder finalizado."

 #!/usr/bin/env bash
 set -euo pipefail
+echo "🚀 Builder (Apex + Q8) — runtime, GPU visível, cache persistente"
+# ===== Persistência e caches =====
+# Prioriza /data (HF Spaces) e mantém compatibilidade com /app
+if [ -d /data ]; then
+  export HF_HOME="${HF_HOME:-/data/.cache/huggingface}"
+  export TORCH_HOME="${TORCH_HOME:-/data/.cache/torch}"
+else
+  export HF_HOME="${HF_HOME:-/app/.cache/huggingface}"
+  export TORCH_HOME="${TORCH_HOME:-/app/.cache/torch}"
+fi
 export HF_HUB_CACHE="${HF_HUB_CACHE:-$HF_HOME/hub}"
+mkdir -p "$HF_HOME" "$HF_HUB_CACHE" "$TORCH_HOME"
+# Symlink de compatibilidade (se scripts esperarem /app/.cache/huggingface)
+mkdir -p /app/.cache
+ln -sf "$HF_HOME" /app/.cache/huggingface
+# ===== Repositório de wheels no Hub =====
+export SELF_HF_REPO_ID="${SELF_HF_REPO_ID:-carlex3321/aduc-sdr}"
+# ===== Aceleração de transferência =====
 export HF_HUB_ENABLE_HF_TRANSFER="${HF_HUB_ENABLE_HF_TRANSFER:-1}"
+export HF_HUB_DOWNLOAD_TIMEOUT="${HF_HUB_DOWNLOAD_TIMEOUT:-60}"
+# ===== Diretórios de trabalho =====
+mkdir -p /app/wheels /app/cuda_cache /app/wheels/src
 chmod -R 777 /app/wheels || true
 export CUDA_CACHE_PATH="/app/cuda_cache"
+# Licença (NVIDIA NGC) se presente
 if [ -f "/NGC-DL-CONTAINER-LICENSE" ]; then
   cp -f /NGC-DL-CONTAINER-LICENSE /app/wheels/NGC-DL-CONTAINER-LICENSE || true
 fi
+# ===== Dependências mínimas de build =====
 python -m pip install -v -U pip build setuptools wheel hatchling hatch-vcs scikit-build-core cmake ninja packaging "huggingface_hub[hf_transfer]" || true
 # ===== Tags de ambiente (Python/CUDA/Torch) =====
 PY_TAG="$(python -c 'import sys; print(f"cp{sys.version_info[0]}{sys.version_info[1]}")' 2>/dev/null || echo cp310)"
 TORCH_VER="$(python - <<'PY'
 try:
+  import torch, re
+  v = torch.__version__
+  print(re.sub(r'\+.*$', '', v))
 except Exception:
+  print("unknown")
 PY
 )"
 CU_TAG="$(python - <<'PY'
 try:
+  import torch
+  cu = getattr(torch.version, "cuda", None)
+  print("cu"+cu.replace(".","")) if cu else print("")
 except Exception:
+  print("")
 PY
 )"
 echo "[env] PY_TAG=${PY_TAG} TORCH_VER=${TORCH_VER} CU_TAG=${CU_TAG}"
 check_apex() {
 python - <<'PY'
 try:
+  from apex.normalization import FusedLayerNorm, FusedRMSNorm
+  import importlib; importlib.import_module("fused_layer_norm_cuda")
+  ok = True
 except Exception:
+  ok = False
 raise SystemExit(0 if ok else 1)
 PY
 }
 PY
 }
+# ===== Download de wheels do Hub =====
 install_from_hf () {
+  local PKG="$1" # 'apex' ou 'q8_kernels'
+  echo "[hub] Buscando wheel de ${PKG} em ${SELF_HF_REPO_ID} (py=${PY_TAG}, cu=${CU_TAG})"
   python - "$PKG" "$PY_TAG" "$CU_TAG" <<'PY' || exit 0
 import os, sys
 from huggingface_hub import HfApi, hf_hub_download, HfFolder
 pkg, py_tag, cu_tag = sys.argv[1], sys.argv[2], sys.argv[3]
 repo = os.environ.get("SELF_HF_REPO_ID","carlex3321/aduc-sdr")
 api = HfApi(token=os.getenv("HF_TOKEN") or HfFolder.get_token())
 try:
+  files = api.list_repo_files(repo_id=repo, repo_type="model")
 except Exception:
+  raise SystemExit(0)
 cands = [f for f in files if f.endswith(".whl") and f.rsplit("/",1)[-1].startswith(pkg+"-") and py_tag in f]
+pref = [f for f in cands if cu_tag and cu_tag in f] or cands
 if not pref:
+  raise SystemExit(0)
 target = sorted(pref, reverse=True)[0]
 print(target)
 path = hf_hub_download(repo_id=repo, filename=target, repo_type="model", local_dir="/app/wheels")
 # ===== Builders =====
 build_apex () {
   local SRC="/app/wheels/src/apex"
+  echo "[build] Fonte Apex em ${SRC}"
   if [ -d "$SRC/.git" ]; then
     git -C "$SRC" fetch --all -p || true
     git -C "$SRC" reset --hard HEAD || true
     rm -rf "$SRC"
     git clone --depth 1 https://github.com/NVIDIA/apex "$SRC"
   fi
   echo "[build] Compilando Apex -> wheel"
   export APEX_CPP_EXT=1 APEX_CUDA_EXT=1 APEX_ALL_CONTRIB_EXT=0
+  python -m pip wheel -v --no-build-isolation --no-deps "$SRC" -w /app/wheels || true
   local W="$(ls -t /app/wheels/apex-*.whl 2>/dev/null | head -n1 || true)"
   if [ -n "${W}" ]; then
+    python -m pip install -v -U --no-deps "${W}" || true
+    echo "[build] Apex instalado da wheel: ${W}"
   else
+    echo "[build] Nenhuma wheel Apex gerada; instalando do source"
+    python -m pip install -v --no-build-isolation "$SRC" || true
   fi
 }
   git clone --filter=blob:none "$Q8_REPO" "$SRC"
   git -C "$SRC" checkout "$Q8_COMMIT"
   git -C "$SRC" submodule update --init --recursive
   echo "[build] Compilando Q8 Kernels -> wheel"
+  python -m pip wheel -v --no-build-isolation "$SRC" -w /app/wheels || true
   local W="$(ls -t /app/wheels/q8_kernels-*.whl 2>/dev/null | head -n1 || true)"
   if [ -n "${W}" ]; then
+    python -m pip install -v -U --no-deps "${W}" || true
+    echo "[build] Q8 instalado da wheel: ${W}"
   else
+    echo "[build] Nenhuma wheel q8_kernels gerada; instalando do source"
+    python -m pip install -v --no-build-isolation "$SRC" || true
   fi
 }
 # ===== Pipeline genérico =====
 ensure_pkg () {
+  local PKG="$1"       # apex | q8_kernels
+  local CHECK_FN="$2"  # check_apex | check_q8
+  local BUILD_FN="$3"  # build_apex | build_q8
   echo "[flow] === ${PKG} ==="
   if ${CHECK_FN}; then
     echo "[flow] ${PKG}: já instalado (import OK)"
     return 0
   if [ -n "${HF_OUT:-}" ]; then
     WHEEL_PATH="$(printf "%s\n" "${HF_OUT}" | tail -n1)"
     echo "[hub] Baixado: ${WHEEL_PATH}"
+    python -m pip install -v -U --no-build-isolation "${WHEEL_PATH}" || true
     if ${CHECK_FN}; then
       echo "[flow] ${PKG}: sucesso via Hub (${WHEEL_PATH})"
       return 0
     return 0
   fi
+  echo "[flow] ${PKG}: falhou após build; seguindo adiante"
   return 1
 }
 ensure_pkg "apex" check_apex build_apex || true
 ensure_pkg "q8_kernels" check_q8 build_q8 || true
+# ===== Upload das wheels geradas (opcional) =====
 python - <<'PY'
 import os
 from huggingface_hub import HfApi, HfFolder
 repo=os.environ.get("SELF_HF_REPO_ID","carlex3321/aduc-sdr")
 token=os.getenv("HF_TOKEN") or HfFolder.get_token()
 if not token:
+  raise SystemExit("HF_TOKEN ausente; upload desabilitado")
 api=HfApi(token=token)
 api.upload_folder(
+  folder_path="/app/wheels",
+  repo_id=repo,
+  repo_type="model",
+  allow_patterns=["*.whl","NGC-DL-CONTAINER-LICENSE"],
+  ignore_patterns=["**/src/**","**/*.log","**/logs/**",".git/**"],
 )
 print("Upload concluído (wheels + licença).")
 PY
 chmod -R 777 /app/wheels || true
 echo "✅ Builder finalizado."

start.sh CHANGED Viewed

@@ -32,28 +32,54 @@ export NCCL_BLOCKING_WAIT=1
 export TORCH_NCCL_BLOCKING_WAIT=1
 export NCCL_TIMEOUT=600
-# HF caches
-export HF_HOME=/app/.cache/huggingface
-unset TRANSFORMERS_CACHE
-# ---------------------- Baixar o modelo antes de iniciar ----------------------
-echo "Criando diretório de cache se não existir..."
-mkdir -p /app/.cache/huggingface/hub
-# Ativando hf_transfer para downloads mais rápidos
 export HF_HUB_ENABLE_HF_TRANSFER=1
 export HF_HUB_DOWNLOAD_TIMEOUT=60
 MODEL_REPO="ByteDance-Seed/VINCIE-3B"
 retry_count=0
 max_retries=3
 while [ $retry_count -lt $max_retries ]; do
-  echo "Tentativa $((retry_count+1)) de baixar o modelo $MODEL_REPO..."
-  python -c "import os; from huggingface_hub import snapshot_download; os.environ['HF_HOME']='/app/.cache/huggingface'; from os import getenv; snapshot_download(repo_id='$MODEL_REPO', cache_dir=os.path.join(os.environ['HF_HOME'], 'hub'), resume_download=True, token=getenv('HF_TOKEN'))" && break
   retry_count=$((retry_count+1))
-  echo "Falha na tentativa $retry_count. Tentando novamente em 10 segundos..."
   sleep 10
   if [ $retry_count -eq $max_retries ]; then
     echo "Erro: Falha ao baixar o modelo após $max_retries tentativas."
@@ -61,19 +87,20 @@ while [ $retry_count -lt $max_retries ]; do
   fi
 done
-ls -la /app/.cache/huggingface/hub || echo "Cache não encontrado após download."
 # ---------------------- Builder Apex/Q8 ----------------------
 if nvidia-smi >/dev/null 2>&1; then
   if [ "${DISABLE_BUILDER:-0}" -eq 0 ]; then
     echo "Executando builder Apex/Q8..."
-    chmod +x /app/builder.sh || true
-    # Executa com GPU disponível, busca wheels no HF e compila se necessário (sem FlashAttention)
-    SELF_HF_REPO_ID=carlex3321/aduc-sdr  # repo de wheels no HF
-    HF_UPLOAD_WHEELS=0  # publica wheels geradas
-    BUILDER_TIMEOUT_SEC=6000000  # tempo limite
-    Q8_REPO="" Q8_COMMIT=""  # pin do LTX Q8
-    timeout ${BUILDER_TIMEOUT_SEC:-60000} bash -lc /app/builder.sh || echo "Builder excedeu tempo/retornou erro, prosseguindo com a aplicação."
   else
     echo "Builder desabilitado por DISABLE_BUILDER=1"
   fi
@@ -81,16 +108,21 @@ else
   echo "GPU não visível, pulando builder Apex/Q8."
 fi
-# ---------------------- Banner ----------------------
-./info.sh || true
-ls -la /app && ls -R /app | head -n 2000
 echo "🚀 Subindo serviços..."
-# Exemplo: subir UI mínima SD Img2Img (ajuste conforme seu app)
-# python app_animatediff_min.py
-# Ou subir VINCIE UI se for o caso
-python app_vince.py

 export TORCH_NCCL_BLOCKING_WAIT=1
 export NCCL_TIMEOUT=600
+# ---------------------- Persistence: /data ----------------------
+# Keep the Hugging Face and Torch caches on the /data volume only when it
+# exists AND is writable by the current user; otherwise fall back to the
+# cache directories under /app.
+if [ -d /data ] && [ -w /data ]; then
+  export HF_HOME="/data/.cache/huggingface"
+  export TORCH_HOME="/data/.cache/torch"
+  mkdir -p "$HF_HOME/hub" "$TORCH_HOME"
+  # Compatibility symlink for anything that still reads /app/.cache/huggingface.
+  mkdir -p /app/.cache
+  if [ -d /app/.cache/huggingface ] && [ ! -L /app/.cache/huggingface ]; then
+    # A real directory already occupies the link path: `ln -sf` would create
+    # the link *inside* it, so leave it in place and report instead.
+    echo "Aviso: /app/.cache/huggingface já existe como diretório; symlink não criado."
+  else
+    # -n replaces an existing symlink instead of following it into its target.
+    ln -sfn "$HF_HOME" /app/.cache/huggingface
+  fi
+else
+  export HF_HOME="/app/.cache/huggingface"
+  export TORCH_HOME="/app/.cache/torch"
+  mkdir -p "$HF_HOME/hub" "$TORCH_HOME"
+fi
+unset TRANSFORMERS_CACHE  # avoid conflicts with the other cache settings
+# Respect a pre-set HF_HUB_CACHE; default to the hub directory under HF_HOME.
+export HF_HUB_CACHE="${HF_HUB_CACHE:-$HF_HOME/hub}"
 export HF_HUB_ENABLE_HF_TRANSFER=1
 export HF_HUB_DOWNLOAD_TIMEOUT=60
+# ---------------------- Pré-download do modelo ----------------------
 MODEL_REPO="ByteDance-Seed/VINCIE-3B"
+echo "Baixando o modelo ${MODEL_REPO} para cache persistente em $HF_HUB_CACHE..."
 retry_count=0
 max_retries=3
 while [ $retry_count -lt $max_retries ]; do
+  echo "Tentativa $((retry_count+1)) de snapshot_download..."
+  # Record the real exit status of the download. Appending `|| true` to the
+  # command would force the status to 0 and end the retry loop after the first
+  # attempt even when the download failed; `|| status=$?` keeps the failure
+  # code without tripping `set -e`.
+  status=0
+  MODEL_REPO="${MODEL_REPO:-}" python - <<'PY' || status=$?
+import os
+from huggingface_hub import snapshot_download
+hf_home = os.environ.get("HF_HOME","/app/.cache/huggingface")
+# Download into HF_HUB_CACHE when it is set, falling back to <HF_HOME>/hub.
+cache_dir = os.environ.get("HF_HUB_CACHE") or os.path.join(hf_home, "hub")
+os.makedirs(cache_dir, exist_ok=True)
+# The heredoc delimiter is quoted, so the shell expands nothing in here; the
+# repository id arrives through the environment, with the previous literal
+# as the fallback.
+repo_id = os.environ.get("MODEL_REPO") or "ByteDance-Seed/VINCIE-3B"
+token = os.getenv("HF_TOKEN")
+try:
+  # NOTE(review): resume_download is reported as deprecated by recent
+  # huggingface_hub releases; confirm against the pinned version.
+  snapshot_download(repo_id=repo_id, cache_dir=cache_dir, resume_download=True, token=token)
+  print("Download concluído.")
+except Exception as e:
+  print(f"Erro no download: {e}")
+  raise
+PY
+  if [ "$status" -eq 0 ]; then
+    break
+  fi
   retry_count=$((retry_count+1))
+  echo "Falha na tentativa $retry_count. Tentando novamente em 10s..."
   sleep 10
   if [ $retry_count -eq $max_retries ]; then
     echo "Erro: Falha ao baixar o modelo após $max_retries tentativas."
   fi
 done
+ls -la "$HF_HUB_CACHE" || echo "Cache não encontrado após download."
 # ---------------------- Builder Apex/Q8 ----------------------
 if nvidia-smi >/dev/null 2>&1; then
   if [ "${DISABLE_BUILDER:-0}" -eq 0 ]; then
     echo "Executando builder Apex/Q8..."
+    # Prefer the revised builder (/app/builder-7.sh) when it is present and
+    # fall back to /app/builder.sh; either way the run is bounded by
+    # BUILDER_TIMEOUT_SEC (default 7200) and a failure does not stop startup.
+    builder_script=/app/builder.sh
+    if [ -f /app/builder-7.sh ]; then
+      builder_script=/app/builder-7.sh
+      chmod +x "$builder_script"
+    else
+      chmod +x "$builder_script" || true
+    fi
+    timeout "${BUILDER_TIMEOUT_SEC:-7200}" bash -lc "$builder_script" || echo "Builder excedeu tempo/erro, prosseguindo."
   else
     echo "Builder desabilitado por DISABLE_BUILDER=1"
   fi
   echo "GPU não visível, pulando builder Apex/Q8."
 fi
+# ---------------------- Diagnóstico e listagem ----------------------
+/app/info.sh || true
+echo "Estrutura em /app:"
+ls -la /app | sed -n '1,200p'
+echo "Estrutura em $HF_HOME:"
+ls -la "$HF_HOME" | sed -n '1,200p'
+# ---------------------- Subindo serviço ----------------------
 echo "🚀 Subindo serviços..."
+# Se o seu entrypoint é a UI Gradio:
+if [ -f /app/app_vince.py ]; then
+  python /app/app_vince.py
+elif [ -f /app/vince.py ]; then
+  python /app/vince.py
+else
+  echo "Nenhum entrypoint encontrado (app_vince.py ou vince.py)."
+  exit 1
+fi