SeedVR2

Paused

App Files Files Community

aducsdr committed on Sep 9

Commit

53cc24b

verified ·

1 Parent(s): 40e8355

Upload 2 files

Browse files

Files changed (2) hide show

ai_studio_code (20).txt +29 -0
ai_studio_code (6).py +164 -0

ai_studio_code (20).txt ADDED Viewed

	@@ -0,0 +1,29 @@

+# Dependências do SeedVR
+torch==2.1.0
+torchvision==0.16.0
+torchaudio==2.1.0
+accelerate==0.24.1
+av==11.0.0
+beautifulsoup4==4.12.2
+einops==0.7.0
+gradio
+huggingface_hub
+iopath==0.1.10
+ipython==8.17.2
+omegaconf==2.3.0
+pandas==2.1.3
+pytorch-lightning==2.1.0
+pytorchvideo==0.1.5
+ftfy==6.1.1
+regex==2023.10.3
+timm==0.9.10
+transformers==4.35.2
+tqdm==4.66.1
+webdataset==0.2.70
+diffusers==0.26.3
+controlnet_aux==0.0.7
+opencv-python
+scikit-image
+xformers==0.0.22.post7
+# Dependência com instalação especial (tratada no app.py)
+# flash_attn==2.5.9.post1 --no-build-isolation

ai_studio_code (6).py ADDED Viewed

	@@ -0,0 +1,164 @@

+import gradio as gr
+import subprocess
+import os
+import sys
+import threading
+from huggingface_hub import snapshot_download
+# --- 1. INITIAL SETUP (runs once, at module import) ---
+# Base directory of the SeedVR project checkout. It is a relative path, so it
+# is resolved against the process working directory wherever it is used.
+SEEDVR_DIR = "SeedVR"
+def setup():
+    """
+    Clona o repositório, instala dependências especiais e baixa o modelo.
+    Esta função é executada uma vez quando o Space é iniciado.
+    """
+    print("--- Iniciando configuração do ambiente ---")
+    # Etapa 1: Clonar o repositório SeedVR se ainda não existir
+    if not os.path.exists(SEEDVR_DIR):
+        print(f"Clonando o repositório SeedVR de https://github.com/bytedance-seed/SeedVR.git...")
+        subprocess.run(["git", "clone", "https://github.com/bytedance-seed/SeedVR.git"], check=True)
+    else:
+        print("Repositório SeedVR já existe.")
+    # Mudando para o diretório do projeto para os próximos comandos
+    os.chdir(SEEDVR_DIR)
+    # Etapa 2: Instalar dependências que exigem comandos específicos
+    print("Instalando flash_attn...")
+    subprocess.run([sys.executable, "-m", "pip", "install", "flash_attn==2.5.9.post1", "--no-build-isolation"], check=True)
+    # Nota sobre o Apex: O arquivo .whl precisa estar no seu repositório Hugging Face
+    apex_whl_path = "apex-0.1-cp310-cp310-linux_x86_64.whl"
+    if os.path.exists(apex_whl_path):
+        print(f"Instalando {apex_whl_path}...")
+        subprocess.run([sys.executable, "-m", "pip", "install", apex_whl_path], check=True)
+    else:
+        print(f"AVISO: Arquivo '{apex_whl_path}' não encontrado. A instalação do Apex foi pulada. Por favor, adicione este arquivo ao seu repositório.")
+    # Etapa 3: Baixar o modelo do Hugging Face Hub
+    save_dir = "ckpts/"
+    repo_id = "ByteDance-Seed/SeedVR2-3B"
+    cache_dir = os.path.join(save_dir, "cache")
+    if not os.path.exists(os.path.join(save_dir, "README.md")): # Checa se o download já foi feito
+        print(f"Baixando o modelo '{repo_id}' para '{save_dir}'...")
+        snapshot_download(
+            cache_dir=cache_dir,
+            local_dir=save_dir,
+            repo_id=repo_id,
+            local_dir_use_symlinks=False,
+            resume_download=True,
+            allow_patterns=["*.json", "*.safetensors", "*.pth", "*.bin", "*.py", "*.md", "*.txt"],
+        )
+    else:
+        print("Modelo já foi baixado.")
+    print("--- Configuração do ambiente concluída ---")
+    # Retornar ao diretório raiz original
+    os.chdir("..")
+# Executa a configuração
+setup()
+# --- 2. LÓGICA DA INFERÊNCIA ---
+def run_inference(video_path, seed, res_h, res_w, sp_size, progress=gr.Progress(track_tqdm=True)):
+    """
+    Executa o script de inferência do SeedVR usando torchrun.
+    """
+    if video_path is None:
+        return None, "Por favor, faça o upload de um arquivo de vídeo de entrada."
+    input_folder = os.path.dirname(video_path.name)
+    output_folder = "outputs"
+    os.makedirs(output_folder, exist_ok=True)
+    # Determinar o número de GPUs disponíveis. Para 4xL40s, será 4.
+    num_gpus = 4
+    command = [
+        "torchrun",
+        f"--nproc-per-node={num_gpus}",
+        "projects/inference_seedvr2_3b.py",
+        "--video_path", input_folder,
+        "--output_dir", f"../{output_folder}", # Navega para fora do dir SeedVR
+        "--seed", str(seed),
+        "--res_h", str(res_h),
+        "--res_w", str(res_w),
+        "--sp_size", str(sp_size),
+    ]
+    log_output = ""
+    try:
+        print(f"Executando comando: {' '.join(command)}")
+        # Executar o comando dentro do diretório SeedVR
+        process = subprocess.Popen(
+            command,
+            cwd=SEEDVR_DIR,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.STDOUT,
+            text=True,
+            encoding='utf-8'
+        )
+        # Capturar e exibir a saída em tempo real
+        while True:
+            line = process.stdout.readline()
+            if not line:
+                break
+            log_output += line
+            print(line, end='')
+            yield None, log_output
+        process.wait()
+        if process.returncode != 0:
+            raise subprocess.CalledProcessError(process.returncode, command, output=log_output)
+        # Encontrar os arquivos de vídeo gerados
+        result_files = [os.path.join(output_folder, f) for f in os.listdir(output_folder) if f.endswith(('.mp4', '.avi', '.mov'))]
+        if not result_files:
+             return None, log_output + "\n\nERRO: Nenhum arquivo de vídeo foi gerado."
+        return result_files, log_output
+    except subprocess.CalledProcessError as e:
+        error_message = f"Erro ao executar a inferência.\nOutput:\n{e.output}"
+        print(error_message)
+        return None, error_message
+    except Exception as e:
+        return None, f"Ocorreu um erro inesperado: {str(e)}"
+# --- 3. INTERFACE GRAPHEMICA (GRADIO) ---
+with gr.Blocks() as demo:
+    gr.Markdown("# 🎥 Interface de Inferência para SeedVR2")
+    gr.Markdown("Faça o upload de um vídeo, ajuste os parâmetros e clique em 'Gerar Vídeo' para iniciar a inferência.")
+    with gr.Row():
+        with gr.Column(scale=1):
+            video_input = gr.File(label="Vídeo de Entrada (.mp4, .mov, etc.)")
+            seed_input = gr.Number(label="Seed", value=123)
+            res_h_input = gr.Number(label="Altura da Saída (res_h)", value=320)
+            res_w_input = gr.Number(label="Largura da Saída (res_w)", value=512)
+            sp_size_input = gr.Number(label="Tamanho do passo espacial (sp_size)", value=1)
+            run_button = gr.Button("Gerar Vídeo", variant="primary")
+        with gr.Column(scale=2):
+            gallery_output = gr.Gallery(label="Vídeo Gerado", show_label=True, elem_id="gallery")
+            log_display = gr.Textbox(label="Logs de Execução", lines=15, interactive=False)
+    run_button.click(
+        fn=run_inference,
+        inputs=[video_input, seed_input, res_h_input, res_w_input, sp_size_input],
+        outputs=[gallery_output, log_display]
+    )
+if __name__ == "__main__":
+    demo.launch()