Test

Paused

App Files Community

Eueuiaa committed on Oct 10

Commit

cae55d9

verified ·

1 Parent(s): eb6e96e

Update api/ltx_server_refactored.py

Browse files

Files changed (1) hide show

api/ltx_server_refactored.py +54 -49

api/ltx_server_refactored.py CHANGED Viewed

@@ -1,17 +1,7 @@
 # ltx_server_refactored.py — VideoService (Modular Version with Simple Overlap Chunking)
-# --- 0. WARNINGS E AMBIENTE ---
 import warnings
-warnings.filterwarnings("ignore", category=UserWarning)
-warnings.filterwarnings("ignore", category=FutureWarning)
-warnings.filterwarnings("ignore", message=".*")
 from huggingface_hub import logging
-logging.set_verbosity_error()
-logging.set_verbosity_warning()
-logging.set_verbosity_info()
-logging.set_verbosity_debug()
-LTXV_DEBUG=1
-LTXV_FRAME_LOG_EVERY=8
 import os, subprocess, shlex, tempfile
 import torch
 import json
@@ -38,8 +28,18 @@ from einops import rearrange
 import torch.nn.functional as F
 from managers.vae_manager import vae_manager_singleton
 from tools.video_encode_tool import video_encode_tool_singleton
 DEPS_DIR = Path("/data")
 LTX_VIDEO_REPO_DIR = DEPS_DIR / "LTX-Video"
 # (Todas as funções de setup, helpers e inicialização da classe permanecem inalteradas)
 # ... (run_setup, add_deps_to_path, _query_gpu_processes_via_nvml, etc.)
@@ -99,27 +99,6 @@ from api.ltx.inference import (
 )
 class VideoService:
-    def __init__(self):
-        t0 = time.perf_counter()
-        print("[DEBUG] Inicializando VideoService...")
-        self.device = gpu_manager.get_ltx_device()
-        print(f"[DEBUG] LTX foi alocado para o dispositivo: {self.device}")
-        self.device = "cuda" if torch.cuda.is_available() else "cpu"
-        self.config = self._load_config()
-        self.pipeline, self.latent_upsampler = self._load_models()
-        self.pipeline.to(self.device)
-        if self.latent_upsampler:
-            self.latent_upsampler.to(self.device)
-        self._apply_precision_policy()
-        vae_manager_singleton.attach_pipeline(
-            self.pipeline,
-            device=self.device,
-            autocast_dtype=self.runtime_autocast_dtype
-        )
-        self._tmp_dirs = set()
-        print(f"[DEBUG] VideoService pronto. boot_time={time.perf_counter()-t0:.3f}s")
     def _load_config(self):
         base = LTX_VIDEO_REPO_DIR / "configs"
         config_path = base / "ltxv-13b-0.9.8-distilled-fp8.yaml"
@@ -143,20 +122,6 @@ class VideoService:
             self._log_gpu_memory("Após finalize")
         except Exception as e:
             print(f"[DEBUG] Log GPU pós-finalize falhou: {e}")
-    def move_to_device(self, device):
-        """Move os modelos do pipeline para o dispositivo especificado."""
-        print(f"[LTX] Movendo modelos para {device}...")
-        self.pipeline.to(device)
-        if self.latent_upsampler:
-            self.latent_upsampler.to(device)
-        self.device = device
-    def move_to_cpu(self):
-        """Move os modelos para a CPU para liberar VRAM."""
-        self.move_to_device(torch.device("cpu"))
-        if torch.cuda.is_available():
-            torch.cuda.empty_cache()
     def _load_models(self):
         t0 = time.perf_counter()
@@ -559,11 +524,51 @@ class VideoService:
         final_pixel_tensor = torch.cat(pixel_chunks_to_concat, dim=2)
         final_video_path = self._save_and_log_video(final_pixel_tensor, f"final_concatenated_{seed}", fps, temp_dir, results_dir, seed)
         return final_video_path
-# --- INSTANCIAÇÃO DO SERVIÇO ---
 print("Criando instância do VideoService...")
 video_generation_service = VideoService()
-print("Instância do VideoService pronta.")
-self.device = gpu_manager.get_ltx_device()
-print(f"[DEBUG] LTX foi alocado para o dispositivo: {self.device}")

 # ltx_server_refactored.py — VideoService (Modular Version with Simple Overlap Chunking)
 import warnings
 from huggingface_hub import logging
 import os, subprocess, shlex, tempfile
 import torch
 import json
 import torch.nn.functional as F
 from managers.vae_manager import vae_manager_singleton
 from tools.video_encode_tool import video_encode_tool_singleton
 DEPS_DIR = Path("/data")
 LTX_VIDEO_REPO_DIR = DEPS_DIR / "LTX-Video"
+logging.set_verbosity_error()
+logging.set_verbosity_warning()
+logging.set_verbosity_info()
+logging.set_verbosity_debug()
+LTXV_DEBUG=1
+LTXV_FRAME_LOG_EVERY=8
+warnings.filterwarnings("ignore", category=UserWarning)
+warnings.filterwarnings("ignore", category=FutureWarning)
+warnings.filterwarnings("ignore", message=".*")
 # (Todas as funções de setup, helpers e inicialização da classe permanecem inalteradas)
 # ... (run_setup, add_deps_to_path, _query_gpu_processes_via_nvml, etc.)
 )
 class VideoService:
     def _load_config(self):
         base = LTX_VIDEO_REPO_DIR / "configs"
         config_path = base / "ltxv-13b-0.9.8-distilled-fp8.yaml"
             self._log_gpu_memory("Após finalize")
         except Exception as e:
             print(f"[DEBUG] Log GPU pós-finalize falhou: {e}")
     def _load_models(self):
         t0 = time.perf_counter()
         final_pixel_tensor = torch.cat(pixel_chunks_to_concat, dim=2)
         final_video_path = self._save_and_log_video(final_pixel_tensor, f"final_concatenated_{seed}", fps, temp_dir, results_dir, seed)
         return final_video_path
+    def __init__(self):
+        t0 = time.perf_counter()
+        print("[DEBUG] Inicializando VideoService...")
+        # 1. Obter o dispositivo alvo a partir do gerenciador
+        #    Não definimos `self.device` ainda, apenas guardamos o alvo.
+        target_device = gpu_manager.get_ltx_device()
+        print(f"[DEBUG] LTX foi alocado para o dispositivo: {target_device}")
+        # 2. Carregar a configuração e os modelos (na CPU, como a função _load_models faz)
+        self.config = self._load_config()
+        self.pipeline, self.latent_upsampler = self._load_models()
+        # 3. Mover os modelos para o dispositivo alvo e definir `self.device`
+        self.move_to_device(target_device) # Usando a função que já criamos!
+        # 4. Configurar o resto dos componentes com o dispositivo correto
+        self._apply_precision_policy()
+        vae_manager_singleton.attach_pipeline(
+            self.pipeline,
+            device=self.device, # Agora `self.device` está correto
+            autocast_dtype=self.runtime_autocast_dtype
+        )
+        self._tmp_dirs = set()
+        print(f"[DEBUG] VideoService pronto. boot_time={time.perf_counter()-t0:.3f}s")
+    # A função move_to_device que criamos antes é essencial aqui
+    def move_to_device(self, device):
+        """Move os modelos do pipeline para o dispositivo especificado."""
+        print(f"[LTX] Movendo modelos para {device}...")
+        self.device = torch.device(device) # Garante que é um objeto torch.device
+        self.pipeline.to(self.device)
+        if self.latent_upsampler:
+            self.latent_upsampler.to(self.device)
+        print(f"[LTX] Modelos agora estão em {self.device}.")
+    def move_to_cpu(self):
+        """Move os modelos para a CPU para liberar VRAM."""
+        self.move_to_device(torch.device("cpu"))
+        if torch.cuda.is_available():
+            torch.cuda.empty_cache()
+# Instanciação limpa, sem usar `self` fora da classe.
 print("Criando instância do VideoService...")
 video_generation_service = VideoService()
+print("Instância do VideoService pronta.")