Carlos s committed on
Commit
b5542bb
·
verified ·
1 Parent(s): a614adb

Update api/ltx_server.py

Browse files
Files changed (1) hide show
  1. api/ltx_server.py +17 -9
api/ltx_server.py CHANGED
@@ -587,7 +587,6 @@ class VideoService:
587
 
588
  print("[DEBUG] Multi-escala: Iniciando Passo 1 (geração de latentes base).")
589
 
590
- # 1. Configurar e executar o primeiro passo
591
  first_pass_args = self.config.get("first_pass", {}).copy()
592
  first_pass_kwargs = call_kwargs.copy()
593
  first_pass_kwargs.update({
@@ -596,33 +595,41 @@ class VideoService:
596
  "rescaling_scale": first_pass_args.get("rescaling_scale"),
597
  "skip_block_list": first_pass_args.get("skip_block_list"),
598
  })
599
- # Opcional: ajustar timesteps se especificado no config
600
  schedule = first_pass_args.get("timesteps") or first_pass_args.get("guidance_timesteps")
601
  if schedule:
602
  first_pass_kwargs["timesteps"] = schedule
603
  first_pass_kwargs["guidance_timesteps"] = schedule
604
 
605
- # Reduzir dimensões para o primeiro passo
606
  downscale_factor = self.config.get("downscale_factor", 2)
607
  original_height = first_pass_kwargs["height"]
608
  original_width = first_pass_kwargs["width"]
609
- first_pass_kwargs["height"] = original_height // downscale_factor
610
- first_pass_kwargs["width"] = original_width // downscale_factor
 
 
 
 
 
 
 
611
 
612
- print(f"[DEBUG] Passo 1: Dimensões reduzidas para {first_pass_kwargs['height']}x{first_pass_kwargs['width']}")
 
 
 
 
 
613
 
614
  t_p1 = time.perf_counter()
615
  ctx = torch.autocast(device_type="cuda", dtype=self.runtime_autocast_dtype) if self.device == "cuda" else contextlib.nullcontext()
616
  with ctx:
617
- # Executa a pipeline principal para o primeiro passo
618
  first_pass_result = self.pipeline(**first_pass_kwargs)
619
 
620
- # Extrai os latentes do resultado
621
  latents_low_res = first_pass_result.latents if hasattr(first_pass_result, "latents") else first_pass_result
622
  print(f"[DEBUG] Passo 1 concluído em {time.perf_counter()-t_p1:.3f}s. Shape dos latentes de baixa resolução: {tuple(latents_low_res.shape)}")
623
  log_tensor_info(latents_low_res, "Latentes (Passo 1)")
624
 
625
- # Limpeza de memória entre os passos
626
  del first_pass_result, first_pass_kwargs
627
  gc.collect()
628
  if self.device == "cuda": torch.cuda.empty_cache()
@@ -644,6 +651,7 @@ class VideoService:
644
  print("[DEBUG] Multi-escala: Iniciando Passo 2 (refinamento em alta resolução).")
645
  second_pass_args = self.config.get("second_pass", {}).copy()
646
  second_pass_kwargs = call_kwargs.copy()
 
647
  second_pass_kwargs.update({
648
  "guidance_scale": float(guidance_scale),
649
  "stg_scale": second_pass_args.get("stg_scale"),
 
587
 
588
  print("[DEBUG] Multi-escala: Iniciando Passo 1 (geração de latentes base).")
589
 
 
590
  first_pass_args = self.config.get("first_pass", {}).copy()
591
  first_pass_kwargs = call_kwargs.copy()
592
  first_pass_kwargs.update({
 
595
  "rescaling_scale": first_pass_args.get("rescaling_scale"),
596
  "skip_block_list": first_pass_args.get("skip_block_list"),
597
  })
 
598
  schedule = first_pass_args.get("timesteps") or first_pass_args.get("guidance_timesteps")
599
  if schedule:
600
  first_pass_kwargs["timesteps"] = schedule
601
  first_pass_kwargs["guidance_timesteps"] = schedule
602
 
603
+ # ==================== NOVA LÓGICA DE DIMENSÕES AQUI ====================
604
  downscale_factor = self.config.get("downscale_factor", 2)
605
  original_height = first_pass_kwargs["height"]
606
  original_width = first_pass_kwargs["width"]
607
+ divisor = 24
608
+
609
+ # Calcula a altura para o primeiro passo, garantindo divisibilidade
610
+ target_height_p1 = original_height // downscale_factor
611
+ first_pass_kwargs["height"] = round(target_height_p1 / divisor) * divisor
612
+
613
+ # Calcula a largura para o primeiro passo, garantindo divisibilidade
614
+ target_width_p1 = original_width // downscale_factor
615
+ first_pass_kwargs["width"] = round(target_width_p1 / divisor) * divisor
616
 
617
+ # Medida de segurança para evitar dimensões zero
618
+ if first_pass_kwargs["height"] == 0: first_pass_kwargs["height"] = divisor
619
+ if first_pass_kwargs["width"] == 0: first_pass_kwargs["width"] = divisor
620
+ # =======================================================================
621
+
622
+ print(f"[DEBUG] Passo 1: Dimensões reduzidas e ajustadas para {first_pass_kwargs['height']}x{first_pass_kwargs['width']}")
623
 
624
  t_p1 = time.perf_counter()
625
  ctx = torch.autocast(device_type="cuda", dtype=self.runtime_autocast_dtype) if self.device == "cuda" else contextlib.nullcontext()
626
  with ctx:
 
627
  first_pass_result = self.pipeline(**first_pass_kwargs)
628
 
 
629
  latents_low_res = first_pass_result.latents if hasattr(first_pass_result, "latents") else first_pass_result
630
  print(f"[DEBUG] Passo 1 concluído em {time.perf_counter()-t_p1:.3f}s. Shape dos latentes de baixa resolução: {tuple(latents_low_res.shape)}")
631
  log_tensor_info(latents_low_res, "Latentes (Passo 1)")
632
 
 
633
  del first_pass_result, first_pass_kwargs
634
  gc.collect()
635
  if self.device == "cuda": torch.cuda.empty_cache()
 
651
  print("[DEBUG] Multi-escala: Iniciando Passo 2 (refinamento em alta resolução).")
652
  second_pass_args = self.config.get("second_pass", {}).copy()
653
  second_pass_kwargs = call_kwargs.copy()
654
+
655
  second_pass_kwargs.update({
656
  "guidance_scale": float(guidance_scale),
657
  "stg_scale": second_pass_args.get("stg_scale"),