AbstractPhil
/

tiny-flux-deep

@@ -41,12 +41,12 @@ from pathlib import Path
 class TinyFluxConfig:
     """
     Configuration for TinyFlux-Deep v4.1 model.
     This config fully defines the model architecture and can be used to:
     1. Initialize a new model
-    2. Convert checkpoints between versions
     3. Validate checkpoint compatibility
     All dimension constraints are validated on creation.
     """
@@ -105,10 +105,10 @@ class TinyFluxConfig:
                 f"num_attention_heads * attention_head_dim ({expected_hidden})"
             )
-        # Validate RoPE dimensions
         if isinstance(self.axes_dims_rope, list):
             self.axes_dims_rope = tuple(self.axes_dims_rope)
         rope_sum = sum(self.axes_dims_rope)
         if rope_sum != self.attention_head_dim:
             raise ValueError(
@@ -158,11 +158,11 @@ class TinyFluxConfig:
     def validate_checkpoint(self, state_dict: Dict[str, torch.Tensor]) -> List[str]:
         """
         Validate that a checkpoint matches this config.
         Returns list of warnings (empty if perfect match).
         """
         warnings = []
         # Check double block count
         max_double = 0
         for key in state_dict:
@@ -171,7 +171,7 @@ class TinyFluxConfig:
                 max_double = max(max_double, idx + 1)
         if max_double != self.num_double_layers:
             warnings.append(f"double_blocks: checkpoint has {max_double}, config expects {self.num_double_layers}")
         # Check single block count
         max_single = 0
         for key in state_dict:
@@ -180,25 +180,25 @@ class TinyFluxConfig:
                 max_single = max(max_single, idx + 1)
         if max_single != self.num_single_layers:
             warnings.append(f"single_blocks: checkpoint has {max_single}, config expects {self.num_single_layers}")
         # Check hidden size from a known weight
         if "img_in.weight" in state_dict:
             w = state_dict["img_in.weight"]
             if w.shape[0] != self.hidden_size:
                 warnings.append(f"hidden_size: checkpoint has {w.shape[0]}, config expects {self.hidden_size}")
         # Check for v4.1 components
         has_sol = any(k.startswith("sol_prior.") for k in state_dict)
         has_t5 = any(k.startswith("t5_pool.") for k in state_dict)
         has_lune = any(k.startswith("lune_predictor.") for k in state_dict)
         if self.use_sol_prior and not has_sol:
             warnings.append("config expects sol_prior but checkpoint missing it")
         if self.use_t5_vec and not has_t5:
             warnings.append("config expects t5_pool but checkpoint missing it")
         if self.use_lune_expert and not has_lune:
             warnings.append("config expects lune_predictor but checkpoint missing it")
         return warnings
@@ -1024,10 +1024,6 @@ class TinyFluxDeep(nn.Module):
         else:
             self.sol_prior = None
-        # === Legacy support ===
-        # Map old expert_predictor API to lune_predictor
-        self.expert_predictor = self.lune_predictor
         # Legacy guidance
         if cfg.guidance_embeds:
             self.guidance_in = MLPEmbedder(cfg.hidden_size)
@@ -1060,6 +1056,11 @@ class TinyFluxDeep(nn.Module):
         self.apply(_init)
         nn.init.zeros_(self.final_linear.weight)
     def forward(
         self,
         hidden_states: torch.Tensor,
@@ -1118,7 +1119,7 @@ class TinyFluxDeep(nn.Module):
         encoder_hidden_states = encoder_hidden_states.to(dtype=model_dtype)
         pooled_projections = pooled_projections.to(dtype=model_dtype)
         timestep = timestep.to(dtype=model_dtype)
         # Cast optional expert inputs if provided
         if lune_features is not None:
             lune_features = lune_features.to(dtype=model_dtype)

 class TinyFluxConfig:
     """
     Configuration for TinyFlux-Deep v4.1 model.
     This config fully defines the model architecture and can be used to:
     1. Initialize a new model
+    2. Convert checkpoints between versions
     3. Validate checkpoint compatibility
     All dimension constraints are validated on creation.
     """
                 f"num_attention_heads * attention_head_dim ({expected_hidden})"
             )
+        # Validate RoPE dimensions
         if isinstance(self.axes_dims_rope, list):
             self.axes_dims_rope = tuple(self.axes_dims_rope)
         rope_sum = sum(self.axes_dims_rope)
         if rope_sum != self.attention_head_dim:
             raise ValueError(
     def validate_checkpoint(self, state_dict: Dict[str, torch.Tensor]) -> List[str]:
         """
         Validate that a checkpoint matches this config.
         Returns list of warnings (empty if perfect match).
         """
         warnings = []
         # Check double block count
         max_double = 0
         for key in state_dict:
                 max_double = max(max_double, idx + 1)
         if max_double != self.num_double_layers:
             warnings.append(f"double_blocks: checkpoint has {max_double}, config expects {self.num_double_layers}")
         # Check single block count
         max_single = 0
         for key in state_dict:
                 max_single = max(max_single, idx + 1)
         if max_single != self.num_single_layers:
             warnings.append(f"single_blocks: checkpoint has {max_single}, config expects {self.num_single_layers}")
         # Check hidden size from a known weight
         if "img_in.weight" in state_dict:
             w = state_dict["img_in.weight"]
             if w.shape[0] != self.hidden_size:
                 warnings.append(f"hidden_size: checkpoint has {w.shape[0]}, config expects {self.hidden_size}")
         # Check for v4.1 components
         has_sol = any(k.startswith("sol_prior.") for k in state_dict)
         has_t5 = any(k.startswith("t5_pool.") for k in state_dict)
         has_lune = any(k.startswith("lune_predictor.") for k in state_dict)
         if self.use_sol_prior and not has_sol:
             warnings.append("config expects sol_prior but checkpoint missing it")
         if self.use_t5_vec and not has_t5:
             warnings.append("config expects t5_pool but checkpoint missing it")
         if self.use_lune_expert and not has_lune:
             warnings.append("config expects lune_predictor but checkpoint missing it")
         return warnings
         else:
             self.sol_prior = None
         # Legacy guidance
         if cfg.guidance_embeds:
             self.guidance_in = MLPEmbedder(cfg.hidden_size)
         self.apply(_init)
         nn.init.zeros_(self.final_linear.weight)
+    @property
+    def expert_predictor(self):
+        """Legacy API: alias that returns ``self.lune_predictor``.
+
+        Lets callers that still use the old ``expert_predictor`` name reach
+        the same object. This property takes the place of the former
+        ``self.expert_predictor = self.lune_predictor`` attribute assignment.
+        NOTE(review): no setter is visible here, so assignment through this
+        name is presumably no longer supported - confirm against callers.
+        """
+        return self.lune_predictor
     def forward(
         self,
         hidden_states: torch.Tensor,
         encoder_hidden_states = encoder_hidden_states.to(dtype=model_dtype)
         pooled_projections = pooled_projections.to(dtype=model_dtype)
         timestep = timestep.to(dtype=model_dtype)
         # Cast optional expert inputs if provided
         if lune_features is not None:
             lune_features = lune_features.to(dtype=model_dtype)