| | PRESET = { |
| | "full": { |
| | "enable_conv": True, |
| | "unet_target_module": [ |
| | "Transformer2DModel", |
| | "ResnetBlock2D", |
| | "Downsample2D", |
| | "Upsample2D", |
| | "HunYuanDiTBlock", |
| | "DoubleStreamBlock", |
| | "SingleStreamBlock", |
| | "SingleDiTBlock", |
| | "MMDoubleStreamBlock", |
| | "MMSingleStreamBlock", |
| | ], |
| | "unet_target_name": [ |
| | "conv_in", |
| | "conv_out", |
| | "time_embedding.linear_1", |
| | "time_embedding.linear_2", |
| | ], |
| | "text_encoder_target_module": [ |
| | "CLIPAttention", |
| | "CLIPSdpaAttention", |
| | "CLIPMLP", |
| | "MT5Block", |
| | "BertLayer", |
| | ], |
| | "text_encoder_target_name": [], |
| | }, |
| | "full-lin": { |
| | "enable_conv": False, |
| | "unet_target_module": [ |
| | "Transformer2DModel", |
| | "ResnetBlock2D", |
| | "HunYuanDiTBlock", |
| | "DoubleStreamBlock", |
| | "SingleStreamBlock", |
| | "SingleDiTBlock", |
| | "MMDoubleStreamBlock", |
| | "MMSingleStreamBlock", |
| | ], |
| | "unet_target_name": [ |
| | "time_embedding.linear_1", |
| | "time_embedding.linear_2", |
| | ], |
| | "text_encoder_target_module": [ |
| | "CLIPAttention", |
| | "CLIPSdpaAttention", |
| | "CLIPMLP", |
| | "MT5Block", |
| | "BertLayer", |
| | ], |
| | "text_encoder_target_name": [], |
| | }, |
| | "attn-mlp": { |
| | "enable_conv": False, |
| | "unet_target_module": [ |
| | "Transformer2DModel", |
| | "HunYuanDiTBlock", |
| | "DoubleStreamBlock", |
| | "SingleStreamBlock", |
| | "SingleDiTBlock", |
| | "MMDoubleStreamBlock", |
| | "MMSingleStreamBlock", |
| | ], |
| | "unet_target_name": [], |
| | "text_encoder_target_module": [ |
| | "CLIPAttention", |
| | "CLIPSdpaAttention", |
| | "CLIPMLP", |
| | "MT5Block", |
| | "BertLayer", |
| | ], |
| | "text_encoder_target_name": [], |
| | }, |
| | "attn-only": { |
| | "enable_conv": False, |
| | "unet_target_module": [ |
| | "CrossAttention", |
| | "SelfAttention", |
| | ], |
| | "unet_target_name": [], |
| | "text_encoder_target_module": [ |
| | "CLIPAttention", |
| | "CLIPSdpaAttention", |
| | "BertAttention", |
| | "MT5LayerSelfAttention", |
| | ], |
| | "text_encoder_target_name": [], |
| | }, |
| | "unet-only": { |
| | "enable_conv": True, |
| | "unet_target_module": [ |
| | "Transformer2DModel", |
| | "ResnetBlock2D", |
| | "Downsample2D", |
| | "Upsample2D", |
| | "HunYuanDiTBlock", |
| | "DoubleStreamBlock", |
| | "SingleStreamBlock", |
| | "SingleDiTBlock", |
| | "MMDoubleStreamBlock", |
| | "MMSingleStreamBlock", |
| | ], |
| | "unet_target_name": [ |
| | "conv_in", |
| | "conv_out", |
| | "time_embedding.linear_1", |
| | "time_embedding.linear_2", |
| | ], |
| | "text_encoder_target_module": [], |
| | "text_encoder_target_name": [], |
| | }, |
| | "unet-transformer-only": { |
| | "enable_conv": False, |
| | "unet_target_module": [ |
| | "Transformer2DModel", |
| | "HunYuanDiTBlock", |
| | "DoubleStreamBlock", |
| | "SingleStreamBlock", |
| | "SingleDiTBlock", |
| | "MMDoubleStreamBlock", |
| | "MMSingleStreamBlock", |
| | ], |
| | "unet_target_name": [], |
| | "text_encoder_target_module": [], |
| | "text_encoder_target_name": [], |
| | }, |
| | "unet-convblock-only": { |
| | "enable_conv": True, |
| | "unet_target_module": ["ResnetBlock2D", "Downsample2D", "Upsample2D"], |
| | "unet_target_name": [ |
| | "conv_in", |
| | "conv_out", |
| | ], |
| | "text_encoder_target_module": [], |
| | "text_encoder_target_name": [], |
| | }, |
| | "ia3": { |
| | "enable_conv": False, |
| | "unet_target_module": [], |
| | "unet_target_name": ["to_k", "to_v", "ff.net.2"], |
| | "text_encoder_target_module": [], |
| | "text_encoder_target_name": ["k_proj", "v_proj", "mlp.fc2"], |
| | "name_algo_map": { |
| | "mlp.fc2": {"train_on_input": True}, |
| | "ff.net.2": {"train_on_input": True}, |
| | }, |
| | }, |
| | } |
| |
|