| job: extension | |
| config: | |
| name: latex_v1 | |
| process: | |
| - type: diffusion_trainer | |
| training_folder: /data/app/output | |
| sqlite_db_path: /data/app/aitk_db.db | |
| device: cuda | |
| trigger_word: latex | |
| performance_log_every: 10 | |
| network: | |
| type: lora | |
| linear: 32 | |
| linear_alpha: 32 | |
| conv: 16 | |
| conv_alpha: 16 | |
| lokr_full_rank: true | |
| lokr_factor: -1 | |
| network_kwargs: | |
| ignore_if_contains: [] | |
| save: | |
| dtype: bf16 | |
| save_every: 250 | |
| max_step_saves_to_keep: 4 | |
| save_format: diffusers | |
| push_to_hub: false | |
| datasets: | |
| - folder_path: /data/app/datasets/latex_01 | |
| mask_path: null | |
| mask_min_value: 0.1 | |
| default_caption: '' | |
| caption_ext: txt | |
| caption_dropout_rate: 0.05 | |
| cache_latents_to_disk: false | |
| is_reg: false | |
| network_weight: 1 | |
| resolution: | |
| - 512 | |
| - 768 | |
| - 1024 | |
| controls: [] | |
| shrink_video_to_frames: true | |
| num_frames: 1 | |
| do_i2v: true | |
| flip_x: false | |
| flip_y: false | |
| train: | |
| batch_size: 1 | |
| bypass_guidance_embedding: false | |
| steps: 3000 | |
| gradient_accumulation: 1 | |
| train_unet: true | |
| train_text_encoder: false | |
| gradient_checkpointing: true | |
| noise_scheduler: flowmatch | |
| optimizer: adamw8bit | |
| timestep_type: weighted | |
| content_or_style: balanced | |
| optimizer_params: | |
| weight_decay: 0.0001 | |
| unload_text_encoder: false | |
| cache_text_embeddings: false | |
| lr: 0.0001 | |
| ema_config: | |
| use_ema: false | |
| ema_decay: 0.99 | |
| skip_first_sample: false | |
| force_first_sample: false | |
| disable_sampling: false | |
| dtype: bf16 | |
| diff_output_preservation: false | |
| diff_output_preservation_multiplier: 1 | |
| diff_output_preservation_class: person | |
| switch_boundary_every: 1 | |
| loss_type: mse | |
| do_differential_guidance: true | |
| differential_guidance_scale: 3 | |
| model: | |
| name_or_path: Tongyi-MAI/Z-Image-Turbo | |
| quantize: true | |
| qtype: qfloat8 | |
| quantize_te: true | |
| qtype_te: qfloat8 | |
| arch: zimage:turbo | |
| low_vram: false | |
| model_kwargs: {} | |
| layer_offloading: false | |
| layer_offloading_text_encoder_percent: 1 | |
| layer_offloading_transformer_percent: 1 | |
| assistant_lora_path: ostris/zimage_turbo_training_adapter/zimage_turbo_training_adapter_v2.safetensors | |
| sample: | |
| sampler: flowmatch | |
| sample_every: 300 | |
| width: 512 | |
| height: 512 | |
| samples: | |
| - prompt: A high-detail editorial portrait of a woman wearing a sleek, shining | |
| black latex bodysuit. High neck, long sleeves. The surface shows intense | |
| specular highlights and realistic micro-creases at the joints. Soft studio | |
| lighting, 8k resolution, minimalist grey background. | |
| - prompt: A fashion model walking in a neon-lit city street, wearing a form-fitting | |
| red latex crop top paired with baggy denim jeans. The glossy texture of | |
| the latex contrasts with the rough fabric of the denim. Cinematic lighting, | |
| rain-slicked pavement, vibrant reflections. | |
| - prompt: Full body shot of a woman in a midnight blue latex catsuit performing | |
| a dynamic pose. The suit has a mirror-like finish, reflecting the surrounding | |
| environment. Sharp focus on the stretching material around the knees and | |
| elbows. Professional photography, clean composition. | |
| - prompt: Extreme close-up macro shot of polished purple latex fabric. Focus | |
| on the smooth, non-porous surface and the way light curves around the edges. | |
| Subtle highlights and deep shadows, showing the thickness and elasticity | |
| of the material. | |
| - prompt: A high-fashion avant-garde look featuring a structured emerald green | |
| latex dress with exaggerated shoulder pads. The material is highly reflective | |
| and stiff, shimmering under bright runway lights. Fashion photography, blurred | |
| audience in the background. | |
| - prompt: A sci-fi heroine standing in a futuristic laboratory, wearing a white | |
| latex tactical suit with silver accents. The pearlescent latex surface catches | |
| the blue and orange glow of holographic displays. Hyper-realistic, volumetric | |
| lighting, intricate details. | |
| - prompt: A professional fashion shot of a model in a high-gloss black latex | |
| outfit, standing next to a sleek, minimalist wall. On the wall is a high-quality | |
| acrylic sign that reads "Valenti Dynasty" in elegant typography. The reflective | |
| surface of the latex catches the glow from the sign. Sharp focus, cinematic | |
| studio lighting, premium aesthetic. | |
| neg: '' | |
| seed: 42 | |
| walk_seed: true | |
| guidance_scale: 1 | |
| sample_steps: 8 | |
| num_frames: 1 | |
| fps: 1 | |
| meta: | |
| name: latex_v1 | |
| version: '1.0' | |