# Inference-only architecture config for IScene-v1.
# This file intentionally excludes training logs, data paths, cluster settings,
# experiment names, and checkpoint metadata.
# Model components, keyed by role. Each entry carries a `name` and an `args`
# mapping (presumably the class to build and its keyword arguments; confirm
# against the loader).
# NOTE(review): the nesting below was reconstructed from a flattened copy in
# which `name`, `args`, `use_fp16` and `exp_setting` collided as duplicate
# keys; verify the placement of `img_conditioner` and `dataset` against the
# consuming code.
models:
  denoiser:
    name: SparseStructureSceneContextFlowModel
    args:
      resolution: 16
      in_channels: 8
      out_channels: 8
      model_channels: 1024
      cond_channels: 1024
      num_blocks: 24
      num_heads: 16
      mlp_ratio: 4
      patch_size: 1
      pe_mode: ape
      qk_rms_norm: true
      use_fp16: true
      scene_context_attn_num: 5
      learning_pattern: full-finetune
      exp_setting: global

  img_conditioner:
    name: ImageConditioner
    args:
      image_cond_model: dinov2_vitl14_reg
      cond_in_channels: 3
      use_fp16: false

dataset:
  args:
    # Same value as models.denoiser.args.exp_setting above.
    exp_setting: global