Kimhi
/

RDM_DINO3_pooled_features

Model card Files Files and versions

RDM_DINO3_pooled_features / config.yaml

Kimhi's picture

Upload folder using huggingface_hub

0948ac1 verified about 2 months ago

history blame contribute delete

1.57 kB

	model:
	target: rdm.models.diffusion.ddpm.RDM
	params:
	linear_start: 0.0015
	linear_end: 0.0195
	num_timesteps_cond: 1
	log_every_t: 200
	timesteps: 1000
	first_stage_key: image
	cond_stage_key: class_label
	class_cond: true
	image_size: 1
	channels: 768
	cond_stage_trainable: true
	conditioning_key: crossattn
	parameterization: x0
	use_mean_pooling: true
	unet_config:
	target: rdm.modules.diffusionmodules.latentmlp.SimpleMLP
	params:
	in_channels: 768
	time_embed_dim: 256
	model_channels: 1536
	bottleneck_channels: 1536
	out_channels: 768
	num_res_blocks: 12
	use_context: true
	context_channels: 512
	pretrained_enc_config:
	params:
	pretrained_enc_arch: dinov3_vitb16
	# Set to the absolute path of the downloaded DINOv3 ViT-B/16 checkpoint
	# (e.g., dinov3_vitb16_pretrain_lvd1689m-73cec8be.pth). If left null,
	# torch.hub will attempt to download using the dinov3 repo helpers.
	pretrained_enc_path: /proj/mmfm/kimhi/EnrichCondImageGenerationUsingRCG/TrainRDM/dinov3_vit_b_16_checkpoint.pth
	proj_dim: 768
	pretrained_enc_withproj: false
	dinov3_check_hash: false
	# set to false to allow loading checkpoints that don't exactly match the repo architecture
	dinov3_load_strict: false
	cond_stage_config:
	target: rdm.modules.encoders.modules.ClassEmbedder
	params:
	embed_dim: 512
	n_classes: 1000
	key: class_label

	# Made with Bob