MonsterMMORPG
/

Wan_GGUF

Model card Files Files and versions

Wan_GGUF / Viso_Master_Models /ref-ldm_embedding /configs /refldm.yaml

MonsterMMORPG's picture

Add files using upload-large-folder tool

e9003d9 verified 4 months ago

history blame contribute delete

3.2 kB

	model:
	base_learning_rate: 5.0e-05
	lr_schedule:
	type: linear_warmup
	warmup_steps: 10000
	target: ldm.models.diffusion.ddpm.LatentDiffusion
	params:
	ckpt_path: ./ckpts/ldm.ckpt
	ignore_keys:
	- model_ema
	monitor: val/ddim_latent_l1_loss_ema
	val_loss_run_ddim_steps: 200
	linear_start: 0.0015
	linear_end: 0.0155
	log_every_t: 100
	timesteps: 1000
	loss_type: l2
	image_size: 64
	channels: 8
	first_stage_key: gt_image
	first_stage_config:
	target: ldm.models.autoencoder.VQModelInterface
	params:
	ckpt_path: ./ckpts/vqgan.ckpt
	embed_dim: 8
	n_embed: 8192
	monitor: val/rec_loss
	ddconfig:
	double_z: false
	z_channels: 8
	resolution: 512
	in_channels: 3
	out_ch: 3
	ch: 128
	ch_mult:
	- 1
	- 1
	- 2
	- 4
	num_res_blocks: 2
	attn_resolutions: []
	dropout: 0.0
	lossconfig:
	target: torch.nn.Identity
	cond_stage_config:
	- cond_stage_key: lq_image
	conditioning_key: concat
	uncond_prob: 0.1
	cond_model_config: __is_first_stage__
	- cond_stage_key: ref_image
	conditioning_key: cache_kv
	uncond_prob: 0.1
	cond_model_config: __is_first_stage__
	use_cache_kv: true
	unet_config:
	target: ldm.modules.diffusionmodules.openaimodel.UNetModel
	params:
	use_checkpoint: false
	image_size: 64
	in_channels: 16
	out_channels: 8
	model_channels: 160
	attention_resolutions:
	- 2
	- 4
	- 8
	num_res_blocks: 2
	channel_mult:
	- 1
	- 2
	- 2
	- 4
	num_head_channels: 32
	use_spatial_transformer: false
	perceptual_loss_scale: 0.1
	perceptual_loss_weight_by_t: true
	perceptual_loss_config:
	target: ldm.modules.losses.identity_loss.IdentityLoss
	params:
	model_path: ./pretrained/insightface_webface_r50.onnx
	center_crop: true
	resize_hw:
	- 112
	- 112
	data:
	target: main.DataModuleFromConfig
	params:
	batch_size: 1
	num_workers: 8
	wrap: false
	train:
	target: ldm.data.ir.ImageRestorationDataset
	params:
	use_given_lq: false
	use_given_ref: true
	max_num_refs: 5
	ref_rand_aug: true
	shuffle_refs_prob: 1.0
	use_sample_weight: false
	file_list: ./data/ffhq/file_list/train_references.csv
	gt_dir: ./data/ffhq/images512x512
	ref_dir: ./data/ffhq/images512x512
	image_size:
	- 512
	- 512
	degrad_opt:
	blur_kernel_list:
	- iso
	- aniso
	blur_kernel_prob:
	- 0.5
	- 0.5
	blur_kernel_size: 41
	blur_sigma:
	- 0
	- 16
	downsample_range:
	- 1
	- 32
	noise_range:
	- 0
	- 20
	jpeg_range:
	- 30
	- 100
	lr_flip_aug: true