rae-dit-s-ep14-diffusers / conversion_metadata.json

Fix RAEDiT Stage-2 positional embedding export

c4c58dd verified 8 days ago

1.82 kB

	{
	"source": {
	"weights_repo_or_path": "nyu-visionx/RAE-collections",
	"config_repo_or_path": "/home/ubuntu/rae-upstream-configs",
	"config_path": "configs/stage2/training/ImageNet256/DiTDH-S_DINOv2-B.yaml",
	"vae_model_name_or_path": "nyu-visionx/RAE-dinov2-wReg-base-ViTXL-n08"
	},
	"scheduler": {
	"num_train_timesteps": 1000,
	"shift": 6.928203230275509,
	"path_type": "Linear",
	"prediction": "velocity",
	"time_dist_type": "logit-normal_0_1"
	},
	"sampler": {
	"mode": "ODE",
	"params": {
	"sampling_method": "euler",
	"num_steps": 50,
	"atol": 1e-06,
	"rtol": 0.001,
	"reverse": false
	}
	},
	"guidance": {
	"method": "cfg",
	"scale": 1.0,
	"t_min": 0.0,
	"t_max": 1.0
	},
	"misc": {
	"latent_size": [
	768,
	16,
	16
	],
	"num_classes": 1000,
	"time_dist_shift_dim": 196608,
	"time_dist_shift_base": 4096
	},
	"transformer": {
	"checkpoint_path": "/home/ubuntu/.cache/huggingface/hub/models--nyu-visionx--RAE-collections/snapshots/1be4f03273523431f099a934da4cf1940dc6039f/DiTs/Dinov2/wReg_base/ImageNet256/DiTDH-S_ep14/stage2_model.pt",
	"checkpoint_key": null,
	"prefer_ema": true,
	"config": {
	"sample_size": 16,
	"patch_size": 1,
	"in_channels": 768,
	"hidden_size": [
	384,
	2048
	],
	"depth": [
	12,
	2
	],
	"num_heads": [
	6,
	16
	],
	"mlp_ratio": 4.0,
	"class_dropout_prob": 0.1,
	"num_classes": 1000,
	"use_qknorm": false,
	"use_swiglu": true,
	"use_rope": true,
	"use_rmsnorm": true,
	"wo_shift": false,
	"use_pos_embed": true
	},
	"num_parameters": 196554068
	},
	"pipeline": {
	"saved": true,
	"id2label_json_path": null
	}
	}