KangLiao commited on
Commit
444cc69
·
1 Parent(s): 4b5dec2
configs/models/qwen2_5_1_5b_radio_sd3_dynamic_puffin.py CHANGED
@@ -2,7 +2,6 @@ import torch
2
  from src.models.puffin.model import Qwen2p5RadioStableDiffusion3HFDynamic
3
  from src.models.stable_diffusion3.transformer_sd3_dynamic import SD3Transformer2DModel
4
  from src.models.radiov3.hf_model import RADIOModel
5
- from transformers import AutoConfig
6
  from diffusers import AutoencoderKL, FlowMatchEulerDiscreteScheduler
7
  from transformers import AutoModelForCausalLM, AutoTokenizer
8
 
@@ -41,45 +40,51 @@ model = dict(type=Qwen2p5RadioStableDiffusion3HFDynamic,
41
  ),
42
  transformer=dict(
43
  type=SD3Transformer2DModel.from_pretrained,
44
- #pretrained_model_name_or_path=sd3_model_name_or_path,
45
- #subfolder="transformer",
46
- #torch_dtype=torch.bfloat16
 
47
  ),
48
  test_scheduler=dict(
49
  type=FlowMatchEulerDiscreteScheduler.from_pretrained,
50
- #pretrained_model_name_or_path=sd3_model_name_or_path,
51
- #subfolder="scheduler"
 
52
  ),
53
  train_scheduler=dict(
54
  type=FlowMatchEulerDiscreteScheduler.from_pretrained,
55
- #pretrained_model_name_or_path=sd3_model_name_or_path,
56
- #subfolder="scheduler"
 
57
  ),
58
  vae=dict(
59
  type=AutoencoderKL.from_pretrained,
60
- #pretrained_model_name_or_path=sd3_model_name_or_path,
61
- #subfolder="vae",
62
- #torch_dtype=torch.bfloat16
 
63
  ),
64
  freeze_visual_encoder=True,
65
  freeze_llm=True,
66
  llm=dict(
67
  type=AutoModelForCausalLM.from_pretrained,
68
- #pretrained_model_name_or_path=llm_name_or_path,
69
- #torch_dtype=torch.bfloat16,
 
70
  #attn_implementation='flash_attention_2',
71
  ),
72
  tokenizer=dict(
73
  type=AutoTokenizer.from_pretrained,
74
- #pretrained_model_name_or_path=llm_name_or_path
 
75
  ),
76
  prompt_template=prompt_template,
77
  pretrained_pth=None,
78
  use_activation_checkpointing=False,
79
  visual_encoder=dict(
80
  type=RADIOModel.from_pretrained,
81
- config=AutoConfig.from_pretrained("nvidia/C-RADIOv3-H"),
82
- #pretrained_model_name_or_path="nvidia/C-RADIOv3-H",
83
- #torch_dtype=torch.bfloat16,
84
  ),
85
  )
 
2
  from src.models.puffin.model import Qwen2p5RadioStableDiffusion3HFDynamic
3
  from src.models.stable_diffusion3.transformer_sd3_dynamic import SD3Transformer2DModel
4
  from src.models.radiov3.hf_model import RADIOModel
 
5
  from diffusers import AutoencoderKL, FlowMatchEulerDiscreteScheduler
6
  from transformers import AutoModelForCausalLM, AutoTokenizer
7
 
 
40
  ),
41
  transformer=dict(
42
  type=SD3Transformer2DModel.from_pretrained,
43
+ pretrained_model_name_or_path=sd3_model_name_or_path,
44
+ subfolder="transformer",
45
+ torch_dtype=torch.bfloat16,
46
+ local_files_only=True,
47
  ),
48
  test_scheduler=dict(
49
  type=FlowMatchEulerDiscreteScheduler.from_pretrained,
50
+ pretrained_model_name_or_path=sd3_model_name_or_path,
51
+ subfolder="scheduler",
52
+ local_files_only=True,
53
  ),
54
  train_scheduler=dict(
55
  type=FlowMatchEulerDiscreteScheduler.from_pretrained,
56
+ pretrained_model_name_or_path=sd3_model_name_or_path,
57
+ subfolder="scheduler",
58
+ local_files_only=True,
59
  ),
60
  vae=dict(
61
  type=AutoencoderKL.from_pretrained,
62
+ pretrained_model_name_or_path=sd3_model_name_or_path,
63
+ subfolder="vae",
64
+ torch_dtype=torch.bfloat16,
65
+ local_files_only=True,
66
  ),
67
  freeze_visual_encoder=True,
68
  freeze_llm=True,
69
  llm=dict(
70
  type=AutoModelForCausalLM.from_pretrained,
71
+ pretrained_model_name_or_path=llm_name_or_path,
72
+ torch_dtype=torch.bfloat16,
73
+ local_files_only=True,
74
  #attn_implementation='flash_attention_2',
75
  ),
76
  tokenizer=dict(
77
  type=AutoTokenizer.from_pretrained,
78
+ pretrained_model_name_or_path=llm_name_or_path,
79
+ local_files_only=True,
80
  ),
81
  prompt_template=prompt_template,
82
  pretrained_pth=None,
83
  use_activation_checkpointing=False,
84
  visual_encoder=dict(
85
  type=RADIOModel.from_pretrained,
86
+ pretrained_model_name_or_path="nvidia/C-RADIOv3-H",
87
+ torch_dtype=torch.bfloat16,
88
+ local_files_only=True,
89
  ),
90
  )