# File size: 2,638 bytes (metadata line from the file-viewer export; not part of the config)
# Residue from the file-viewer export (the label "f9b9c88" and the 1-115
# line-number gutter) was fused onto the `data_wrapper:` line and has been
# stripped.
# NOTE(review): the export also discarded all indentation. The nesting below
# is rebuilt from the `_target_` entries: each one appears right after the
# child mappings of the object it configures and before that object's own
# scalar options. Confirm against the original config.
# `_target_` / `_recursive_` look like Hydra instantiate keys - TODO confirm.
data_wrapper:
  dataset:
    garment_tokenizer:
      # Per-quantity scale/shift statistics, one StatsConfig each.
      standardize:
        # Four components; scale 1 / shift 0 for every component.
        rotations:
          _target_: data.datasets.panel_configs.StatsConfig
          scale:
          - 1
          - 1
          - 1
          - 1
          shift:
          - 0
          - 0
          - 0
          - 0
        # Three components.
        translations:
          _target_: data.datasets.panel_configs.StatsConfig
          scale:
          - 26.06867645
          - 32.42920198
          - 22.29905009
          shift:
          - -0.0125378371
          - 113.507532
          - 2.63046369
        # Two components.
        vertices:
          _target_: data.datasets.panel_configs.StatsConfig
          scale:
          - 24.4920733
          - 26.60402835
          shift:
          - 8.44428116
          - 16.84081321
        _target_: data.datasets.panel_configs.StandardizeConfig
      _target_: data.garment_tokenizers.gcd_garment_tokenizer.GCDGarmentTokenizer
      random_tag: true
      num_tags: 108
    _target_: data.datasets.gcd_mm_dataset.GCDMM
    root_dir: datadir/GarmentCodeData_v2/GarmentCodeData_v2
    editing_dir: datadir/GarmentCodeData_v2/GCD-MM/editing_dir/garmentcodedata_editing
    caption_dir: datadir/GarmentCodeData_v2/GCD-MM/caption_dir/long-caption-processed
    editing_flip_prob: 0.5
    # Five equal weights; presumably one per sampled task/data mode - confirm.
    sampling_rate:
    - 0.2
    - 0.2
    - 0.2
    - 0.2
    - 0.2
    panel_classification: assets/data_configs/panel_classes_garmentcodedata.json
    load_by_dataname: assets/data_configs/garmentcodedata_list.txt
    # NOTE(review): the next three keys are placed under `dataset` because
    # they precede the DataWrapper `_target_`; verify they are not wrapper
    # options.
    image_size: 448
    max_num_patches: 12
    conv_template: internvl2_5
  _target_: data.data_wrappers.data_wrapper.DataWrapper
  _recursive_: false
  collate_fn: data.data_wrappers.collate_fns.collate_fn
  split_file: assets/data_configs/garmentcodedata_datasplit.json
# Options for the object named by `_target_` (trainers.trainer.Trainer).
# Indentation restored: in the flattened listing these keys sat at the same
# level as `trainer:`, leaving `trainer` itself empty.
trainer:
  _target_: trainers.trainer.Trainer
  lr: 1.0e-05
  # presumably optimizer beta coefficients - confirm against Trainer
  beta1: 0.9
  beta2: 0.95
  grad_accumulation_steps: 10
  batch_size: 4
  num_steps: 12750
  save_freq: 1000
# Experiment bookkeeping (W&B directories, project/run naming).
# NOTE(review): indentation was lost in the source listing. The two `wandb_*`
# keys are nested under `wandb_info`; the remaining keys are placed directly
# under `experiment` - confirm against the original config.
experiment:
  wandb_info:
    wandb_dir: wandb
    wandb_cache_dir: wandb_cache
  project_name: AIpparel
  run_name: train
  run_id: null
  local_dir: null
# Model options.
# NOTE(review): indentation was lost in the source listing. The keys that
# directly follow `model:` are nested under it here, and the mapping is closed
# after `bin_num`; keys that come later in the file may also belong to
# `model` - confirm against the original config.
model:
  edge_loss_weight: 0.1
  pos_embed: true
  num_freq: 0
  pos_embed_type: sinusoidal
  # Four values; presumably [min, min, max, max] for 2-D vertices - confirm.
  verts_bounds:
  - -4
  - -4
  - 4
  - 4
  # Fourteen values: seven negative entries followed by seven positive ones;
  # presumably lower then upper bounds for 3 translation + 4 rotation
  # components - confirm.
  transf_bounds:
  - -4
  - -4
  - -4
  - -1
  - -1
  - -1
  - -1
  - 4
  - 4
  - 4
  - 1
  - 1
  - 1
  - 1
  denormalize_for_loss: false
  num_regression_layers: 2
  discretize: true
  bin_num: 256
# NOTE(review): the source listing lost its indentation, so it cannot be
# determined from here whether the keys below are top-level run options or
# the tail of the preceding `model:` mapping - confirm against the original
# config before relying on their level.
my_pretrained_path: null
llm_pretrained_path: cache/InternVL3-2B-Instruct
resume_path: null
sampling_type: default
pretrained_config: null
precision: bf16
evaluate: false
# Same value as `conv_template` set earlier in this file; presumably the two
# must stay in sync - confirm.
conv_type: internvl2_5
from_start: false
storage_dir: output/
# (stray "|" table delimiter from the file-viewer export removed)