stmdit-anon commited on
Commit
67d7480
·
verified ·
1 Parent(s): 3d4d96b

Add adaln-flow-p01 (PixCell-Flow-GE-B (p=0.1))

Browse files
adaln-flow-p01/README.md ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - histopathology
5
+ - diffusion
6
+ - spatial-transcriptomics
7
+ - icml-2026-sd4h-workshop
8
+ ---
9
+
10
+ # PixCell-Flow-GE-B (p=0.1)
11
+
12
+ EMA-only inference weights for the **PixCell-Flow-GE-B (p=0.1)** row reported in the
13
+ ICML 2026 SD4H workshop submission *Transcriptomics-Conditioned Virtual Tissue
14
+ Synthesis via Diffusion Transformers*.
15
+
16
+ - **Source checkpoint**: `step_0578000_ema.pt`
17
+ - **Architecture**: see `training_config.yaml` in this folder.
18
+ - **License**: Apache-2.0.
19
+
20
+ See the umbrella repo README at `stmdit-anon/stmdit-checkpoints` for usage.
adaln-flow-p01/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fda405125d00daada4013197f5bfbacab0bd2ed09bb23278d92670a40f8207d7
3
+ size 531225181
adaln-flow-p01/training_config.yaml ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Training Configuration - PixCell-Flow-GE-B with CancerFoundation Encoder
2
+ # =========================================================================
3
+ # Base variant (130M params) with CancerFoundation GE encoder.
4
+ # Uses flow matching (EulerSampler) instead of DDPM.
5
+ #
6
+ # Usage:
7
+ # run-training configs/training.yaml
8
+
9
+ output_dir: "/cluster/work/grlab/projects/projects2025-virtual-tissue-gen/scratch/10x_TuPro/PixCell-Flow-GE/training/pixcell-flow-ge-B"
10
+ device: "cuda"
11
+
12
+ model:
13
+ type: "pixcell_flow_ge"
14
+ variant: "B" # 130M params: depth=12, hidden=768, heads=12
15
+ ge_encoder_type: "cancerfoundation"
16
+ ge_hidden_dim: 512
17
+ cf_model_dir: "/cluster/home/pvlachas/leomed-home/pretrained_model_weights/cancer-foundation"
18
+ cf_freeze_backbone: true
19
+ ge_condition_final_layer: false
20
+
21
+ data:
22
+ features_dir: "/cluster/work/grlab/projects/projects2025-virtual-tissue-gen/scratch/10x_TuPro/feat-extraction/features_train"
23
+ load_gene_expression: true
24
+ load_gene_expression_binned: true
25
+ num_workers: 8
26
+ pin_memory: true
27
+ val_split: 0.1
28
+
29
+ diffusion:
30
+ timesteps: 1000
31
+ # No beta_schedule: flow matching uses linear interpolation, not a noise schedule
32
+ image_size: 256
33
+ latent_size: 32
34
+
35
+ training:
36
+ batch_size: 32
37
+ batch_size_val: 32
38
+ gradient_accumulation_steps: 4 # effective batch = 128
39
+ num_epochs: 1000
40
+ seed: 42
41
+ gradient_clip: 0.01
42
+ ema_rate: 0.999
43
+
44
+ optimizer:
45
+ lr: 2e-5
46
+ weight_decay: 0.01
47
+ betas: [0.9, 0.999]
48
+
49
+ scheduler:
50
+ warmup_steps: 1000
51
+ min_lr_ratio: 0.1
52
+
53
+ classifier_free_guidance:
54
+ conditioning_schedule:
55
+ - mask: [uni, ge] # full conditioning (UNI + GE active)
56
+ weight: 81
57
+ - mask: [ge] # GE only (UNI dropped)
58
+ weight: 9
59
+ - mask: [uni] # UNI only (GE dropped)
60
+ weight: 9
61
+ - mask: [] # unconditional (both dropped)
62
+ weight: 1
63
+
64
+ convergence:
65
+ monitor_timestep_range: [400, 600]
66
+ patience: 10
67
+ min_epochs: 50
68
+
69
+ distributed:
70
+ precision: "32"
71
+
72
+ checkpoint:
73
+ save_every: 1000
74
+ resume: null
75
+
76
+ logging:
77
+ log_every: 100
78
+ validate_every: 0
79
+ gpu_monitor: true
80
+ gpu_monitor_interval: 60.0
81
+ sample_every_epochs: 10
82
+ sample_every_steps: 0
83
+ num_samples: 16
84
+ sample_guidance_scale: 3.0
85
+ sample_num_steps: 20
86
+ sample_vae_path: "/cluster/home/pvlachas/leomed-home/pretrained_model_weights/stability-ai-stable-diffusion-3-5-large/models--stabilityai--stable-diffusion-3.5-large/snapshots/ceddf0a7fdf2064ea28e2213e3b84e4afa170a0f/vae"