stmdit-anon committed on
Commit
dbc957a
·
verified ·
1 Parent(s): 758aec5

Add ptpl-xattn-perceiver-p06 (PTPL-XAttn-Perceiver-B-p06)

Browse files
ptpl-xattn-perceiver-p06/README.md ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - histopathology
5
+ - diffusion
6
+ - spatial-transcriptomics
7
+ - icml-2026-sd4h-workshop
8
+ ---
9
+
10
+ # PTPL-XAttn-Perceiver-B-p06
11
+
12
+ EMA-only inference weights for the **PTPL-XAttn-Perceiver-B-p06** row reported in the
13
+ ICML 2026 SD4H workshop submission *Transcriptomics-Conditioned Virtual Tissue
14
+ Synthesis via Diffusion Transformers*.
15
+
16
+ - **Source checkpoint**: `step_2358000_ema.pt`
17
+ - **Architecture**: see `training_config.yaml` in this folder.
18
+ - **License**: Apache-2.0.
19
+
20
+ See the umbrella repo README at `stmdit-anon/stmdit-checkpoints` for usage.
ptpl-xattn-perceiver-p06/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dda4906dc48466d85bf4483f59cac7196ee2694259fbfa77e2795906252ec42
3
+ size 715792736
ptpl-xattn-perceiver-p06/training_config.yaml ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Training Configuration - PTPL-XAttn-Perceiver-B p=0.6
2
+ # =====================================================
3
+ # Multi-layer Perceiver Resampler: 32 latent tokens, depth=4.
4
+ # Conditioning dropout p=0.6 (classifier_free_guidance.conditioning_schedule weights 16/24/24/36).
5
+ # Trained on PTPL features (corrected normalization).
6
+ #
7
+ # Usage:
8
+ # run-training configs/training.yaml --lightning
9
+
10
+ output_dir: "/cluster/work/grlab/projects/projects2025-virtual-tissue-gen/scratch/10x_TuPro/PixCell-PTPL-XAttn/training/ptpl-xattn-perceiver-B-p06"
11
+ device: "cuda"
12
+
13
+ model:
14
+ type: "pixart_ge_xattn"
15
+ variant: "B"
16
+ ge_encoder_type: "cancerfoundation"
17
+ ge_hidden_dim: 512
18
+ cf_model_dir: "/cluster/home/pvlachas/leomed-home/pretrained_model_weights/cancer-foundation"
19
+ cf_freeze_backbone: true
20
+ ge_token_source: "perceiver"
21
+ ge_num_tokens: 32
22
+ ge_perceiver_depth: 4
23
+ ge_xattn_fusion: "xattn_only"
24
+
25
+ data:
26
+ features_dir: "/cluster/work/grlab/projects/projects2025-virtual-tissue-gen/scratch/10x_TuPro-PTPL/feat-extraction/features_train"
27
+ load_gene_expression: true
28
+ load_gene_expression_binned: true
29
+ num_workers: 8
30
+ pin_memory: true
31
+ val_split: 0.1
32
+
33
+ diffusion:
34
+ timesteps: 1000
35
+ beta_schedule: "linear"
36
+ image_size: 256
37
+ latent_size: 32
38
+
39
+ training:
40
+ batch_size: 32
41
+ batch_size_val: 32
42
+ gradient_accumulation_steps: 4
43
+ num_epochs: 1000
44
+ seed: 42
45
+ gradient_clip: 0.01
46
+ ema_rate: 0.9999
47
+
48
+ optimizer:
49
+ lr: 2e-5
50
+ weight_decay: 0.01
51
+ betas: [0.9, 0.999]
52
+
53
+ scheduler:
54
+ warmup_steps: 1000
55
+ min_lr_ratio: 0.1
56
+
57
+ classifier_free_guidance:
58
+ conditioning_schedule:
59
+ - mask: [uni, ge]
60
+ weight: 16
61
+ - mask: [ge]
62
+ weight: 24
63
+ - mask: [uni]
64
+ weight: 24
65
+ - mask: []
66
+ weight: 36
67
+
68
+ convergence:
69
+ monitor_timestep_range: [900, 1000]
70
+ patience: 10
71
+ min_epochs: 50
72
+
73
+ distributed:
74
+ precision: "bf16-mixed"
75
+ compile_model: true
76
+
77
+ checkpoint:
78
+ save_every: 1000
79
+ resume: null
80
+
81
+ logging:
82
+ log_every: 100
83
+ validate_every: 0
84
+ gpu_monitor: true
85
+ gpu_monitor_interval: 60.0
86
+ sample_every_epochs: 10
87
+ sample_every_steps: 0
88
+ num_samples: 16
89
+ sample_guidance_scale: 3.0
90
+ sample_num_steps: 20
91
+ sample_vae_path: "/cluster/home/pvlachas/leomed-home/pretrained_model_weights/stability-ai-stable-diffusion-3-5-large/models--stabilityai--stable-diffusion-3.5-large/snapshots/ceddf0a7fdf2064ea28e2213e3b84e4afa170a0f/vae"