Add adaln-flow-p01 (PixCell-Flow-GE-B (p=0.1))

Browse files

Files changed (3) hide show

adaln-flow-p01/README.md +20 -0
adaln-flow-p01/model.pt +3 -0
adaln-flow-p01/training_config.yaml +86 -0

adaln-flow-p01/README.md ADDED Viewed

	@@ -0,0 +1,20 @@

+---
+license: apache-2.0
+tags:
+  - histopathology
+  - diffusion
+  - spatial-transcriptomics
+  - icml-2026-sd4h-workshop
+---
+# PixCell-Flow-GE-B (p=0.1)
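+EMA-only inference weights for the **PixCell-Flow-GE-B (p=0.1)** row reported in the
+ICML 2026 SD4H workshop submission *Transcriptomics-Conditioned Virtual Tissue
+Synthesis via Diffusion Transformers*. The conditioning schedule in
+`training_config.yaml` (weights 81/9/9/1) is what results from dropping each of the
+two conditioning inputs (UNI, GE) independently with probability 0.1.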
+- **Source checkpoint**: `step_0578000_ema.pt`
+- **Architecture**: see `training_config.yaml` in this folder.
+- **License**: Apache-2.0.
+
+See the umbrella repo README at `stmdit-anon/stmdit-checkpoints` for usage.

adaln-flow-p01/model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fda405125d00daada4013197f5bfbacab0bd2ed09bb23278d92670a40f8207d7
+size 531225181

adaln-flow-p01/training_config.yaml ADDED Viewed

	@@ -0,0 +1,86 @@

+# Training Configuration - PixCell-Flow-GE-B with CancerFoundation Encoder
+# =========================================================================
+# Base variant (130M params) with CancerFoundation GE encoder.
+# Uses flow matching (EulerSampler) instead of DDPM.
+#
+# Usage:
+#   run-training configs/training.yaml
+output_dir: "/cluster/work/grlab/projects/projects2025-virtual-tissue-gen/scratch/10x_TuPro/PixCell-Flow-GE/training/pixcell-flow-ge-B"  # absolute, site-specific cluster path; change before reuse elsewhere
+device: "cuda"
+model:
+  type: "pixcell_flow_ge"
+  variant: "B"  # 130M params: depth=12, hidden=768, heads=12
+  ge_encoder_type: "cancerfoundation"
+  ge_hidden_dim: 512
+  cf_model_dir: "/cluster/home/pvlachas/leomed-home/pretrained_model_weights/cancer-foundation"  # absolute, site-specific path; presumably the CancerFoundation weights directory - confirm
+  cf_freeze_backbone: true  # NOTE(review): presumably keeps the CancerFoundation backbone fixed during training - confirm
+  ge_condition_final_layer: false
+data:
+  features_dir: "/cluster/work/grlab/projects/projects2025-virtual-tissue-gen/scratch/10x_TuPro/feat-extraction/features_train"  # absolute, site-specific cluster path
+  load_gene_expression: true
+  load_gene_expression_binned: true
+  num_workers: 8
+  pin_memory: true
+  val_split: 0.1  # NOTE(review): presumably the fraction of the data held out for validation - confirm
+diffusion:
+  timesteps: 1000
+  # No beta_schedule: flow matching uses linear interpolation, not a noise schedule
+  image_size: 256
+  latent_size: 32  # 256 / 32 = 8x reduction relative to image_size, assuming both are side lengths - TODO confirm
+training:
+  batch_size: 32
+  batch_size_val: 32
+  gradient_accumulation_steps: 4  # effective batch = batch_size (32) x 4 accumulation steps = 128
+  num_epochs: 1000
+  seed: 42
+  gradient_clip: 0.01  # NOTE(review): very small if this is a gradient-norm threshold - confirm it is intentional
+  ema_rate: 0.999
+  optimizer:
+    lr: 2e-5
+    weight_decay: 0.01
+    betas: [0.9, 0.999]
+  scheduler:
+    warmup_steps: 1000
+    min_lr_ratio: 0.1
+  classifier_free_guidance:
+    conditioning_schedule:  # weights sum to 100; 81/9/9/1 equals dropping each input independently with p = 0.1 (0.9*0.9, 0.9*0.1, 0.1*0.9, 0.1*0.1)
+      - mask: [uni, ge]   # full conditioning (UNI + GE active)
+        weight: 81
+      - mask: [ge]        # GE only (UNI dropped)
+        weight: 9
+      - mask: [uni]       # UNI only (GE dropped)
+        weight: 9
+      - mask: []          # unconditional (both dropped)
+        weight: 1
+  convergence:
+    monitor_timestep_range: [400, 600]  # NOTE(review): presumably a window within diffusion.timesteps (1000) used for convergence monitoring - confirm
+    patience: 10
+    min_epochs: 50
+distributed:
+  precision: "32"  # quoted, so this is the string "32", not an integer
+checkpoint:
+  save_every: 1000
+  resume: null  # explicit null: no checkpoint to resume from is specified
+logging:
+  log_every: 100
+  validate_every: 0  # NOTE(review): 0 presumably disables this validation cadence - confirm
+  gpu_monitor: true
+  gpu_monitor_interval: 60.0
+  sample_every_epochs: 10
+  sample_every_steps: 0  # NOTE(review): 0 presumably disables step-based sampling, leaving sample_every_epochs (10) in effect - confirm
+  num_samples: 16
+  sample_guidance_scale: 3.0
+  sample_num_steps: 20
+  sample_vae_path: "/cluster/home/pvlachas/leomed-home/pretrained_model_weights/stability-ai-stable-diffusion-3-5-large/models--stabilityai--stable-diffusion-3.5-large/snapshots/ceddf0a7fdf2064ea28e2213e3b84e4afa170a0f/vae"  # absolute, site-specific path; points at the vae folder of a stable-diffusion-3.5-large snapshot