Add adaln-ddpm-p02 (PixCell-GE-B-p02)

Browse files

Files changed (3) hide show

adaln-ddpm-p02/README.md +20 -0
adaln-ddpm-p02/model.pt +3 -0
adaln-ddpm-p02/training_config.yaml +114 -0

adaln-ddpm-p02/README.md ADDED Viewed

	@@ -0,0 +1,20 @@

+---
+license: apache-2.0
+tags:
+  - histopathology
+  - diffusion
+  - spatial-transcriptomics
+  - icml-2026-sd4h-workshop
+---
+# PixCell-GE-B-p02
+EMA-only inference weights for the **PixCell-GE-B-p02** row reported in the
+ICML 2026 SD4H workshop submission *Transcriptomics-Conditioned Virtual Tissue
+Synthesis via Diffusion Transformers*.
+- **Source checkpoint**: `step_0545000_ema.pt`
+- **Architecture**: see `training_config.yaml` in this folder.
+- **License**: Apache-2.0.
+See the umbrella repo README at `stmdit-anon/stmdit-checkpoints` for usage.

adaln-ddpm-p02/model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fb3997b8e6d1603ef5972101b32d32cda00ebfa946ed90e4a34d86c38405a4ed
+size 531422045

adaln-ddpm-p02/training_config.yaml ADDED Viewed

	@@ -0,0 +1,114 @@

+# Training Configuration - PixArtGE-B with CancerFoundation Encoder
+# ==================================================================
+# Base variant (130M params) with CancerFoundation gene expression encoder.
+#
+# Usage:
+#   run-training training_config.yaml --lightning
+# Top-level run settings.
+# NOTE(review): output_dir is an absolute, site-specific cluster path that
+# embeds lab/project names; it must be overridden to reuse this config
+# elsewhere, and may need redacting if the release is meant to be anonymous.
+output_dir: "/cluster/work/grlab/projects/projects2025-virtual-tissue-gen/scratch/10x_TuPro/PixCell-GE/training/pixart-ge-cf-B-dropout-p02"
+device: "cuda"
+# ============================================================================
+# MODEL
+# ============================================================================
+# Model selection: the "B" variant of `pixart_ge` with a gene-expression (GE)
+# encoder of type "cancerfoundation".
+model:
+  type: "pixart_ge"
+  variant: "B"  # 130M params: depth=12, hidden=768, heads=12
+  ge_encoder_type: "cancerfoundation"
+  ge_hidden_dim: 512
+  # The `cf_*` keys presumably configure the CancerFoundation encoder
+  # (weights directory, frozen backbone) — TODO confirm against the loader.
+  # NOTE(review): this path embeds a user home directory name, while the
+  # README points to what appears to be an anonymized account
+  # (`stmdit-anon`); consider redacting before publication.
+  cf_model_dir: "/cluster/home/pvlachas/leomed-home/pretrained_model_weights/cancer-foundation"
+  cf_freeze_backbone: true
+# ============================================================================
+# DATA
+# ============================================================================
+# Input data location and loader options.
+data:
+  # Dataset-centric path
+  # NOTE(review): absolute, site-specific cluster path; override when running
+  # outside the original environment.
+  features_dir: "/cluster/work/grlab/projects/projects2025-virtual-tissue-gen/scratch/10x_TuPro/feat-extraction/features_train"
+  load_gene_expression: true
+  load_gene_expression_binned: true
+  num_workers: 8
+  pin_memory: true
+  # NOTE(review): val_split is 0.1 while logging.validate_every is 0 —
+  # confirm whether a validation pass ever runs with this config.
+  val_split: 0.1
+# ============================================================================
+# DIFFUSION
+# ============================================================================
+# Diffusion process settings: 1000 timesteps with a "linear" beta schedule.
+diffusion:
+  timesteps: 1000
+  beta_schedule: "linear"
+  # latent_size is image_size / 8 (256 / 8 = 32); presumably this matches the
+  # spatial downsampling factor of the VAE in use — TODO confirm.
+  image_size: 256
+  latent_size: 32
+# ============================================================================
+# TRAINING
+# ============================================================================
+# Optimisation, LR schedule and conditioning-dropout settings.
+training:
+  batch_size: 32
+  batch_size_val: 32
+  gradient_accumulation_steps: 4  # effective batch = 128 (matches original PixCell)
+  num_epochs: 1000
+  seed: 42
+  gradient_clip: 0.01
+  ema_rate: 0.9999
+  optimizer:
+    # Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
+    # resolve a bare `2e-5` as the string "2e-5" instead of a float.
+    lr: 2.0e-5  # matches original PixCell (was 1e-4)
+    weight_decay: 0.01
+    betas: [0.9, 0.999]
+  scheduler:
+    warmup_steps: 1000
+    min_lr_ratio: 0.1
+  classifier_free_guidance:
+    # The four weights sum to 100 (64 + 16 + 16 + 4); presumably they are
+    # relative sampling weights for each conditioning mask — TODO confirm.
+    # Under that reading each modality is dropped in 20 of 100 samples
+    # (16 + 4), consistent with the "p02" suffix in the run name.
+    conditioning_schedule:
+      - mask: [uni, ge]   # full conditioning (UNI + GE active)
+        weight: 64
+      - mask: [ge]        # GE only (UNI dropped)
+        weight: 16
+      - mask: [uni]       # UNI only (GE dropped)
+        weight: 16
+      - mask: []          # unconditional (both dropped)
+        weight: 4
+  modality_monitor:
+    enabled: true
+    diagnostic_freq: 10
+    diagnostic_batch_size: 64
+# ============================================================================
+# DISTRIBUTED
+# ============================================================================
+# Numeric precision for the run.
+distributed:
+  # Quoted so the value is loaded as the string "32", not the integer 32.
+  precision: "32"
+# ============================================================================
+# CHECKPOINT
+# ============================================================================
+# Checkpoint cadence and resume source.
+checkpoint:
+  # Unit of `save_every` (steps vs. epochs) is not stated here — TODO confirm.
+  save_every: 1000
+  # Explicit null: no resume path is set in this config.
+  resume: null
+# ============================================================================
+# LOGGING
+# ============================================================================
+# Logging, GPU monitoring and periodic sample generation.
+logging:
+  log_every: 100
+  # NOTE(review): 0 presumably disables periodic validation — confirm.
+  validate_every: 0
+  gpu_monitor: true
+  gpu_monitor_interval: 60.0
+  # Periodic image sampling: configured here with an epoch-based trigger
+  # (every 10 epochs) and a `sample_vae_path`; the step-based trigger is 0
+  # (presumably off). Sampling needs `sample_vae_path` plus a non-zero
+  # epochs/steps interval.
+  sample_every_epochs: 10
+  sample_every_steps: 0
+  num_samples: 16
+  sample_guidance_scale: 3.0
+  sample_num_steps: 20
+  # NOTE(review): absolute path under a user home directory; override when
+  # running elsewhere and consider redacting for an anonymized release.
+  sample_vae_path: "/cluster/home/pvlachas/leomed-home/pretrained_model_weights/stability-ai-stable-diffusion-3-5-large/models--stabilityai--stable-diffusion-3.5-large/snapshots/ceddf0a7fdf2064ea28e2213e3b84e4afa170a0f/vae"