hieu3636
/

cxr-vlm-code

Model card Files Files and versions

cxr-vlm-code / docker /requirements_docker.txt

convitom

f

c9b4129 12 days ago

history blame contribute delete

2.34 kB

	# Versions match Colab GPU runtime (verified 2026-05). torch + torchvision
	# are NOT listed here — they come from the pytorch/pytorch base image with
	# the right CUDA build baked in.
	#
	# Pins are loose (>=) on purpose: pip resolves the latest mutually-compatible
	# set. If you want to lock exact versions for reproducibility, generate a
	# constraints file from a working build with:
	# pip freeze > requirements_lock.txt

	# ── Core HF stack ─────────────────────────────────────────────────────────────
	transformers>=4.46,<4.50
	peft>=0.13,<0.15
	accelerate>=1.0
	bitsandbytes>=0.45
	huggingface_hub>=0.27,<1.0 # transformers 4.49 declares hf_hub<1.0 — must match
	httpx>=0.27 # utils/_httpx_compat.py handles 0.28+ kwarg change

	# ── Vision encoder ────────────────────────────────────────────────────────────
	# rad_dino loads via transformers AutoModel — no extra dep needed.
	# hi-ml-multimodal (BioViL-T) intentionally omitted; model/rad_dino.py wraps
	# its import in try/except and falls back to timm/transformers cleanly.
	timm>=1.0
	Pillow>=10.0

	# ── Config / data ─────────────────────────────────────────────────────────────
	omegaconf==2.3.0
	sentencepiece>=0.2
	protobuf>=5.0
	numpy>=1.26,<3 # cap at 2.x for now; some libs still don't support numpy 2
	pandas>=2.2

	# ── Eval metrics ──────────────────────────────────────────────────────────────
	nltk>=3.9
	rouge-score>=0.1.2
	bert-score>=0.3.12
	scikit-learn>=1.5

	# ── Training / experiment tracking ────────────────────────────────────────────
	wandb>=0.18
	tqdm>=4.66

	# ── Optional: LLM-as-judge for VQA ────────────────────────────────────────────
	openai>=1.40