waltgrace commited on
Commit
cc72530
·
verified ·
1 Parent(s): ef0fc31

sync: data_label_factory/runpod/requirements-pod.txt

Browse files
data_label_factory/runpod/requirements-pod.txt CHANGED
@@ -5,15 +5,23 @@
5
  # on MLX instead of CUDA / torch.
6
 
7
  # --- Falcon Perception (the bbox grounder) ---
8
- # Soft-pinned to torch>=2.11 by the package, but actually works with the
9
- # torch 2.7.1+cu128 baked into the runpod/pytorch base image. If pip
10
- # refuses, install with --no-deps and hope.
11
- falcon-perception>=0.1.0
 
 
 
 
 
 
12
 
13
  # --- Vision-language models ---
14
- # Qwen 2.5-VL via transformers
15
- transformers>=4.49.0
16
- qwen-vl-utils[decord]>=0.0.10
 
 
17
  accelerate>=0.34
18
  safetensors>=0.4
19
 
 
5
  # on MLX instead of CUDA / torch.
6
 
7
  # --- Falcon Perception (the bbox grounder) ---
8
+ # NOTE: falcon-perception is installed in the Dockerfile with --no-deps
9
+ # because its torch>=2.11 pin would force a 2-3 GB upgrade of the base
10
+ # image's torch 2.7.1+cu128, which actually works fine. Falcon's runtime
11
+ # deps (transformers, accelerate, einops, opencv, scipy, pycocotools) are
12
+ # listed below explicitly so the no-deps install still gets them.
13
+ einops>=0.8.0
14
+ opencv-python>=4.10.0
15
+ scipy>=1.13.0
16
+ pycocotools>=2.0.7
17
+ tyro>=0.8.0
18
 
19
  # --- Vision-language models ---
20
+ # Qwen 2.5-VL via transformers. We deliberately do NOT pull the [decord] extra:
21
+ # decord is a video-frame helper that only ships Linux x86_64 wheels and we use
22
+ # yt-dlp for video work anyway.
23
+ transformers>=4.49.0,<5
24
+ qwen-vl-utils>=0.0.10
25
  accelerate>=0.34
26
  safetensors>=0.4
27