Pin torch<2.10 to avoid CUDA 13 driver mismatch on A100 flavor
Browse files
- stage_candidates.py +2 -1
stage_candidates.py
CHANGED
|
@@ -1,12 +1,13 @@
|
|
| 1 |
# /// script
|
| 2 |
# requires-python = ">=3.10"
|
| 3 |
# dependencies = [
|
| 4 |
-
# "torch>=2.5",
|
| 5 |
# "transformers>=4.46",
|
| 6 |
# "huggingface_hub>=0.26",
|
| 7 |
# "accelerate>=1.0",
|
| 8 |
# "sentencepiece",
|
| 9 |
# "protobuf",
|
|
|
|
| 10 |
# ]
|
| 11 |
# ///
|
| 12 |
"""Stage the 4 HSAQ candidate models on an L40S, extract architecture facts,
|
|
|
|
| 1 |
# /// script
|
| 2 |
# requires-python = ">=3.10"
|
| 3 |
# dependencies = [
|
| 4 |
+
# "torch>=2.5,<2.10", # 2.10+ requires CUDA 13 driver; A100 HF Jobs flavor ships CUDA 12.9
|
| 5 |
# "transformers>=4.46",
|
| 6 |
# "huggingface_hub>=0.26",
|
| 7 |
# "accelerate>=1.0",
|
| 8 |
# "sentencepiece",
|
| 9 |
# "protobuf",
|
| 10 |
+
# "bitsandbytes>=0.45,<0.50", # for the 4-bit fallback path if we need it
|
| 11 |
# ]
|
| 12 |
# ///
|
| 13 |
"""Stage the 4 HSAQ candidate models on an L40S, extract architecture facts,
|