LeTue09 committed on
Commit
bccd5ed
·
verified ·
1 Parent(s): 64eea5b

Upload offline vLLM wheel archive

Browse files
.gitattributes CHANGED
@@ -1,35 +1 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
- *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
- *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
- *.tflite filter=lfs diff=lfs merge=lfs -text
30
- *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
- *.xz filter=lfs diff=lfs merge=lfs -text
33
- *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
- *tfevents* filter=lfs diff=lfs merge=lfs -text
 
1
+ *.tar.gz filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
README.md ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # vLLM Nightly Wheel for Qwen3.5
2
+
3
+ This archive contains a Linux x86_64 vLLM nightly wheel that supports the
4
+ `Qwen3_5ForConditionalGeneration` architecture used by `Qwen/Qwen3.5-4B`.
5
+
6
+ ## Install on the cluster
7
+
8
+ ```bash
9
+ tar -xzf vllm-wheel-linux-x86_64.tar.gz
10
+ python -m pip install --no-index --no-deps --force-reinstall \
11
+ ./vllm-0.23.1rc1.dev102+ga46abb7ae-cp38-abi3-manylinux_2_28_x86_64.whl
12
+ python -c "import vllm; print(vllm.__version__)"
13
+ ```
14
+
15
+ ## Serve Qwen3.5
16
+
17
+ ```bash
18
+ CUDA_VISIBLE_DEVICES=1,2 vllm serve /cm/archive/tue09/model_hub/Qwen/Qwen3.5-4B \
19
+ --port 8000 \
20
+ --served-model-name Qwen/Qwen3.5-4B \
21
+ --tensor-parallel-size 2 \
22
+ --max-model-len 8192 \
23
+ --reasoning-parser qwen3 \
24
+ --language-model-only
25
+ ```
download_repo.py ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from huggingface_hub import snapshot_download
2
+
3
+
4
+ repo = "LeTue09/vllm-wheel"
5
+
6
+ snapshot_download(
7
+ repo_id=repo,
8
+ repo_type="model",
9
+ local_dir=f"/cm/shared/tue09/{repo}",
10
+ local_dir_use_symlinks=False,
11
+ )
install_from_archive.sh ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env bash
2
+ set -euo pipefail
3
+
4
+ tar -xzf vllm-wheel-linux-x86_64.tar.gz
5
+ python -m pip install --no-index --no-deps --force-reinstall \
6
+ ./vllm-0.23.1rc1.dev102+ga46abb7ae-cp38-abi3-manylinux_2_28_x86_64.whl
7
+ python -c "import vllm; print(vllm.__version__)"
vllm-wheel-linux-x86_64.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ca5b8f0632d38686082a18e82efb330e46765838ac621b1f24d80a061abc767
3
+ size 271631344