Upload folder using huggingface_hub
Browse files- .gitattributes +25 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_0 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_1 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_10 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_11 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_12 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_13 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_14 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_15 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_16 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_17 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_18 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_19 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_2 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_20 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_21 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_22 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_23 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_24 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_3 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_4 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_5 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_6 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_7 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_8 +3 -0
- 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_9 +3 -0
- 87528f5e8e/rank_0_0/backbone/cache_key_factors.json +190 -0
- 87528f5e8e/rank_0_0/backbone/computation_graph.py +0 -0
- 87528f5e8e/rank_0_0/backbone/vllm_compile_cache.py +50 -0
.gitattributes
ADDED
|
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_0 filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_1 filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_10 filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_11 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_12 filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_13 filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_14 filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_15 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_16 filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_17 filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_18 filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_19 filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_2 filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_20 filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_21 filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_22 filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_23 filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_24 filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_3 filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_4 filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_5 filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_6 filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_7 filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_8 filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_9 filter=lfs diff=lfs merge=lfs -text
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c84e1e26d868b02b43fcded458bbd21529c2064ff090c8f7523375df086ba648
|
| 3 |
+
size 1280088
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d8582d12fe32d9a765fe4f3ce86eaa48069109938d484cb5318fe96dce55b84
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_10
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_12
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_13
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_14
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_15
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_16
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_17
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_18
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_19
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_20
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_21
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_22
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_23
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_24
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f5504b9f24b90eceda2b176bd3c8d6213759cfc974406ed9b37031645b5297f
|
| 3 |
+
size 850054
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_8
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_9
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
|
| 3 |
+
size 1781682
|
87528f5e8e/rank_0_0/backbone/cache_key_factors.json
ADDED
|
@@ -0,0 +1,190 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"code_hash": "0d085c341409683b93462ace8da93154647fb6faa9f272ed53be27bc6c6e0417",
|
| 3 |
+
"compiler_hash": "f6a0d8ccc9",
|
| 4 |
+
"config_hash": "e339a61ac7",
|
| 5 |
+
"env": {
|
| 6 |
+
"CMAKE_BUILD_TYPE": null,
|
| 7 |
+
"CUDA_HOME": null,
|
| 8 |
+
"K_SCALE_CONSTANT": 200,
|
| 9 |
+
"NVCC_THREADS": null,
|
| 10 |
+
"Q_SCALE_CONSTANT": 200,
|
| 11 |
+
"RAY_EXPERIMENTAL_NOSET_ASCEND_RT_VISIBLE_DEVICES": null,
|
| 12 |
+
"RAY_EXPERIMENTAL_NOSET_CUDA_VISIBLE_DEVICES": null,
|
| 13 |
+
"RAY_EXPERIMENTAL_NOSET_HABANA_VISIBLE_MODULES": null,
|
| 14 |
+
"RAY_EXPERIMENTAL_NOSET_HIP_VISIBLE_DEVICES": null,
|
| 15 |
+
"RAY_EXPERIMENTAL_NOSET_NEURON_RT_VISIBLE_CORES": null,
|
| 16 |
+
"RAY_EXPERIMENTAL_NOSET_ONEAPI_DEVICE_SELECTOR": null,
|
| 17 |
+
"RAY_EXPERIMENTAL_NOSET_RBLN_RT_VISIBLE_DEVICES": null,
|
| 18 |
+
"RAY_EXPERIMENTAL_NOSET_ROCR_VISIBLE_DEVICES": null,
|
| 19 |
+
"RAY_EXPERIMENTAL_NOSET_TPU_VISIBLE_CHIPS": null,
|
| 20 |
+
"VERBOSE": false,
|
| 21 |
+
"VLLM_ALL2ALL_BACKEND": null,
|
| 22 |
+
"VLLM_ALLOW_CHUNKED_LOCAL_ATTN_WITH_HYBRID_KV_CACHE": true,
|
| 23 |
+
"VLLM_ALLOW_INSECURE_SERIALIZATION": false,
|
| 24 |
+
"VLLM_ALLOW_LONG_MAX_MODEL_LEN": false,
|
| 25 |
+
"VLLM_ALLOW_RUNTIME_LORA_UPDATING": false,
|
| 26 |
+
"VLLM_ALLREDUCE_USE_SYMM_MEM": true,
|
| 27 |
+
"VLLM_API_KEY": null,
|
| 28 |
+
"VLLM_ATTENTION_BACKEND": null,
|
| 29 |
+
"VLLM_BLOCKSCALE_FP8_GEMM_FLASHINFER": false,
|
| 30 |
+
"VLLM_COMPILE_CACHE_SAVE_FORMAT": "binary",
|
| 31 |
+
"VLLM_COMPUTE_NANS_IN_LOGITS": false,
|
| 32 |
+
"VLLM_CONFIGURE_LOGGING": true,
|
| 33 |
+
"VLLM_CONFIG_ROOT": "/root/.config/vllm",
|
| 34 |
+
"VLLM_CUDART_SO_PATH": null,
|
| 35 |
+
"VLLM_CUSTOM_SCOPES_FOR_PROFILING": false,
|
| 36 |
+
"VLLM_DBO_COMM_SMS": 20,
|
| 37 |
+
"VLLM_DEBUG_MFU_METRICS": false,
|
| 38 |
+
"VLLM_DEBUG_WORKSPACE": false,
|
| 39 |
+
"VLLM_DEEPEPLL_NVFP4_DISPATCH": false,
|
| 40 |
+
"VLLM_DEEPEP_BUFFER_SIZE_MB": 1024,
|
| 41 |
+
"VLLM_DEEPEP_HIGH_THROUGHPUT_FORCE_INTRA_NODE": false,
|
| 42 |
+
"VLLM_DEEPEP_LOW_LATENCY_USE_MNNVL": false,
|
| 43 |
+
"VLLM_DEEP_GEMM_WARMUP": "relax",
|
| 44 |
+
"VLLM_DISABLED_KERNELS": [],
|
| 45 |
+
"VLLM_DISABLE_COMPILE_CACHE": false,
|
| 46 |
+
"VLLM_DISABLE_FLASHINFER_PREFILL": false,
|
| 47 |
+
"VLLM_DISABLE_PYNCCL": false,
|
| 48 |
+
"VLLM_DISABLE_SHARED_EXPERTS_STREAM": false,
|
| 49 |
+
"VLLM_DOCKER_BUILD_CONTEXT": false,
|
| 50 |
+
"VLLM_DP_RANK": 0,
|
| 51 |
+
"VLLM_DP_RANK_LOCAL": 0,
|
| 52 |
+
"VLLM_DP_SIZE": 1,
|
| 53 |
+
"VLLM_ENABLE_CUDAGRAPH_GC": false,
|
| 54 |
+
"VLLM_ENABLE_FUSED_MOE_ACTIVATION_CHUNKING": true,
|
| 55 |
+
"VLLM_ENABLE_INDUCTOR_COORDINATE_DESCENT_TUNING": true,
|
| 56 |
+
"VLLM_ENABLE_INDUCTOR_MAX_AUTOTUNE": true,
|
| 57 |
+
"VLLM_ENABLE_MOE_DP_CHUNK": true,
|
| 58 |
+
"VLLM_ENABLE_RESPONSES_API_STORE": false,
|
| 59 |
+
"VLLM_ENGINE_READY_TIMEOUT_S": 600,
|
| 60 |
+
"VLLM_FLASHINFER_ALLREDUCE_FUSION_THRESHOLDS_MB": [],
|
| 61 |
+
"VLLM_FLASHINFER_DISABLE_Q_QUANTIZATION": false,
|
| 62 |
+
"VLLM_FLASHINFER_MOE_BACKEND": "latency",
|
| 63 |
+
"VLLM_FLASHINFER_WORKSPACE_BUFFER_SIZE": 413138944,
|
| 64 |
+
"VLLM_FLASH_ATTN_MAX_NUM_SPLITS_FOR_CUDA_GRAPH": 32,
|
| 65 |
+
"VLLM_FLASH_ATTN_VERSION": null,
|
| 66 |
+
"VLLM_FLOAT32_MATMUL_PRECISION": "highest",
|
| 67 |
+
"VLLM_FUSED_MOE_CHUNK_SIZE": 16384,
|
| 68 |
+
"VLLM_GC_DEBUG": "",
|
| 69 |
+
"VLLM_GPT_OSS_HARMONY_SYSTEM_INSTRUCTIONS": false,
|
| 70 |
+
"VLLM_GPT_OSS_SYSTEM_TOOL_MCP_LABELS": [],
|
| 71 |
+
"VLLM_HAS_FLASHINFER_CUBIN": false,
|
| 72 |
+
"VLLM_KV_CACHE_LAYOUT": null,
|
| 73 |
+
"VLLM_KV_EVENTS_USE_INT_BLOCK_HASHES": true,
|
| 74 |
+
"VLLM_LOG_BATCHSIZE_INTERVAL": -1.0,
|
| 75 |
+
"VLLM_LOG_MODEL_INSPECTION": false,
|
| 76 |
+
"VLLM_LOOPBACK_IP": "",
|
| 77 |
+
"VLLM_LORA_RESOLVER_CACHE_DIR": null,
|
| 78 |
+
"VLLM_MAIN_CUDA_VERSION": "12.9",
|
| 79 |
+
"VLLM_MARLIN_INPUT_DTYPE": null,
|
| 80 |
+
"VLLM_MARLIN_USE_ATOMIC_ADD": false,
|
| 81 |
+
"VLLM_MAX_TOKENS_PER_EXPERT_FP4_MOE": 163840,
|
| 82 |
+
"VLLM_MLA_DISABLE": false,
|
| 83 |
+
"VLLM_MOE_DP_CHUNK_SIZE": 256,
|
| 84 |
+
"VLLM_MOE_ROUTING_SIMULATION_STRATEGY": "",
|
| 85 |
+
"VLLM_MOE_USE_DEEP_GEMM": true,
|
| 86 |
+
"VLLM_MOONCAKE_ABORT_REQUEST_TIMEOUT": 480,
|
| 87 |
+
"VLLM_MOONCAKE_BOOTSTRAP_PORT": 8998,
|
| 88 |
+
"VLLM_MORIIO_CONNECTOR_READ_MODE": false,
|
| 89 |
+
"VLLM_MORIIO_NUM_WORKERS": 1,
|
| 90 |
+
"VLLM_MORIIO_POST_BATCH_SIZE": -1,
|
| 91 |
+
"VLLM_MORIIO_QP_PER_TRANSFER": 1,
|
| 92 |
+
"VLLM_MQ_MAX_CHUNK_BYTES_MB": 16,
|
| 93 |
+
"VLLM_MSGPACK_ZERO_COPY_THRESHOLD": 256,
|
| 94 |
+
"VLLM_MXFP4_USE_MARLIN": null,
|
| 95 |
+
"VLLM_NCCL_INCLUDE_PATH": null,
|
| 96 |
+
"VLLM_NCCL_SO_PATH": null,
|
| 97 |
+
"VLLM_NIXL_ABORT_REQUEST_TIMEOUT": 480,
|
| 98 |
+
"VLLM_NIXL_SIDE_CHANNEL_HOST": "localhost",
|
| 99 |
+
"VLLM_NIXL_SIDE_CHANNEL_PORT": 5600,
|
| 100 |
+
"VLLM_NVFP4_GEMM_BACKEND": null,
|
| 101 |
+
"VLLM_NVTX_SCOPES_FOR_PROFILING": false,
|
| 102 |
+
"VLLM_OBJECT_STORAGE_SHM_BUFFER_NAME": "VLLM_OBJECT_STORAGE_SHM_BUFFER",
|
| 103 |
+
"VLLM_PATTERN_MATCH_DEBUG": null,
|
| 104 |
+
"VLLM_PLUGINS": null,
|
| 105 |
+
"VLLM_PP_LAYER_PARTITION": null,
|
| 106 |
+
"VLLM_PROCESS_NAME_PREFIX": "VLLM",
|
| 107 |
+
"VLLM_PROFILER_DELAY_ITERS": null,
|
| 108 |
+
"VLLM_PROFILER_MAX_ITERS": null,
|
| 109 |
+
"VLLM_RAY_BUNDLE_INDICES": "",
|
| 110 |
+
"VLLM_RAY_DP_PACK_STRATEGY": "strict",
|
| 111 |
+
"VLLM_RAY_PER_WORKER_GPUS": 1.0,
|
| 112 |
+
"VLLM_ROCM_CUSTOM_PAGED_ATTN": true,
|
| 113 |
+
"VLLM_ROCM_FP8_MFMA_PAGE_ATTN": false,
|
| 114 |
+
"VLLM_ROCM_FP8_PADDING": true,
|
| 115 |
+
"VLLM_ROCM_MOE_PADDING": true,
|
| 116 |
+
"VLLM_ROCM_QUICK_REDUCE_CAST_BF16_TO_FP16": true,
|
| 117 |
+
"VLLM_ROCM_QUICK_REDUCE_MAX_SIZE_BYTES_MB": null,
|
| 118 |
+
"VLLM_ROCM_QUICK_REDUCE_QUANTIZATION": "NONE",
|
| 119 |
+
"VLLM_ROCM_SLEEP_MEM_CHUNK_SIZE": 256,
|
| 120 |
+
"VLLM_ROCM_USE_AITER": false,
|
| 121 |
+
"VLLM_ROCM_USE_AITER_FP4_ASM_GEMM": false,
|
| 122 |
+
"VLLM_ROCM_USE_AITER_FP8BMM": true,
|
| 123 |
+
"VLLM_ROCM_USE_AITER_FUSION_SHARED_EXPERTS": false,
|
| 124 |
+
"VLLM_ROCM_USE_AITER_LINEAR": true,
|
| 125 |
+
"VLLM_ROCM_USE_AITER_MHA": true,
|
| 126 |
+
"VLLM_ROCM_USE_AITER_MLA": true,
|
| 127 |
+
"VLLM_ROCM_USE_AITER_MOE": true,
|
| 128 |
+
"VLLM_ROCM_USE_AITER_PAGED_ATTN": false,
|
| 129 |
+
"VLLM_ROCM_USE_AITER_RMSNORM": true,
|
| 130 |
+
"VLLM_ROCM_USE_AITER_TRITON_GEMM": true,
|
| 131 |
+
"VLLM_ROCM_USE_AITER_TRITON_ROPE": false,
|
| 132 |
+
"VLLM_ROCM_USE_AITER_UNIFIED_ATTENTION": false,
|
| 133 |
+
"VLLM_ROCM_USE_SKINNY_GEMM": true,
|
| 134 |
+
"VLLM_RPC_TIMEOUT": 10000,
|
| 135 |
+
"VLLM_SHARED_EXPERTS_STREAM_TOKEN_THRESHOLD": 256,
|
| 136 |
+
"VLLM_SKIP_P2P_CHECK": true,
|
| 137 |
+
"VLLM_SKIP_PRECOMPILED_VERSION_SUFFIX": false,
|
| 138 |
+
"VLLM_TARGET_DEVICE": "cuda",
|
| 139 |
+
"VLLM_TEST_FORCE_FP8_MARLIN": false,
|
| 140 |
+
"VLLM_TOOL_JSON_ERROR_AUTOMATIC_RETRY": false,
|
| 141 |
+
"VLLM_TOOL_PARSE_REGEX_TIMEOUT_SECONDS": 1,
|
| 142 |
+
"VLLM_TORCH_CUDA_PROFILE": null,
|
| 143 |
+
"VLLM_TORCH_PROFILER_DIR": null,
|
| 144 |
+
"VLLM_TORCH_PROFILER_DISABLE_ASYNC_LLM": null,
|
| 145 |
+
"VLLM_TORCH_PROFILER_DUMP_CUDA_TIME_TOTAL": null,
|
| 146 |
+
"VLLM_TORCH_PROFILER_RECORD_SHAPES": null,
|
| 147 |
+
"VLLM_TORCH_PROFILER_USE_GZIP": null,
|
| 148 |
+
"VLLM_TORCH_PROFILER_WITH_FLOPS": null,
|
| 149 |
+
"VLLM_TORCH_PROFILER_WITH_PROFILE_MEMORY": null,
|
| 150 |
+
"VLLM_TORCH_PROFILER_WITH_STACK": null,
|
| 151 |
+
"VLLM_TPU_BUCKET_PADDING_GAP": 0,
|
| 152 |
+
"VLLM_TPU_MOST_MODEL_LEN": null,
|
| 153 |
+
"VLLM_TPU_USING_PATHWAYS": false,
|
| 154 |
+
"VLLM_TRACE_FUNCTION": 0,
|
| 155 |
+
"VLLM_USAGE_SOURCE": "production",
|
| 156 |
+
"VLLM_USE_AOT_COMPILE": false,
|
| 157 |
+
"VLLM_USE_BYTECODE_HOOK": true,
|
| 158 |
+
"VLLM_USE_CUDNN_PREFILL": false,
|
| 159 |
+
"VLLM_USE_DEEP_GEMM": true,
|
| 160 |
+
"VLLM_USE_DEEP_GEMM_E8M0": true,
|
| 161 |
+
"VLLM_USE_EXPERIMENTAL_PARSER_CONTEXT": false,
|
| 162 |
+
"VLLM_USE_FBGEMM": false,
|
| 163 |
+
"VLLM_USE_FLASHINFER_MOE_FP16": false,
|
| 164 |
+
"VLLM_USE_FLASHINFER_MOE_FP4": false,
|
| 165 |
+
"VLLM_USE_FLASHINFER_MOE_FP8": false,
|
| 166 |
+
"VLLM_USE_FLASHINFER_MOE_MXFP4_BF16": false,
|
| 167 |
+
"VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8": false,
|
| 168 |
+
"VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8_CUTLASS": false,
|
| 169 |
+
"VLLM_USE_FLASHINFER_SAMPLER": null,
|
| 170 |
+
"VLLM_USE_FUSED_MOE_GROUPED_TOPK": true,
|
| 171 |
+
"VLLM_USE_NCCL_SYMM_MEM": false,
|
| 172 |
+
"VLLM_USE_NVFP4_CT_EMULATIONS": false,
|
| 173 |
+
"VLLM_USE_PRECOMPILED": false,
|
| 174 |
+
"VLLM_USE_RAY_COMPILED_DAG_CHANNEL_TYPE": "auto",
|
| 175 |
+
"VLLM_USE_RAY_COMPILED_DAG_OVERLAP_COMM": false,
|
| 176 |
+
"VLLM_USE_RAY_WRAPPED_PP_COMM": true,
|
| 177 |
+
"VLLM_USE_STANDALONE_COMPILE": true,
|
| 178 |
+
"VLLM_USE_TRITON_AWQ": false,
|
| 179 |
+
"VLLM_USE_TRTLLM_ATTENTION": null,
|
| 180 |
+
"VLLM_USE_TRTLLM_RAGGED_DEEPSEEK_PREFILL": false,
|
| 181 |
+
"VLLM_USE_V2_MODEL_RUNNER": false,
|
| 182 |
+
"VLLM_V1_USE_OUTLINES_CACHE": false,
|
| 183 |
+
"VLLM_V1_USE_PREFILL_DECODE_ATTENTION": false,
|
| 184 |
+
"VLLM_XGRAMMAR_CACHE_MB": 512,
|
| 185 |
+
"VLLM_XLA_CACHE_PATH": "/root/.cache/vllm/xla_cache",
|
| 186 |
+
"VLLM_XLA_CHECK_RECOMPILATION": false,
|
| 187 |
+
"VLLM_XLA_USE_SPMD": false,
|
| 188 |
+
"V_SCALE_CONSTANT": 100
|
| 189 |
+
}
|
| 190 |
+
}
|
87528f5e8e/rank_0_0/backbone/computation_graph.py
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
87528f5e8e/rank_0_0/backbone/vllm_compile_cache.py
ADDED
|
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{ ((1, 8192), 0, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_0',
|
| 2 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_0'),
|
| 3 |
+
((1, 8192), 1, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_1',
|
| 4 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_1'),
|
| 5 |
+
((1, 8192), 2, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_2',
|
| 6 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_2'),
|
| 7 |
+
((1, 8192), 3, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_3',
|
| 8 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_3'),
|
| 9 |
+
((1, 8192), 4, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_4',
|
| 10 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_4'),
|
| 11 |
+
((1, 8192), 5, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_5',
|
| 12 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_5'),
|
| 13 |
+
((1, 8192), 6, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_6',
|
| 14 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_6'),
|
| 15 |
+
((1, 8192), 7, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_7',
|
| 16 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_7'),
|
| 17 |
+
((1, 8192), 8, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_8',
|
| 18 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_8'),
|
| 19 |
+
((1, 8192), 9, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_9',
|
| 20 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_9'),
|
| 21 |
+
((1, 8192), 10, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_10',
|
| 22 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_10'),
|
| 23 |
+
((1, 8192), 11, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_11',
|
| 24 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_11'),
|
| 25 |
+
((1, 8192), 12, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_12',
|
| 26 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_12'),
|
| 27 |
+
((1, 8192), 13, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_13',
|
| 28 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_13'),
|
| 29 |
+
((1, 8192), 14, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_14',
|
| 30 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_14'),
|
| 31 |
+
((1, 8192), 15, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_15',
|
| 32 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_15'),
|
| 33 |
+
((1, 8192), 16, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_16',
|
| 34 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_16'),
|
| 35 |
+
((1, 8192), 17, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_17',
|
| 36 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_17'),
|
| 37 |
+
((1, 8192), 18, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_18',
|
| 38 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_18'),
|
| 39 |
+
((1, 8192), 19, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_19',
|
| 40 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_19'),
|
| 41 |
+
((1, 8192), 20, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_20',
|
| 42 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_20'),
|
| 43 |
+
((1, 8192), 21, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_21',
|
| 44 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_21'),
|
| 45 |
+
((1, 8192), 22, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_22',
|
| 46 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_22'),
|
| 47 |
+
((1, 8192), 23, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_23',
|
| 48 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_23'),
|
| 49 |
+
((1, 8192), 24, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_24',
|
| 50 |
+
'/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_24')}
|