erikkaum HF Staff commited on
Commit
f3311c0
·
verified ·
1 Parent(s): 40f6aca

Upload folder using huggingface_hub

Browse files
Files changed (29) hide show
  1. .gitattributes +25 -0
  2. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_0 +3 -0
  3. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_1 +3 -0
  4. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_10 +3 -0
  5. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_11 +3 -0
  6. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_12 +3 -0
  7. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_13 +3 -0
  8. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_14 +3 -0
  9. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_15 +3 -0
  10. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_16 +3 -0
  11. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_17 +3 -0
  12. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_18 +3 -0
  13. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_19 +3 -0
  14. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_2 +3 -0
  15. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_20 +3 -0
  16. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_21 +3 -0
  17. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_22 +3 -0
  18. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_23 +3 -0
  19. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_24 +3 -0
  20. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_3 +3 -0
  21. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_4 +3 -0
  22. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_5 +3 -0
  23. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_6 +3 -0
  24. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_7 +3 -0
  25. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_8 +3 -0
  26. 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_9 +3 -0
  27. 87528f5e8e/rank_0_0/backbone/cache_key_factors.json +190 -0
  28. 87528f5e8e/rank_0_0/backbone/computation_graph.py +0 -0
  29. 87528f5e8e/rank_0_0/backbone/vllm_compile_cache.py +50 -0
.gitattributes ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_0 filter=lfs diff=lfs merge=lfs -text
2
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_1 filter=lfs diff=lfs merge=lfs -text
3
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_10 filter=lfs diff=lfs merge=lfs -text
4
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_11 filter=lfs diff=lfs merge=lfs -text
5
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_12 filter=lfs diff=lfs merge=lfs -text
6
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_13 filter=lfs diff=lfs merge=lfs -text
7
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_14 filter=lfs diff=lfs merge=lfs -text
8
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_15 filter=lfs diff=lfs merge=lfs -text
9
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_16 filter=lfs diff=lfs merge=lfs -text
10
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_17 filter=lfs diff=lfs merge=lfs -text
11
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_18 filter=lfs diff=lfs merge=lfs -text
12
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_19 filter=lfs diff=lfs merge=lfs -text
13
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_2 filter=lfs diff=lfs merge=lfs -text
14
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_20 filter=lfs diff=lfs merge=lfs -text
15
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_21 filter=lfs diff=lfs merge=lfs -text
16
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_22 filter=lfs diff=lfs merge=lfs -text
17
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_23 filter=lfs diff=lfs merge=lfs -text
18
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_24 filter=lfs diff=lfs merge=lfs -text
19
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_3 filter=lfs diff=lfs merge=lfs -text
20
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_4 filter=lfs diff=lfs merge=lfs -text
21
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_5 filter=lfs diff=lfs merge=lfs -text
22
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_6 filter=lfs diff=lfs merge=lfs -text
23
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_7 filter=lfs diff=lfs merge=lfs -text
24
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_8 filter=lfs diff=lfs merge=lfs -text
25
+ 87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_9 filter=lfs diff=lfs merge=lfs -text
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c84e1e26d868b02b43fcded458bbd21529c2064ff090c8f7523375df086ba648
3
+ size 1280088
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d8582d12fe32d9a765fe4f3ce86eaa48069109938d484cb5318fe96dce55b84
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_17 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_18 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_19 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_20 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_21 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_22 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_23 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_24 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f5504b9f24b90eceda2b176bd3c8d6213759cfc974406ed9b37031645b5297f
3
+ size 850054
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a85fc138ac08e60bc0eb04e154cffd99e1fb1e732bb357582b94299004a2d941
3
+ size 1781682
87528f5e8e/rank_0_0/backbone/cache_key_factors.json ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "code_hash": "0d085c341409683b93462ace8da93154647fb6faa9f272ed53be27bc6c6e0417",
3
+ "compiler_hash": "f6a0d8ccc9",
4
+ "config_hash": "e339a61ac7",
5
+ "env": {
6
+ "CMAKE_BUILD_TYPE": null,
7
+ "CUDA_HOME": null,
8
+ "K_SCALE_CONSTANT": 200,
9
+ "NVCC_THREADS": null,
10
+ "Q_SCALE_CONSTANT": 200,
11
+ "RAY_EXPERIMENTAL_NOSET_ASCEND_RT_VISIBLE_DEVICES": null,
12
+ "RAY_EXPERIMENTAL_NOSET_CUDA_VISIBLE_DEVICES": null,
13
+ "RAY_EXPERIMENTAL_NOSET_HABANA_VISIBLE_MODULES": null,
14
+ "RAY_EXPERIMENTAL_NOSET_HIP_VISIBLE_DEVICES": null,
15
+ "RAY_EXPERIMENTAL_NOSET_NEURON_RT_VISIBLE_CORES": null,
16
+ "RAY_EXPERIMENTAL_NOSET_ONEAPI_DEVICE_SELECTOR": null,
17
+ "RAY_EXPERIMENTAL_NOSET_RBLN_RT_VISIBLE_DEVICES": null,
18
+ "RAY_EXPERIMENTAL_NOSET_ROCR_VISIBLE_DEVICES": null,
19
+ "RAY_EXPERIMENTAL_NOSET_TPU_VISIBLE_CHIPS": null,
20
+ "VERBOSE": false,
21
+ "VLLM_ALL2ALL_BACKEND": null,
22
+ "VLLM_ALLOW_CHUNKED_LOCAL_ATTN_WITH_HYBRID_KV_CACHE": true,
23
+ "VLLM_ALLOW_INSECURE_SERIALIZATION": false,
24
+ "VLLM_ALLOW_LONG_MAX_MODEL_LEN": false,
25
+ "VLLM_ALLOW_RUNTIME_LORA_UPDATING": false,
26
+ "VLLM_ALLREDUCE_USE_SYMM_MEM": true,
27
+ "VLLM_API_KEY": null,
28
+ "VLLM_ATTENTION_BACKEND": null,
29
+ "VLLM_BLOCKSCALE_FP8_GEMM_FLASHINFER": false,
30
+ "VLLM_COMPILE_CACHE_SAVE_FORMAT": "binary",
31
+ "VLLM_COMPUTE_NANS_IN_LOGITS": false,
32
+ "VLLM_CONFIGURE_LOGGING": true,
33
+ "VLLM_CONFIG_ROOT": "/root/.config/vllm",
34
+ "VLLM_CUDART_SO_PATH": null,
35
+ "VLLM_CUSTOM_SCOPES_FOR_PROFILING": false,
36
+ "VLLM_DBO_COMM_SMS": 20,
37
+ "VLLM_DEBUG_MFU_METRICS": false,
38
+ "VLLM_DEBUG_WORKSPACE": false,
39
+ "VLLM_DEEPEPLL_NVFP4_DISPATCH": false,
40
+ "VLLM_DEEPEP_BUFFER_SIZE_MB": 1024,
41
+ "VLLM_DEEPEP_HIGH_THROUGHPUT_FORCE_INTRA_NODE": false,
42
+ "VLLM_DEEPEP_LOW_LATENCY_USE_MNNVL": false,
43
+ "VLLM_DEEP_GEMM_WARMUP": "relax",
44
+ "VLLM_DISABLED_KERNELS": [],
45
+ "VLLM_DISABLE_COMPILE_CACHE": false,
46
+ "VLLM_DISABLE_FLASHINFER_PREFILL": false,
47
+ "VLLM_DISABLE_PYNCCL": false,
48
+ "VLLM_DISABLE_SHARED_EXPERTS_STREAM": false,
49
+ "VLLM_DOCKER_BUILD_CONTEXT": false,
50
+ "VLLM_DP_RANK": 0,
51
+ "VLLM_DP_RANK_LOCAL": 0,
52
+ "VLLM_DP_SIZE": 1,
53
+ "VLLM_ENABLE_CUDAGRAPH_GC": false,
54
+ "VLLM_ENABLE_FUSED_MOE_ACTIVATION_CHUNKING": true,
55
+ "VLLM_ENABLE_INDUCTOR_COORDINATE_DESCENT_TUNING": true,
56
+ "VLLM_ENABLE_INDUCTOR_MAX_AUTOTUNE": true,
57
+ "VLLM_ENABLE_MOE_DP_CHUNK": true,
58
+ "VLLM_ENABLE_RESPONSES_API_STORE": false,
59
+ "VLLM_ENGINE_READY_TIMEOUT_S": 600,
60
+ "VLLM_FLASHINFER_ALLREDUCE_FUSION_THRESHOLDS_MB": [],
61
+ "VLLM_FLASHINFER_DISABLE_Q_QUANTIZATION": false,
62
+ "VLLM_FLASHINFER_MOE_BACKEND": "latency",
63
+ "VLLM_FLASHINFER_WORKSPACE_BUFFER_SIZE": 413138944,
64
+ "VLLM_FLASH_ATTN_MAX_NUM_SPLITS_FOR_CUDA_GRAPH": 32,
65
+ "VLLM_FLASH_ATTN_VERSION": null,
66
+ "VLLM_FLOAT32_MATMUL_PRECISION": "highest",
67
+ "VLLM_FUSED_MOE_CHUNK_SIZE": 16384,
68
+ "VLLM_GC_DEBUG": "",
69
+ "VLLM_GPT_OSS_HARMONY_SYSTEM_INSTRUCTIONS": false,
70
+ "VLLM_GPT_OSS_SYSTEM_TOOL_MCP_LABELS": [],
71
+ "VLLM_HAS_FLASHINFER_CUBIN": false,
72
+ "VLLM_KV_CACHE_LAYOUT": null,
73
+ "VLLM_KV_EVENTS_USE_INT_BLOCK_HASHES": true,
74
+ "VLLM_LOG_BATCHSIZE_INTERVAL": -1.0,
75
+ "VLLM_LOG_MODEL_INSPECTION": false,
76
+ "VLLM_LOOPBACK_IP": "",
77
+ "VLLM_LORA_RESOLVER_CACHE_DIR": null,
78
+ "VLLM_MAIN_CUDA_VERSION": "12.9",
79
+ "VLLM_MARLIN_INPUT_DTYPE": null,
80
+ "VLLM_MARLIN_USE_ATOMIC_ADD": false,
81
+ "VLLM_MAX_TOKENS_PER_EXPERT_FP4_MOE": 163840,
82
+ "VLLM_MLA_DISABLE": false,
83
+ "VLLM_MOE_DP_CHUNK_SIZE": 256,
84
+ "VLLM_MOE_ROUTING_SIMULATION_STRATEGY": "",
85
+ "VLLM_MOE_USE_DEEP_GEMM": true,
86
+ "VLLM_MOONCAKE_ABORT_REQUEST_TIMEOUT": 480,
87
+ "VLLM_MOONCAKE_BOOTSTRAP_PORT": 8998,
88
+ "VLLM_MORIIO_CONNECTOR_READ_MODE": false,
89
+ "VLLM_MORIIO_NUM_WORKERS": 1,
90
+ "VLLM_MORIIO_POST_BATCH_SIZE": -1,
91
+ "VLLM_MORIIO_QP_PER_TRANSFER": 1,
92
+ "VLLM_MQ_MAX_CHUNK_BYTES_MB": 16,
93
+ "VLLM_MSGPACK_ZERO_COPY_THRESHOLD": 256,
94
+ "VLLM_MXFP4_USE_MARLIN": null,
95
+ "VLLM_NCCL_INCLUDE_PATH": null,
96
+ "VLLM_NCCL_SO_PATH": null,
97
+ "VLLM_NIXL_ABORT_REQUEST_TIMEOUT": 480,
98
+ "VLLM_NIXL_SIDE_CHANNEL_HOST": "localhost",
99
+ "VLLM_NIXL_SIDE_CHANNEL_PORT": 5600,
100
+ "VLLM_NVFP4_GEMM_BACKEND": null,
101
+ "VLLM_NVTX_SCOPES_FOR_PROFILING": false,
102
+ "VLLM_OBJECT_STORAGE_SHM_BUFFER_NAME": "VLLM_OBJECT_STORAGE_SHM_BUFFER",
103
+ "VLLM_PATTERN_MATCH_DEBUG": null,
104
+ "VLLM_PLUGINS": null,
105
+ "VLLM_PP_LAYER_PARTITION": null,
106
+ "VLLM_PROCESS_NAME_PREFIX": "VLLM",
107
+ "VLLM_PROFILER_DELAY_ITERS": null,
108
+ "VLLM_PROFILER_MAX_ITERS": null,
109
+ "VLLM_RAY_BUNDLE_INDICES": "",
110
+ "VLLM_RAY_DP_PACK_STRATEGY": "strict",
111
+ "VLLM_RAY_PER_WORKER_GPUS": 1.0,
112
+ "VLLM_ROCM_CUSTOM_PAGED_ATTN": true,
113
+ "VLLM_ROCM_FP8_MFMA_PAGE_ATTN": false,
114
+ "VLLM_ROCM_FP8_PADDING": true,
115
+ "VLLM_ROCM_MOE_PADDING": true,
116
+ "VLLM_ROCM_QUICK_REDUCE_CAST_BF16_TO_FP16": true,
117
+ "VLLM_ROCM_QUICK_REDUCE_MAX_SIZE_BYTES_MB": null,
118
+ "VLLM_ROCM_QUICK_REDUCE_QUANTIZATION": "NONE",
119
+ "VLLM_ROCM_SLEEP_MEM_CHUNK_SIZE": 256,
120
+ "VLLM_ROCM_USE_AITER": false,
121
+ "VLLM_ROCM_USE_AITER_FP4_ASM_GEMM": false,
122
+ "VLLM_ROCM_USE_AITER_FP8BMM": true,
123
+ "VLLM_ROCM_USE_AITER_FUSION_SHARED_EXPERTS": false,
124
+ "VLLM_ROCM_USE_AITER_LINEAR": true,
125
+ "VLLM_ROCM_USE_AITER_MHA": true,
126
+ "VLLM_ROCM_USE_AITER_MLA": true,
127
+ "VLLM_ROCM_USE_AITER_MOE": true,
128
+ "VLLM_ROCM_USE_AITER_PAGED_ATTN": false,
129
+ "VLLM_ROCM_USE_AITER_RMSNORM": true,
130
+ "VLLM_ROCM_USE_AITER_TRITON_GEMM": true,
131
+ "VLLM_ROCM_USE_AITER_TRITON_ROPE": false,
132
+ "VLLM_ROCM_USE_AITER_UNIFIED_ATTENTION": false,
133
+ "VLLM_ROCM_USE_SKINNY_GEMM": true,
134
+ "VLLM_RPC_TIMEOUT": 10000,
135
+ "VLLM_SHARED_EXPERTS_STREAM_TOKEN_THRESHOLD": 256,
136
+ "VLLM_SKIP_P2P_CHECK": true,
137
+ "VLLM_SKIP_PRECOMPILED_VERSION_SUFFIX": false,
138
+ "VLLM_TARGET_DEVICE": "cuda",
139
+ "VLLM_TEST_FORCE_FP8_MARLIN": false,
140
+ "VLLM_TOOL_JSON_ERROR_AUTOMATIC_RETRY": false,
141
+ "VLLM_TOOL_PARSE_REGEX_TIMEOUT_SECONDS": 1,
142
+ "VLLM_TORCH_CUDA_PROFILE": null,
143
+ "VLLM_TORCH_PROFILER_DIR": null,
144
+ "VLLM_TORCH_PROFILER_DISABLE_ASYNC_LLM": null,
145
+ "VLLM_TORCH_PROFILER_DUMP_CUDA_TIME_TOTAL": null,
146
+ "VLLM_TORCH_PROFILER_RECORD_SHAPES": null,
147
+ "VLLM_TORCH_PROFILER_USE_GZIP": null,
148
+ "VLLM_TORCH_PROFILER_WITH_FLOPS": null,
149
+ "VLLM_TORCH_PROFILER_WITH_PROFILE_MEMORY": null,
150
+ "VLLM_TORCH_PROFILER_WITH_STACK": null,
151
+ "VLLM_TPU_BUCKET_PADDING_GAP": 0,
152
+ "VLLM_TPU_MOST_MODEL_LEN": null,
153
+ "VLLM_TPU_USING_PATHWAYS": false,
154
+ "VLLM_TRACE_FUNCTION": 0,
155
+ "VLLM_USAGE_SOURCE": "production",
156
+ "VLLM_USE_AOT_COMPILE": false,
157
+ "VLLM_USE_BYTECODE_HOOK": true,
158
+ "VLLM_USE_CUDNN_PREFILL": false,
159
+ "VLLM_USE_DEEP_GEMM": true,
160
+ "VLLM_USE_DEEP_GEMM_E8M0": true,
161
+ "VLLM_USE_EXPERIMENTAL_PARSER_CONTEXT": false,
162
+ "VLLM_USE_FBGEMM": false,
163
+ "VLLM_USE_FLASHINFER_MOE_FP16": false,
164
+ "VLLM_USE_FLASHINFER_MOE_FP4": false,
165
+ "VLLM_USE_FLASHINFER_MOE_FP8": false,
166
+ "VLLM_USE_FLASHINFER_MOE_MXFP4_BF16": false,
167
+ "VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8": false,
168
+ "VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8_CUTLASS": false,
169
+ "VLLM_USE_FLASHINFER_SAMPLER": null,
170
+ "VLLM_USE_FUSED_MOE_GROUPED_TOPK": true,
171
+ "VLLM_USE_NCCL_SYMM_MEM": false,
172
+ "VLLM_USE_NVFP4_CT_EMULATIONS": false,
173
+ "VLLM_USE_PRECOMPILED": false,
174
+ "VLLM_USE_RAY_COMPILED_DAG_CHANNEL_TYPE": "auto",
175
+ "VLLM_USE_RAY_COMPILED_DAG_OVERLAP_COMM": false,
176
+ "VLLM_USE_RAY_WRAPPED_PP_COMM": true,
177
+ "VLLM_USE_STANDALONE_COMPILE": true,
178
+ "VLLM_USE_TRITON_AWQ": false,
179
+ "VLLM_USE_TRTLLM_ATTENTION": null,
180
+ "VLLM_USE_TRTLLM_RAGGED_DEEPSEEK_PREFILL": false,
181
+ "VLLM_USE_V2_MODEL_RUNNER": false,
182
+ "VLLM_V1_USE_OUTLINES_CACHE": false,
183
+ "VLLM_V1_USE_PREFILL_DECODE_ATTENTION": false,
184
+ "VLLM_XGRAMMAR_CACHE_MB": 512,
185
+ "VLLM_XLA_CACHE_PATH": "/root/.cache/vllm/xla_cache",
186
+ "VLLM_XLA_CHECK_RECOMPILATION": false,
187
+ "VLLM_XLA_USE_SPMD": false,
188
+ "V_SCALE_CONSTANT": 100
189
+ }
190
+ }
87528f5e8e/rank_0_0/backbone/computation_graph.py ADDED
The diff for this file is too large to render. See raw diff
 
87528f5e8e/rank_0_0/backbone/vllm_compile_cache.py ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ { ((1, 8192), 0, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_0',
2
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_0'),
3
+ ((1, 8192), 1, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_1',
4
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_1'),
5
+ ((1, 8192), 2, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_2',
6
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_2'),
7
+ ((1, 8192), 3, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_3',
8
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_3'),
9
+ ((1, 8192), 4, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_4',
10
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_4'),
11
+ ((1, 8192), 5, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_5',
12
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_5'),
13
+ ((1, 8192), 6, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_6',
14
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_6'),
15
+ ((1, 8192), 7, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_7',
16
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_7'),
17
+ ((1, 8192), 8, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_8',
18
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_8'),
19
+ ((1, 8192), 9, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_9',
20
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_9'),
21
+ ((1, 8192), 10, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_10',
22
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_10'),
23
+ ((1, 8192), 11, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_11',
24
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_11'),
25
+ ((1, 8192), 12, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_12',
26
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_12'),
27
+ ((1, 8192), 13, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_13',
28
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_13'),
29
+ ((1, 8192), 14, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_14',
30
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_14'),
31
+ ((1, 8192), 15, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_15',
32
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_15'),
33
+ ((1, 8192), 16, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_16',
34
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_16'),
35
+ ((1, 8192), 17, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_17',
36
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_17'),
37
+ ((1, 8192), 18, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_18',
38
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_18'),
39
+ ((1, 8192), 19, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_19',
40
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_19'),
41
+ ((1, 8192), 20, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_20',
42
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_20'),
43
+ ((1, 8192), 21, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_21',
44
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_21'),
45
+ ((1, 8192), 22, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_22',
46
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_22'),
47
+ ((1, 8192), 23, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_23',
48
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_23'),
49
+ ((1, 8192), 24, 'inductor_standalone'): ( 'artifact_compile_range_1_8192_subgraph_24',
50
+ '/root/.cache/vllm/torch_compile_cache/87528f5e8e/rank_0_0/backbone/artifact_compile_range_1_8192_subgraph_24')}