test
Browse files
vaedecode_fp8ization_wan21_fp8_20260109_233933_0eee5653_e567f199.log
ADDED
|
@@ -0,0 +1,209 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[2026-01-09 23:39:33] [INFO] === WAN21 ONNX->ModelOpt Quantization Run START ===
|
| 2 |
+
[2026-01-09 23:39:33] [INFO] log_path: /ComfyUI/output/vaedecode_fp8ization_wan21_fp8_20260109_233933_0eee5653_e567f199.log
|
| 3 |
+
[2026-01-09 23:39:33] [INFO] LD_LIBRARY_PATH already contains: /usr/lib/x86_64-linux-gnu
|
| 4 |
+
[2026-01-09 23:39:33] [INFO] Versions:
|
| 5 |
+
{
|
| 6 |
+
"python": "3.12.3 (main, Nov 6 2025, 13:44:16) [GCC 13.3.0]",
|
| 7 |
+
"numpy": "1.26.4",
|
| 8 |
+
"onnx": "1.19.1",
|
| 9 |
+
"onnxruntime": "1.22.1",
|
| 10 |
+
"tensorrt": "10.14.1.48.post1",
|
| 11 |
+
"modelopt": "0.40.0"
|
| 12 |
+
}
|
| 13 |
+
[2026-01-09 23:39:33] [INFO] onnxruntime.get_available_providers(): ['AzureExecutionProvider', 'CPUExecutionProvider']
|
| 14 |
+
[2026-01-09 23:39:33] [INFO] workdir: /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199
|
| 15 |
+
[2026-01-09 23:39:33] [INFO] Copied ONNX into workdir:
|
| 16 |
+
src: /ComfyUI/custom_nodes/vaedecode_fp8ization.onnx
|
| 17 |
+
dst: /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization.onnx
|
| 18 |
+
[2026-01-09 23:39:34] [INFO] No external data files were copied (model may be embedded).
|
| 19 |
+
[2026-01-09 23:39:34] [INFO] Loaded ONNX: /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization.onnx
|
| 20 |
+
[2026-01-09 23:39:34] [INFO] Model inputs: ['latent']
|
| 21 |
+
[2026-01-09 23:39:34] [INFO] Model outputs: ['video']
|
| 22 |
+
[2026-01-09 23:39:34] [INFO] latent dims (as exported): ['B', 16, 11, 72, 42]
|
| 23 |
+
[2026-01-09 23:39:34] [INFO] video dims (as exported): ['B', 'Transposevideo_dim_1', 'Transposevideo_dim_2', 'Transposevideo_dim_3', 3]
|
| 24 |
+
[2026-01-09 23:39:34] [INFO] WAN IO verified (or best-effort verified).
|
| 25 |
+
[2026-01-09 23:39:36] [INFO] Initial onnx.checker.check_model OK
|
| 26 |
+
[2026-01-09 23:39:36] [INFO] Created initializer: __wan_resize_roi_empty_f32 (empty float32 tensor)
|
| 27 |
+
[2026-01-09 23:39:36] [INFO] Created initializer: __wan_resize_scales_1_1_2_2_f32 (float32 [1,1,2,2])
|
| 28 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 29 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 30 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 31 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_1/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_1/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 32 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_1/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_1/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 33 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_1/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_1/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 34 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_2/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_2/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 35 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_2/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_2/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 36 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_2/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_2/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 37 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_3/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_3/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 38 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_3/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_3/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 39 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_3/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_3/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 40 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_4/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_4/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 41 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_4/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_4/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 42 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_4/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_4/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 43 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_5/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_5/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 44 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_5/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_5/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 45 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_5/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_5/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 46 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_6/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_6/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 47 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_6/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_6/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 48 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_6/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_6/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 49 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_7/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_7/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 50 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_7/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_7/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 51 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_7/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_7/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 52 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_8/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_8/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 53 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_8/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_8/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 54 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_8/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_8/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 55 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_9/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_9/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 56 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_9/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_9/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 57 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_9/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_9/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 58 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.3/resample/resample.0_10/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.3_10/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 59 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.7/resample/resample.0_10/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.7_10/Reshape_2_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 60 |
+
[2026-01-09 23:39:36] [INFO] [WAN FORCE 2x] /decoder/upsamples.11/resample/resample.0_10/Resize: roi=__wan_resize_roi_empty_f32, scales=__wan_resize_scales_1_1_2_2_f32, sizes omitted. inputs=['/decoder/upsamples.11_10/Reshape_output_0', '__wan_resize_roi_empty_f32', '__wan_resize_scales_1_1_2_2_f32', '']
|
| 61 |
+
[2026-01-09 23:39:36] [INFO] ResizeFixStats:
|
| 62 |
+
{
|
| 63 |
+
"resize_total": 33,
|
| 64 |
+
"resized_both_present_fixed": 0,
|
| 65 |
+
"resized_empty_scales_dropped": 0,
|
| 66 |
+
"resized_wan_forced_2x": 33,
|
| 67 |
+
"resized_unfixable": 0,
|
| 68 |
+
"resized_scales_only_ok": 0,
|
| 69 |
+
"resized_sizes_only_ok": 0
|
| 70 |
+
}
|
| 71 |
+
[2026-01-09 23:39:36] [INFO] Model opset (pre-quant): 18
|
| 72 |
+
[2026-01-09 23:39:36] [WARN] Model opset 18 < 19; attempting convert_version(model, 19) for FP8.
|
| 73 |
+
[2026-01-09 23:40:04] [INFO] Opset conversion to 19: OK
|
| 74 |
+
[2026-01-09 23:40:04] [INFO] Saved ONNX: /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fixed.onnx (external=True, location=vaedecode_fp8ization_wan21_fixed.onnx_data)
|
| 75 |
+
[2026-01-09 23:40:05] [INFO] onnx.checker.check_model OK
|
| 76 |
+
[2026-01-09 23:40:11] [INFO] ORT CPU InferenceSession load OK
|
| 77 |
+
[2026-01-09 23:40:12] [INFO] Wrote calibration npz: /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_calib_latent_64.npz (latent shape=(64, 16, 11, 72, 42), dtype=float32, seed=0)
|
| 78 |
+
[2026-01-09 23:40:12] [WARN] Requested EP 'cuda:0' but CUDAExecutionProvider not present in ORT provider list.
|
| 79 |
+
[2026-01-09 23:40:12] [WARN] Requested EP 'trt' but TensorrtExecutionProvider not present in ORT provider list.
|
| 80 |
+
[2026-01-09 23:40:12] [INFO] Filtered calibration_eps: ['cpu']
|
| 81 |
+
[2026-01-09 23:40:12] [INFO] ModelOpt Python API kwargs:
|
| 82 |
+
{
|
| 83 |
+
"onnx_path": "/ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fixed.onnx",
|
| 84 |
+
"output_path": "/ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fp8_quant.onnx",
|
| 85 |
+
"quantize_mode": "fp8",
|
| 86 |
+
"calibration_method": "entropy",
|
| 87 |
+
"calibration_data": "NpzFile '/ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_calib_latent_64.npz' with keys: latent",
|
| 88 |
+
"calibration_eps": [
|
| 89 |
+
"cpu"
|
| 90 |
+
],
|
| 91 |
+
"override_shapes": "latent:1x16x11x72x42",
|
| 92 |
+
"use_external_data_format": true,
|
| 93 |
+
"calibrate_per_node": true,
|
| 94 |
+
"dq_only": true,
|
| 95 |
+
"disable_mha_qdq": true,
|
| 96 |
+
"keep_intermediate_files": true,
|
| 97 |
+
"high_precision_dtype": "fp32"
|
| 98 |
+
}
|
| 99 |
+
[2026-01-09 23:40:24] [ERROR] ModelOpt Python API failed: Data of TensorProto ( tensor name: onnx::Mul_32598) should be stored in vaedecode_fp8ization_wan21_fixed_static.onnx_data, but it doesn't exist or is not accessible.
|
| 100 |
+
[2026-01-09 23:40:24] [ERROR] Traceback (most recent call last):
|
| 101 |
+
File "/ComfyUI/custom_nodes/comfyui-vae-tensorrt/nodes/gpt1_onnx_to_fp8.py", line 986, in _modelopt_quantize_python_api
|
| 102 |
+
moq.quantize(**kwargs)
|
| 103 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/quantize.py", line 413, in quantize
|
| 104 |
+
) = _preprocess_onnx(
|
| 105 |
+
^^^^^^^^^^^^^^^^^
|
| 106 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/quantize.py", line 166, in _preprocess_onnx
|
| 107 |
+
onnx_model, is_duplicated_constant = duplicate_shared_constants(
|
| 108 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 109 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/utils.py", line 546, in duplicate_shared_constants
|
| 110 |
+
values=tensor.values,
|
| 111 |
+
^^^^^^^^^^^^^
|
| 112 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx_graphsurgeon/ir/tensor.py", line 391, in values
|
| 113 |
+
self._values = self._values.load()
|
| 114 |
+
^^^^^^^^^^^^^^^^^^^
|
| 115 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx_graphsurgeon/ir/tensor.py", line 257, in load
|
| 116 |
+
return np.array(onnx.numpy_helper.to_array(self.tensor))
|
| 117 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 118 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx/numpy_helper.py", line 414, in to_array
|
| 119 |
+
onnx.external_data_helper.load_external_data_for_tensor(tensor, base_dir)
|
| 120 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx/external_data_helper.py", line 53, in load_external_data_for_tensor
|
| 121 |
+
external_data_file_path = c_checker._resolve_external_data_location( # type: ignore[attr-defined]
|
| 122 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 123 |
+
onnx.onnx_cpp2py_export.checker.ValidationError: Data of TensorProto ( tensor name: onnx::Mul_32598) should be stored in vaedecode_fp8ization_wan21_fixed_static.onnx_data, but it doesn't exist or is not accessible.
|
| 124 |
+
|
| 125 |
+
[2026-01-09 23:40:24] [WARN] Python API not used: ModelOpt Python API failed: Data of TensorProto ( tensor name: onnx::Mul_32598) should be stored in vaedecode_fp8ization_wan21_fixed_static.onnx_data, but it doesn't exist or is not accessible.
|
| 126 |
+
[2026-01-09 23:40:24] [INFO] ModelOpt CLI command:
|
| 127 |
+
/opt/venv/bin/python -m modelopt.onnx.quantization --onnx_path /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fixed.onnx --quantize_mode fp8 --calibration_method entropy --calibration_data_path /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_calib_latent_64.npz --calibration_eps cpu --override_shapes latent:1x16x11x72x42 --output_path /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fp8_quant.onnx --log_level INFO --log_file /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_modelopt_fp8.log --use_external_data_format --keep_intermediate_files --disable_mha_qdq --dq_only --calibrate_per_node --high_precision_dtype fp32
|
| 128 |
+
[2026-01-09 23:40:40] [INFO] ModelOpt CLI returncode: 1
|
| 129 |
+
[2026-01-09 23:40:40] [INFO] ModelOpt CLI stdout (tail):
|
| 130 |
+
[modelopt][onnx] - INFO - Starting quantization process for model: /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fixed.onnx
|
| 131 |
+
[modelopt][onnx] - INFO - Quantization mode: fp8
|
| 132 |
+
[modelopt][onnx] - INFO - Preprocessing the model /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fixed.onnx
|
| 133 |
+
[modelopt][onnx] - INFO - Model has dynamic inputs: ['latent']
|
| 134 |
+
[modelopt][onnx] - INFO - Setting 'latent' shape to [1, 16, 11, 72, 42]
|
| 135 |
+
[modelopt][onnx] - INFO - Found 0 custom layers and 52764 tensors
|
| 136 |
+
[modelopt][onnx] - INFO - No custom ops found. If that's not correct, please make sure that the 'tensorrt' python package is correctly installed and that the paths to 'libcudnn*.so' and TensorRT 'lib/' are in 'LD_LIBRARY_PATH'. If the custom op is not directly available as a plugin in TensorRT, please also make sure that the path to the compiled '.so' TensorRT plugin is also being given via the '--trt_plugins' flag (requires TRT 10+).
|
| 137 |
+
[modelopt][onnx] - INFO - Duplicating shared constants
|
| 138 |
+
|
| 139 |
+
[2026-01-09 23:40:40] [WARN] ModelOpt CLI stderr (tail):
|
| 140 |
+
Traceback (most recent call last):
|
| 141 |
+
File "<frozen runpy>", line 198, in _run_module_as_main
|
| 142 |
+
File "<frozen runpy>", line 88, in _run_code
|
| 143 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/__main__.py", line 305, in <module>
|
| 144 |
+
main()
|
| 145 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/__main__.py", line 271, in main
|
| 146 |
+
quantize(
|
| 147 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/quantize.py", line 413, in quantize
|
| 148 |
+
) = _preprocess_onnx(
|
| 149 |
+
^^^^^^^^^^^^^^^^^
|
| 150 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/quantize.py", line 166, in _preprocess_onnx
|
| 151 |
+
onnx_model, is_duplicated_constant = duplicate_shared_constants(
|
| 152 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 153 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/utils.py", line 546, in duplicate_shared_constants
|
| 154 |
+
values=tensor.values,
|
| 155 |
+
^^^^^^^^^^^^^
|
| 156 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx_graphsurgeon/ir/tensor.py", line 391, in values
|
| 157 |
+
self._values = self._values.load()
|
| 158 |
+
^^^^^^^^^^^^^^^^^^^
|
| 159 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx_graphsurgeon/ir/tensor.py", line 257, in load
|
| 160 |
+
return np.array(onnx.numpy_helper.to_array(self.tensor))
|
| 161 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 162 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx/numpy_helper.py", line 414, in to_array
|
| 163 |
+
onnx.external_data_helper.load_external_data_for_tensor(tensor, base_dir)
|
| 164 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx/external_data_helper.py", line 53, in load_external_data_for_tensor
|
| 165 |
+
external_data_file_path = c_checker._resolve_external_data_location( # type: ignore[attr-defined]
|
| 166 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 167 |
+
onnx.onnx_cpp2py_export.checker.ValidationError: Data of TensorProto ( tensor name: onnx::Mul_32598) should be stored in vaedecode_fp8ization_wan21_fixed_static.onnx_data, but it doesn't exist or is not accessible.
|
| 168 |
+
|
| 169 |
+
[2026-01-09 23:40:40] [ERROR] ModelOpt CLI failed (returncode=1)
|
| 170 |
+
[2026-01-09 23:40:40] [ERROR] ModelOpt output tail:
|
| 171 |
+
[modelopt][onnx] - INFO - Starting quantization process for model: /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fixed.onnx
|
| 172 |
+
[modelopt][onnx] - INFO - Quantization mode: fp8
|
| 173 |
+
[modelopt][onnx] - INFO - Preprocessing the model /ComfyUI/output/wan21_work_20260109_233933_0eee5653_e567f199/vaedecode_fp8ization_wan21_fixed.onnx
|
| 174 |
+
[modelopt][onnx] - INFO - Model has dynamic inputs: ['latent']
|
| 175 |
+
[modelopt][onnx] - INFO - Setting 'latent' shape to [1, 16, 11, 72, 42]
|
| 176 |
+
[modelopt][onnx] - INFO - Found 0 custom layers and 52764 tensors
|
| 177 |
+
[modelopt][onnx] - INFO - No custom ops found. If that's not correct, please make sure that the 'tensorrt' python package is correctly installed and that the paths to 'libcudnn*.so' and TensorRT 'lib/' are in 'LD_LIBRARY_PATH'. If the custom op is not directly available as a plugin in TensorRT, please also make sure that the path to the compiled '.so' TensorRT plugin is also being given via the '--trt_plugins' flag (requires TRT 10+).
|
| 178 |
+
[modelopt][onnx] - INFO - Duplicating shared constants
|
| 179 |
+
|
| 180 |
+
Traceback (most recent call last):
|
| 181 |
+
File "<frozen runpy>", line 198, in _run_module_as_main
|
| 182 |
+
File "<frozen runpy>", line 88, in _run_code
|
| 183 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/__main__.py", line 305, in <module>
|
| 184 |
+
main()
|
| 185 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/__main__.py", line 271, in main
|
| 186 |
+
quantize(
|
| 187 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/quantize.py", line 413, in quantize
|
| 188 |
+
) = _preprocess_onnx(
|
| 189 |
+
^^^^^^^^^^^^^^^^^
|
| 190 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/quantization/quantize.py", line 166, in _preprocess_onnx
|
| 191 |
+
onnx_model, is_duplicated_constant = duplicate_shared_constants(
|
| 192 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 193 |
+
File "/opt/venv/lib/python3.12/site-packages/modelopt/onnx/utils.py", line 546, in duplicate_shared_constants
|
| 194 |
+
values=tensor.values,
|
| 195 |
+
^^^^^^^^^^^^^
|
| 196 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx_graphsurgeon/ir/tensor.py", line 391, in values
|
| 197 |
+
self._values = self._values.load()
|
| 198 |
+
^^^^^^^^^^^^^^^^^^^
|
| 199 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx_graphsurgeon/ir/tensor.py", line 257, in load
|
| 200 |
+
return np.array(onnx.numpy_helper.to_array(self.tensor))
|
| 201 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 202 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx/numpy_helper.py", line 414, in to_array
|
| 203 |
+
onnx.external_data_helper.load_external_data_for_tensor(tensor, base_dir)
|
| 204 |
+
File "/opt/venv/lib/python3.12/site-packages/onnx/external_data_helper.py", line 53, in load_external_data_for_tensor
|
| 205 |
+
external_data_file_path = c_checker._resolve_external_data_location( # type: ignore[attr-defined]
|
| 206 |
+
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
| 207 |
+
onnx.onnx_cpp2py_export.checker.ValidationError: Data of TensorProto ( tensor name: onnx::Mul_32598) should be stored in vaedecode_fp8ization_wan21_fixed_static.onnx_data, but it doesn't exist or is not accessible.
|
| 208 |
+
|
| 209 |
+
[2026-01-09 23:40:40] [INFO] === RUN END ===
|