Error: H-HIGH-H4_svd_fp32-s1
Browse files
H/HIGH/H4_svd_fp32/seed1_ERROR/error.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"config": {
|
| 3 |
+
"group": "H",
|
| 4 |
+
"variant": "H4_svd_fp32",
|
| 5 |
+
"band": "HIGH",
|
| 6 |
+
"seed": 1,
|
| 7 |
+
"phase": 2,
|
| 8 |
+
"num_epochs": 1,
|
| 9 |
+
"batch_size": 256,
|
| 10 |
+
"overrides": {
|
| 11 |
+
"svd": "fp32"
|
| 12 |
+
},
|
| 13 |
+
"description": "H-HIGH-H4_svd_fp32-s1"
|
| 14 |
+
},
|
| 15 |
+
"error": "cusolver error: CUSOLVER_STATUS_INVALID_VALUE, when calling `cusolverDnXsyevBatched_bufferSize( handle, params, jobz, uplo, n, CUDA_R_32F, reinterpret_cast<const void*>(A), lda, CUDA_R_32F, reinterpret_cast<const void*>(W), CUDA_R_32F, workspaceInBytesOnDevice, workspaceInBytesOnHost, batchSize)`. This error may appear if the input matrix contains NaN. If you keep seeing this error, you may use `torch.backends.cuda.preferred_linalg_library()` to try linear algebra operators with other supported backends. See https://pytorch.org/docs/stable/backends.html#torch.backends.cuda.preferred_linalg_library",
|
| 16 |
+
"traceback": "Traceback (most recent call last):\n File \"/tmp/ipykernel_4109/3798867187.py\", line 305, in run_phase2\n result = run_ablation_config(\n ^^^^^^^^^^^^^^^^^^^^\n File \"/tmp/ipykernel_4109/3142053339.py\", line 562, in run_ablation_config\n out = model(images)\n ^^^^^^^^^^^^^\n File \"/usr/local/lib/python3.12/dist-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n return self._call_impl(*args, **kwargs)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/usr/local/lib/python3.12/dist-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n return forward_call(*args, **kwargs)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/tmp/ipykernel_4109/2994023296.py\", line 408, in forward\n svd = self.encode_patches(patches)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/tmp/ipykernel_4109/3142053339.py\", line 166, in encode_patches\n eigenvalues, Vmat = torch.linalg.eigh(G)\n ^^^^^^^^^^^^^^^^^^^^\ntorch._C._LinAlgError: cusolver error: CUSOLVER_STATUS_INVALID_VALUE, when calling `cusolverDnXsyevBatched_bufferSize( handle, params, jobz, uplo, n, CUDA_R_32F, reinterpret_cast<const void*>(A), lda, CUDA_R_32F, reinterpret_cast<const void*>(W), CUDA_R_32F, workspaceInBytesOnDevice, workspaceInBytesOnHost, batchSize)`. This error may appear if the input matrix contains NaN. If you keep seeing this error, you may use `torch.backends.cuda.preferred_linalg_library()` to try linear algebra operators with other supported backends. See https://pytorch.org/docs/stable/backends.html#torch.backends.cuda.preferred_linalg_library\n",
|
| 17 |
+
"timestamp": "2026-04-21T18:55:57.520932"
|
| 18 |
+
}
|