Update modular_openpangu_dense.py
Browse files
modular_openpangu_dense.py
CHANGED
|
@@ -24,12 +24,13 @@ from typing import Callable, Optional, Tuple
|
|
| 24 |
import torch
|
| 25 |
from torch import nn
|
| 26 |
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
|
|
|
| 33 |
NPU_ATTN_INFR = False
|
| 34 |
|
| 35 |
from transformers.cache_utils import Cache
|
|
|
|
| 24 |
import torch
|
| 25 |
from torch import nn
|
| 26 |
|
| 27 |
+
try:
|
| 28 |
+
import torch_npu
|
| 29 |
+
from torch_npu.contrib import transfer_to_npu
|
| 30 |
+
if "910" in torch.npu.get_device_name():
|
| 31 |
+
NPU_ATTN_INFR = True
|
| 32 |
+
print("[INFO] torch_npu detected. Using NPU fused infer attention.")
|
| 33 |
+
except ImportError:
|
| 34 |
NPU_ATTN_INFR = False
|
| 35 |
|
| 36 |
from transformers.cache_utils import Cache
|