Update modular_openpangu_dense.py
Browse files
modular_openpangu_dense.py
CHANGED
@@ -24,12 +24,13 @@ from typing import Callable, Optional, Tuple
|
|
24 |
import torch
|
25 |
from torch import nn
|
26 |
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
-
|
31 |
-
|
32 |
-
|
|
|
33 |
NPU_ATTN_INFR = False
|
34 |
|
35 |
from transformers.cache_utils import Cache
|
|
|
24 |
import torch
|
25 |
from torch import nn
|
26 |
|
27 |
+
# Feature flag: whether to use the NPU fused-inference attention path.
# Always define it up front so that it exists on every code path; the
# previous form left it unassigned when torch_npu imported successfully
# but the device name did not contain "910".
NPU_ATTN_INFR = False
try:
    import torch_npu
    # Imported for its import-time side effects only (the name is unused).
    # NOTE(review): presumably redirects CUDA-style torch calls to the NPU
    # backend -- confirm against the torch_npu documentation.
    from torch_npu.contrib import transfer_to_npu
except ImportError:
    # torch_npu is an optional dependency; without it keep the default.
    NPU_ATTN_INFR = False
else:
    # Only devices whose reported name contains "910" opt in to the fused path.
    if "910" in torch.npu.get_device_name():
        NPU_ATTN_INFR = True
        print("[INFO] torch_npu detected. Using NPU fused infer attention.")
|
35 |
|
36 |
from transformers.cache_utils import Cache
|