Commit
·
c506c42
1
Parent(s):
8e1346e
dummy test
Browse files
- modeling_vmistral.py +1 -0
modeling_vmistral.py
CHANGED
@@ -824,6 +824,7 @@ class MistralFlashAttention2(MistralAttention):
|
|
824 |
use_cache: bool = False,
|
825 |
**kwargs,
|
826 |
):
|
|
|
827 |
if "padding_mask" in kwargs:
|
828 |
warnings.warn(
|
829 |
"Passing `padding_mask` is deprecated and will be removed in v4.37. Please make sure use"
|
|
|
824 |
use_cache: bool = False,
|
825 |
**kwargs,
|
826 |
):
|
827 |
+
print("using flash attention")
|
828 |
if "padding_mask" in kwargs:
|
829 |
warnings.warn(
|
830 |
"Passing `padding_mask` is deprecated and will be removed in v4.37. Please make sure use"
|