HuggingFaceM4
/

tiny-random-siglip

Zero-Shot Image Classification

Model card Files Files and versions

VictorSanh committed on Jan 31, 2024

Commit

1f50acd

·

1 Parent(s): 2ca24ef

fix ops

Files changed (1) hide show

modeling_siglip.py +5 -4

modeling_siglip.py CHANGED Viewed

@@ -95,11 +95,12 @@ def _trunc_normal_(tensor, mean, std, a, b):
     # Use inverse cdf transform for normal distribution to get truncated
     # standard normal
-    if tensor.dtype == torch.float16:
-        # The `erfinv_` op is not (yet?) defined in float16
         tensor = tensor.to(torch.float32)
         tensor.erfinv_()
-        tensor = tensor.to(torch.float16)
     else:
         tensor.erfinv_()
@@ -109,7 +110,7 @@ def _trunc_normal_(tensor, mean, std, a, b):
     # Clamp to ensure it's in the proper range
     if tensor.dtype == torch.float16:
-        # The `clamp_` op is not (yet?) defined in float16
         tensor = tensor.to(torch.float32)
         tensor.clamp_(min=a, max=b)
         tensor = tensor.to(torch.float16)

     # Use inverse cdf transform for normal distribution to get truncated
     # standard normal
+    if tensor.dtype in [torch.float16, torch.bfloat16]:
+        # The `erfinv_` op is not (yet?) defined in float16+cpu, bfloat16+gpu
+        og_dtype = tensor.dtype
         tensor = tensor.to(torch.float32)
         tensor.erfinv_()
+        tensor = tensor.to(og_dtype)
     else:
         tensor.erfinv_()
     # Clamp to ensure it's in the proper range
     if tensor.dtype == torch.float16:
+        # The `clamp_` op is not (yet?) defined in float16+cpu
         tensor = tensor.to(torch.float32)
         tensor.clamp_(min=a, max=b)
         tensor = tensor.to(torch.float16)