bytedance-research/ChatTS-14B

Text Generation

feature-extraction

text-generation-inference

Model card | Files and versions | Community

Fix BF16 training

#19

by alexanderchemeris - opened Jun 3

base: refs/heads/main

←

from: refs/pr/19

Discussion Files changed

Files changed (1) hide show

modeling_qwen2.py +1 -1

modeling_qwen2.py CHANGED Viewed

@@ -131,7 +131,7 @@ class TimeSeriesEmbedding(nn.Module):
         x = x.reshape(batch_size, -1, self.num_features)
         mask = x[:, :, -1].long()
-        valid_lengths = mask.sum(dim=1).long()  # Shape: (batch_size)
+        valid_lengths = (mask > 0.5).long().sum(dim=1)  # Shape: (batch_size)
         patch_cnt = (valid_lengths + self.patch_size - 1) // self.patch_size  # 向上取整