Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[Bug Fixed] scale=INF when casting a tensor to scaling FP32/BF16 tensors #131

Merged
merged 4 commits into from
Nov 28, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
11 changes: 7 additions & 4 deletions msamp/common/tensor/meta.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,7 @@
import copy
import torch

from msamp.common.dtype import Floating
from msamp.common.dtype import Floating, Dtypes


class ScalingMeta:
Expand Down Expand Up @@ -104,9 +104,12 @@ def reset_scaling_factor(self, qtype=None):
if qtype is None:
qtype = self.qtype

fp_max = Floating.qfp_max[qtype]
sf = ScalingMeta.compute_scaling_factor(self.amax[0], self.scale, fp_max, 0)
self.scale.copy_(sf)
if qtype in [Dtypes.kfloat32, Dtypes.kbfloat16]:
self.scale.fill_(1)
else:
fp_max = Floating.qfp_max[qtype]
sf = ScalingMeta.compute_scaling_factor(self.amax[0], self.scale, fp_max, 0)
self.scale.copy_(sf)

def copy_(self, src):
"""Copies the members from src into self and returns self.
Expand Down
9 changes: 9 additions & 0 deletions tests/common/tensor/test_tensor.py
Original file line number Diff line number Diff line change
Expand Up @@ -154,6 +154,15 @@ def _allclose(input, other):
# check if tensor is not changed
self.assertTrue(torch.equal(tensor, tensor_bak))

@decorator.cuda_test
def test_tensor_cast_to_scaling_fp32(self):
    """Cast a float32 tensor to ScalingFP32/ScalingBF16 and check it round-trips exactly.

    Regression test for the scale=INF bug: casting to Dtypes.kfloat32 /
    Dtypes.kbfloat16 must use scale=1 so the value survives unchanged.
    1/512 is exactly representable in both float32 and bfloat16, so the
    round-trip through .float() must be bit-exact.
    """
    for dtype in [Dtypes.kfloat32, Dtypes.kbfloat16]:
        with self.subTest(dtype=dtype):
            x = torch.tensor([1.0 / 512], dtype=torch.float32, device=self.device)
            y = x.cast(dtype)
            # torch.equal (not `assertTrue(x == y)`) — implicit bool() on a
            # tensor only works for 1-element tensors and would break if this
            # test is ever extended to multi-element inputs; matches the
            # torch.equal convention used elsewhere in this file.
            self.assertTrue(torch.equal(x, y.float()))

@decorator.cuda_test
def test_tensor_cast_with_exception_value(self):
"""Test cast function in ScalingTensor with exception value."""
Expand Down
Loading