Commit e92c721

Implemented RCEIL (CUBLAS-style) MXFP scale factor derivation, with test cases. (#1835)
1 parent: 7bb7f23
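
In MX formats, every block of elements shares one power-of-two scale, stored as a biased E8M0 exponent. The default FLOOR mode derives that scale from the floored exponent of the block's amax; the RCEIL mode added here instead follows the cuBLAS-style recipe of rounding amax divided by the destination format's maximum value (448 for float8_e4m3fn) up to the next power of two, which keeps every scaled element representable in the element dtype.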

File tree: 2 files changed (+348, -89 lines)
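Before the diff, here is a rough sketch of what RCEIL computes per block. This is a minimal illustration, not the commit's implementation: rceil_scale_e8m0 is a hypothetical helper, the log2 formulation stands in for what is more likely direct exponent-bit manipulation, and the NaN/zero special cases are inferred from the ground-truth values in the new test.

    import torch

    E4M3_MAX = 448.0  # largest finite float8_e4m3fn magnitude
    E8M0_BIAS = 127   # bias of the shared E8M0 block-scale exponent

    def rceil_scale_e8m0(block_hp: torch.Tensor) -> torch.Tensor:
        # Hypothetical helper; returns the biased E8M0 scale exponent as uint8.
        amax = block_hp.abs().amax()
        if torch.isnan(amax):
            # E8M0 has no sign or mantissa bits; 255 encodes NaN.
            return torch.tensor([255], dtype=torch.uint8)
        if amax == 0:
            return torch.tensor([0], dtype=torch.uint8)  # smallest scale, 2**-127
        # RCEIL: round amax / destmax up to the next power of two, so that
        # amax / scale can never overflow the element dtype.
        unbiased = torch.ceil(torch.log2(amax.float() / E4M3_MAX))
        return torch.clamp(unbiased + E8M0_BIAS, 0, 254).to(torch.uint8).reshape(1)

One detail the sketch does not model: the denorm test cases below show fp32/bf16 denormal inputs quantizing to all zeros, i.e., the real implementation effectively flushes high-precision denorms.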

test/prototype/mx_formats/test_mx_tensor.py (+204 lines)
@@ -1,4 +1,5 @@
 # Copyright (c) Meta Platforms, Inc. and affiliates.
+# Copyright (c) 2025, NVIDIA CORPORATION.
 # All rights reserved.
 
 # This source code is licensed under the license found in the
@@ -105,6 +106,209 @@ def test_some_zeros(elem_dtype):
     _test_mx(data, elem_dtype, block_size)
 
 
+@pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
+def test_to_mx_rceil():
+    # nan
+    # fmt: off
+    data_hp = torch.tensor(
+        [
+            2143289344, 1054459450, 1060527345, 1045656552, 1058239340, 1045057552, 1061158006, 1049626606,
+            1052757568, 1032293288, 1056992320, 1064929425, 1061036255, 1047450552, 1057077424, 1055125012,
+            1036491424, 1063542041, 1057099838, 1058731224, 1050189482, 1049114228, 1058347802, 1060065968,
+            1058846156, 1048878912, 1065109089, 1054494928, 1044803976, 1049117692, 1065222528, 1056965012,
+        ],
+        dtype=torch.uint32,
+    ).view(torch.float32)
+    # fmt: on
+    ground_truth_scale = torch.tensor([255], dtype=torch.uint8)
+    # fmt: off
+    ground_truth_fp8 = torch.tensor(
+        [
+            127, 0, 0, 0, 0, 0, 0, 0,
+            0, 0, 0, 0, 0, 0, 0, 0,
+            0, 0, 0, 0, 0, 0, 0, 0,
+            0, 0, 0, 0, 0, 0, 0, 0,
+        ],
+        dtype=torch.uint8,
+    ).view(torch.float8_e4m3fn)
+    # fmt: on
+    data_mx = MXTensor.to_mx(
+        data_hp, torch.float8_e4m3fn, 32, ScaleCalculationMode.RCEIL
+    )
+    torch.testing.assert_close(data_mx._scale_e8m0, ground_truth_scale)
+    assert torch.isnan(data_mx._data[0])
+    assert torch.all(data_mx._data[1:] == 0)
+    # fp32 denorm
+    # fmt: off
+    data_hp = torch.tensor(
+        [
+            6142315, 5096174, 3345704, 6178415, 5728750, 419002, 1716691, 4335089,
+            5785800, 6234845, 1697524, 33075, 3975816, 3714822, 5411407, 3040844,
+            7400945, 4474166, 7257182, 1273750, 5872176, 4694081, 2096530, 6273621,
+            67028, 7585260, 4532315, 4599275, 6133942, 4542483, 5992199, 6862780,
+        ],
+        dtype=torch.uint32,
+    ).view(torch.float32)
+    # fmt: on
+    ground_truth_scale = torch.tensor([0], dtype=torch.uint8)
+    ground_truth_fp8 = torch.tensor([0] * 32, dtype=torch.uint8).view(
+        torch.float8_e4m3fn
+    )
+    data_mx = MXTensor.to_mx(
+        data_hp, torch.float8_e4m3fn, 32, ScaleCalculationMode.RCEIL
+    )
+    torch.testing.assert_close(data_mx._scale_e8m0, ground_truth_scale)
+    torch.testing.assert_close(data_mx._data, ground_truth_fp8)
+    # bf16 denorm
+    # fmt: off
+    data_hp = torch.tensor(
+        [
+            101, 3, 47, 54, 36, 19, 70, 79,
+            35, 95, 28, 120, 84, 94, 20, 92,
+            18, 42, 98, 58, 3, 26, 64, 86,
+            60, 86, 52, 23, 61, 70, 59, 74,
+        ],
+        dtype=torch.uint16,
+    ).view(torch.bfloat16)
+    # fmt: on
+    ground_truth_scale = torch.tensor([0], dtype=torch.uint8)
+    ground_truth_fp8 = torch.tensor([0] * 32, dtype=torch.uint8).view(
+        torch.float8_e4m3fn
+    )
+    data_mx = MXTensor.to_mx(
+        data_hp, torch.float8_e4m3fn, 32, ScaleCalculationMode.RCEIL
+    )
+    torch.testing.assert_close(data_mx._scale_e8m0, ground_truth_scale)
+    torch.testing.assert_close(data_mx._data, ground_truth_fp8)
+    # fp32 some denorm
+    # fmt: off
+    data_hp = torch.tensor(
+        [
+            8388608, 1063716449, 1064039365, 1063568877, 1051091338, 1062185569, 1034449408, 1060813641,
+            1054893736, 1034907680, 1036660744, 1023639888, 1058536559, 1050896496, 1049237634, 1064950601,
+            1051852994, 1059794063, 1054011102, 1062023602, 1059467900, 1062276774, 1059155029, 1053287574,
+            1064378711, 1055768540, 1045266076, 1059575077, 1054928758, 1040468200, 1058061961, 1053066436,
+        ],
+        dtype=torch.uint32,
+    ).view(torch.float32)
+    # fmt: on
+    ground_truth_scale = torch.tensor([119], dtype=torch.uint8)
+    # fmt: off
+    ground_truth_fp8 = torch.tensor(
+        [
+            0, 118, 119, 118, 106, 117, 91, 116,
+            110, 91, 93, 80, 113, 106, 105, 120,
+            107, 115, 109, 117, 114, 117, 114, 108,
+            119, 111, 101, 114, 110, 96, 113, 108,
+        ],
+        dtype=torch.uint8,
+    ).view(torch.float8_e4m3fn)
+    # fmt: on
+    data_mx = MXTensor.to_mx(
+        data_hp, torch.float8_e4m3fn, 32, ScaleCalculationMode.RCEIL
+    )
+    torch.testing.assert_close(data_mx._scale_e8m0, ground_truth_scale)
+    torch.testing.assert_close(data_mx._data, ground_truth_fp8)
+    # bf16 some denorm
+    # fmt: off
+    data_hp = torch.tensor(
+        [
+            128, 16118, 16143, 16074, 16187, 16002, 16193, 16217,
+            15680, 16183, 16092, 16158, 16251, 15876, 15896, 16194,
+            16135, 16214, 16205, 16110, 16122, 15960, 15824, 16106,
+            16220, 16230, 15952, 15896, 16000, 16144, 16232, 16157,
+        ],
+        dtype=torch.uint16,
+    ).view(torch.bfloat16)
+    # fmt: on
+    ground_truth_scale = torch.tensor([119], dtype=torch.uint8)
+    # fmt: off
+    ground_truth_fp8 = torch.tensor(
+        [
+            0, 111, 113, 109, 116, 104, 116, 118,
+            84, 115, 110, 114, 120, 96, 98, 116,
+            112, 117, 117, 111, 112, 102, 93, 111,
+            118, 118, 101, 98, 104, 113, 118, 114,
+        ],
+        dtype=torch.uint8,
+    ).view(torch.float8_e4m3fn)
+    # fmt: on
+    data_mx = MXTensor.to_mx(
+        data_hp, torch.float8_e4m3fn, 32, ScaleCalculationMode.RCEIL
+    )
+    torch.testing.assert_close(data_mx._scale_e8m0, ground_truth_scale)
+    torch.testing.assert_close(data_mx._data, ground_truth_fp8)
+    # zero
+    data_hp = torch.tensor([0] * 32, dtype=torch.uint32).view(torch.float32)
+    ground_truth_scale = torch.tensor([0], dtype=torch.uint8)
+    ground_truth_fp8 = torch.tensor([0] * 32, dtype=torch.uint8).view(
+        torch.float8_e4m3fn
+    )
+    data_mx = MXTensor.to_mx(
+        data_hp, torch.float8_e4m3fn, 32, ScaleCalculationMode.RCEIL
+    )
+    torch.testing.assert_close(data_mx._scale_e8m0, ground_truth_scale)
+    torch.testing.assert_close(data_mx._data, ground_truth_fp8)
+    # fp32 normal
+    # fmt: off
+    data_hp = torch.tensor(
+        [
+            1037408064, 1058534842, 1053630662, 1063310394, 994704128, 1057245441, 1060663708, 1058053571,
+            1052395648, 1064831570, 1038427336, 1064777688, 1059248393, 1060959028, 1062878286, 1057799482,
+            1057854101, 1053562724, 1027482352, 1060498324, 1063238522, 1060472055, 1054346794, 1029092912,
+            1056687298, 1059146141, 1037992128, 1064097772, 1056522806, 1059255744, 1064364912, 1060606252,
+        ],
+        dtype=torch.uint32,
+    ).view(torch.float32)
+    # fmt: on
+    ground_truth_scale = torch.tensor([119], dtype=torch.uint8)
+    # fmt: off
+    ground_truth_fp8 = torch.tensor(
+        [
+            93, 113, 109, 118, 53, 112, 116, 113,
+            108, 120, 94, 119, 114, 116, 118, 113,
+            113, 109, 84, 115, 118, 115, 110, 85,
+            112, 114, 94, 119, 112, 114, 119, 115,
+        ],
+        dtype=torch.uint8,
+    ).view(torch.float8_e4m3fn)
+    # fmt: on
+    data_mx = MXTensor.to_mx(
+        data_hp, torch.float8_e4m3fn, 32, ScaleCalculationMode.RCEIL
+    )
+    torch.testing.assert_close(data_mx._scale_e8m0, ground_truth_scale)
+    torch.testing.assert_close(data_mx._data, ground_truth_fp8)
+    # bf16 normal
+    # fmt: off
+    data_hp = torch.tensor(
+        [
+            15752, 16143, 16182, 15896, 16195, 16186, 16048, 16223,
+            15988, 16231, 16140, 16088, 16032, 16240, 16228, 16133,
+            16210, 16024, 16248, 16187, 16050, 15696, 16060, 15956,
+            16131, 16251, 15896, 16014, 15808, 16024, 16159, 16186,
+        ],
+        dtype=torch.uint16,
+    ).view(torch.bfloat16)
+    # fmt: on
+    ground_truth_scale = torch.tensor([119], dtype=torch.uint8)
+    # fmt: off
+    ground_truth_fp8 = torch.tensor(
+        [
+            88, 113, 115, 98, 116, 116, 107, 118,
+            103, 118, 113, 110, 106, 119, 118, 112,
+            117, 106, 120, 116, 107, 85, 108, 101,
+            112, 120, 98, 105, 92, 106, 114, 116,
+        ],
+        dtype=torch.uint8,
+    ).view(torch.float8_e4m3fn)
+    # fmt: on
+    data_mx = MXTensor.to_mx(
+        data_hp, torch.float8_e4m3fn, 32, ScaleCalculationMode.RCEIL
+    )
+    torch.testing.assert_close(data_mx._scale_e8m0, ground_truth_scale)
+    torch.testing.assert_close(data_mx._data, ground_truth_fp8)
+
+
 @pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
 @pytest.mark.parametrize("elem_dtype", SUPPORTED_ELEM_DTYPES)
 def test_exponent_nan_in(elem_dtype):
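
For a spot check of the ground-truth scales above, a small standalone verification (not part of the commit): bit pattern 1064831570 is the largest magnitude in the "fp32 normal" block.

    import math
    import struct

    # Reinterpret the uint32 bit pattern as a float32, as the test's .view() does.
    amax = struct.unpack("f", struct.pack("I", 1064831570))[0]  # ~0.9689
    unbiased = math.ceil(math.log2(amax / 448.0))               # ceil(-8.85...) == -8
    assert unbiased + 127 == 119  # matches that case's ground_truth_scale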
