/******************************************************************************* * Copyright 2023-2024 Intel Corporation * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. *******************************************************************************/ #include #include "dnnl_test_common.hpp" #include "gtest/gtest.h" #include "tests/test_isa_common.hpp" #include "src/common/bit_cast.hpp" #include "src/common/float8.hpp" using dnnl::impl::utils::bit_cast; namespace dnnl { TEST(test_ref_float8_conversions, f8_e5m2_to_f32) { SKIP_IF(!impl::cpu::platform::has_data_type_support( impl::data_type::f8_e5m2), "Engine does not support this data type."); // check all 256 f8_e5m2 values impl::parallel_nd(0xff, [&](uint16_t u16) { // convert f8_e5m2 to f32 and back again, // expecting bitwise idendical values except for sNaN, // where the convention is to set the quiet bit: // * +sNaN: 0x7d -> 0x7f // * -sNaN: 0xfd -> 0xff // f8_e5m2 encoding: seeeeemm // |_-> quiet bit is msb of mantissa uint8_t u8 = static_cast(u16); constexpr bool is_bitcast = true; float8_e5m2_t x8(u8, is_bitcast); ASSERT_EQ(u8, x8.raw_bits_); ASSERT_EQ(u8, bit_cast(x8)); float x32(x8); float8_e5m2_t y8(x32); // if x8 is an sNaN the conversion sets the quiet bit (msb of mantissa) const bool is_x8_snan = impl::utils::one_of(u8, 0x7d, 0xfd); const uint8_t y8_expect = is_x8_snan ? u8 | 0x02 : u8; ASSERT_EQ(y8_expect, bit_cast(y8)); }); } TEST(test_ref_float8_conversions, f8_e4m3_to_f32) { SKIP_IF(!impl::cpu::platform::has_data_type_support( impl::data_type::f8_e4m3), "Engine does not support this data type."); // check all 256 f8_e4m3 values impl::parallel_nd(0xff, [&](uint16_t u16) { uint8_t u8 = static_cast(u16); constexpr bool is_bitcast = true; float8_e4m3_t x8(u8, is_bitcast); ASSERT_EQ(u8, x8.raw_bits_); ASSERT_EQ(u8, bit_cast(x8)); // convert f8_e4m3 to f32 and back again, // expecting bitwise idendical values. // Note: f8_e4m3 does not have sNaN values, so no need to set quiet bit float x32(x8); float8_e4m3_t y8(x32); const uint8_t y8_expect = u8; ASSERT_EQ(y8_expect, bit_cast(y8)) << std::hex << std::endl << "u8 = " << static_cast(u8) << std::endl << "x8.raw_bits_ = " << static_cast(bit_cast(x8)) << std::endl << "y8.raw_bits_ = " << static_cast(bit_cast(y8)) << std::endl << "y8_expect = " << static_cast(y8_expect) << std::endl << std::dec; }); } TEST(test_ref_float8_conversions, f32_to_f8_e4m3) { SKIP_IF(!impl::cpu::platform::has_data_type_support( impl::data_type::f8_e4m3), "Engine does not support this data type."); // check all 2^32 f32 values impl::parallel_nd(0x100000000, [&](int64_t s64) { uint32_t u32 = static_cast(s64); float x32 = bit_cast(u32); ASSERT_EQ(u32, bit_cast(x32)); float16_t x16(x32); float8_e4m3_t x8_from_x16(x16); float8_e4m3_t x8_from_x32(x32); // check for double rounding ASSERT_EQ(x8_from_x16.raw_bits_, x8_from_x32.raw_bits_) << std::hex << std::endl << "x32 (raw bits) = " << bit_cast(x32) << std::endl << "x16 (raw bits) = " << bit_cast(x16) << std::endl << "x8_from_x16 (raw bits) = " << static_cast(bit_cast(x8_from_x16)) << std::endl << "x8_from_x32 (raw_bits) = " << static_cast(bit_cast(x8_from_x32)) << std::endl << std::dec; }); } #if DNNL_X64 TEST(test_jit_float8_conversions, f8_e5m2_to_f32) { SKIP_IF(!impl::cpu::platform::has_data_type_support( impl::data_type::f8_e5m2), "Engine does not support this data type."); // check all 2^8 fp8 values impl::parallel_nd(0xff, [&](uint16_t u16) { // convert from f8_e5m2 to f32 using ref and jit converters uint8_t u8 = static_cast(u16); constexpr bool is_bitcast = true; float8_e5m2_t x8(u8, is_bitcast); ASSERT_EQ(u8, x8.raw_bits_); ASSERT_EQ(u8, bit_cast(x8)); float16_t ref_x16 = x8; float16_t jit_x16; // can only fail if data type not supported ASSERT_TRUE(impl::cpu::x64::try_cvt_f8_e5m2_to_f16(&jit_x16, &x8)); // expect bitwise identical results ASSERT_EQ(bit_cast(ref_x16), bit_cast(jit_x16)) << std::hex << std::endl << "x8.raw_bits_ = " << static_cast(u8) << std::endl << "ref_x16.raw_bits_ = " << bit_cast(ref_x16) << std::endl << "jit_x16.raw_bits_ = " << bit_cast(jit_x16) << std::endl << std::dec; float ref_x32 = static_cast(x8); float jit_x32; // can only fail if data type not supported ASSERT_TRUE(impl::cpu::x64::try_cvt_f8_e5m2_to_f32(&jit_x32, &x8)); // expect bitwise identical results ASSERT_EQ(bit_cast(ref_x32), bit_cast(jit_x32)) << std::hex << std::endl << "x8.raw_bits_ = " << static_cast(u8) << std::endl << "ref_x32.raw_bits_ = " << bit_cast(ref_x32) << std::endl << "jit_x32.raw_bits_ = " << bit_cast(jit_x32) << std::endl << std::dec; }); } TEST(test_jit_float8_conversions, f8_e4m3_to_f32) { SKIP_IF(!impl::cpu::platform::has_data_type_support( impl::data_type::f8_e4m3), "Engine does not support this data type."); // check all 2^8 fp8 values impl::parallel_nd(0xff, [&](uint16_t u16) { // convert from f8_e4m3 to f32 using ref and jit converters uint8_t u8 = static_cast(u16); constexpr bool is_bitcast = true; float8_e4m3_t x8(u8, is_bitcast); ASSERT_EQ(u8, x8.raw_bits_); ASSERT_EQ(u8, bit_cast(x8)); float16_t ref_x16 = x8; float16_t jit_x16; // can only fail if data type not supported ASSERT_TRUE(impl::cpu::x64::try_cvt_f8_e4m3_to_f16(&jit_x16, &x8)); // expect bitwise identical results ASSERT_EQ(bit_cast(ref_x16), bit_cast(jit_x16)) << std::hex << std::endl << "x8.raw_bits_ = " << static_cast(u8) << std::endl << "ref_x16.raw_bits_ = " << bit_cast(ref_x16) << std::endl << "jit_x16.raw_bits_ = " << bit_cast(jit_x16) << std::endl << std::dec; float ref_x32 = static_cast(x8); float jit_x32; // can only fail if data type not supported ASSERT_TRUE(impl::cpu::x64::try_cvt_f8_e4m3_to_f32(&jit_x32, &x8)); // expect bitwise identical results ASSERT_EQ(bit_cast(ref_x32), bit_cast(jit_x32)) << std::hex << std::endl << "x8.raw_bits_ = " << static_cast(u8) << std::endl << "ref_x32.raw_bits_ = " << bit_cast(ref_x32) << std::endl << "jit_x32.raw_bits_ = " << bit_cast(jit_x32) << std::endl << std::dec; }); } TEST(test_jit_float8_conversions, f16_to_fp8) { const bool is_fp8_supported = impl::utils::everyone_is(true, impl::cpu::platform::has_data_type_support( impl::data_type::f8_e5m2), impl::cpu::platform::has_data_type_support( impl::data_type::f8_e4m3)); SKIP_IF(!is_fp8_supported, "Engine does not support this data type."); // check all 2^16 f16 values impl::parallel_nd(0xffff, [&](uint16_t u32) { uint16_t u16 = static_cast(u32); constexpr bool is_bitcast = true; auto x16 = float16_t(u16, is_bitcast); ASSERT_EQ(u16, x16.raw); ASSERT_EQ(u16, bit_cast(x16)); // convert from f16 to f8_e5m2 using ref and jit converters float8_e5m2_t ref_x8_e5m2 = x16; float8_e5m2_t jit_x8_e5m2; // can only fail if data type not supported ASSERT_TRUE(impl::cpu::x64::try_cvt_f16_to_f8_e5m2(&jit_x8_e5m2, &x16)); // expect bitwise identical results ASSERT_EQ( bit_cast(ref_x8_e5m2), bit_cast(jit_x8_e5m2)) << std::hex << std::endl << "x16.raw_bits_ = " << static_cast(u16) << std::endl << "ref_x8_e5m2.raw_bits_ = " << static_cast(bit_cast(ref_x8_e5m2)) << std::endl << "jit_x8_e5m2.raw_bits_ = " << static_cast(bit_cast(jit_x8_e5m2)) << std::endl << std::dec; // convert from f16 to f8_e4m3 using ref and jit converters float8_e4m3_t ref_x8_e4m3 = x16; float8_e4m3_t jit_x8_e4m3; // can only fail if data type not supported ASSERT_TRUE(impl::cpu::x64::try_cvt_f16_to_f8_e4m3(&jit_x8_e4m3, &x16)); // expect bitwise identical results ASSERT_EQ( bit_cast(ref_x8_e4m3), bit_cast(jit_x8_e4m3)) << std::hex << std::endl << "x16.raw_bits_ = " << static_cast(u16) << std::endl << "ref_x8_e4m3.raw_bits_ = " << static_cast(bit_cast(ref_x8_e4m3)) << std::endl << "jit_x8_e4m3.raw_bits_ = " << static_cast(bit_cast(jit_x8_e4m3)) << std::endl << std::dec; }); } TEST(test_f16_conversions, f16_to_f32) { SKIP_IF(!mayiuse(impl::cpu::x64::avx512_core_fp16), "Engine does not support this ISA."); // check all 2^16 f16 values impl::parallel_nd(0xffff, [&](uint16_t u32) { // convert from f16 to f32 using ref and jit converters uint16_t u16 = static_cast(u32); constexpr bool is_bitcast = true; auto x16 = float16_t(u16, is_bitcast); ASSERT_EQ(u16, x16.raw); ASSERT_EQ(u16, bit_cast(x16)); float ref_x32 = static_cast(x16); float jit_x32; // can only fail if data type not supported ASSERT_TRUE(impl::cpu::x64::try_cvt_f16_to_f32(&jit_x32, &x16)); // expect bitwise identical results ASSERT_EQ(bit_cast(ref_x32), bit_cast(jit_x32)) << std::hex << std::endl << "x16.raw_bits_ = " << static_cast(u16) << std::endl << "ref_x32.raw_bits_ = " << bit_cast(ref_x32) << std::endl << "jit_x32.raw_bits_ = " << bit_cast(jit_x32) << std::endl << std::dec; }); } #endif // DNNL_X64 } // namespace dnnl