core/stdarch/crates/core_arch/src/x86/
f16c.rs1use crate::core_arch::{simd::*, x86::*};
6use crate::intrinsics::simd::*;
7
8#[cfg(test)]
9use stdarch_test::assert_instr;
10
11#[allow(improper_ctypes)]
12unsafe extern "unadjusted" {
13 #[link_name = "llvm.x86.vcvtps2ph.128"]
14 fn llvm_vcvtps2ph_128(a: f32x4, rounding: i32) -> i16x8;
15 #[link_name = "llvm.x86.vcvtps2ph.256"]
16 fn llvm_vcvtps2ph_256(a: f32x8, rounding: i32) -> i16x8;
17}
18
19#[inline]
25#[target_feature(enable = "f16c")]
26#[cfg_attr(test, assert_instr("vcvtph2ps"))]
27#[stable(feature = "x86_f16c_intrinsics", since = "1.68.0")]
28pub fn _mm_cvtph_ps(a: __m128i) -> __m128 {
29 unsafe {
30 let a: f16x8 = transmute(a);
31 let a: f16x4 = simd_shuffle!(a, a, [0, 1, 2, 3]);
32 simd_cast(a)
33 }
34}
35
36#[inline]
41#[target_feature(enable = "f16c")]
42#[cfg_attr(test, assert_instr("vcvtph2ps"))]
43#[stable(feature = "x86_f16c_intrinsics", since = "1.68.0")]
44pub fn _mm256_cvtph_ps(a: __m128i) -> __m256 {
45 unsafe {
46 let a: f16x8 = transmute(a);
47 simd_cast(a)
48 }
49}
50
51#[inline]
65#[target_feature(enable = "f16c")]
66#[cfg_attr(test, assert_instr("vcvtps2ph", IMM_ROUNDING = 0))]
67#[rustc_legacy_const_generics(1)]
68#[stable(feature = "x86_f16c_intrinsics", since = "1.68.0")]
69pub fn _mm_cvtps_ph<const IMM_ROUNDING: i32>(a: __m128) -> __m128i {
70 static_assert_uimm_bits!(IMM_ROUNDING, 3);
71 unsafe {
72 let a = a.as_f32x4();
73 let r = llvm_vcvtps2ph_128(a, IMM_ROUNDING);
74 transmute(r)
75 }
76}
77
78#[inline]
91#[target_feature(enable = "f16c")]
92#[cfg_attr(test, assert_instr("vcvtps2ph", IMM_ROUNDING = 0))]
93#[rustc_legacy_const_generics(1)]
94#[stable(feature = "x86_f16c_intrinsics", since = "1.68.0")]
95pub fn _mm256_cvtps_ph<const IMM_ROUNDING: i32>(a: __m256) -> __m128i {
96 static_assert_uimm_bits!(IMM_ROUNDING, 3);
97 unsafe {
98 let a = a.as_f32x8();
99 let r = llvm_vcvtps2ph_256(a, IMM_ROUNDING);
100 transmute(r)
101 }
102}
103
104#[cfg(test)]
105mod tests {
106 use crate::{core_arch::x86::*, mem::transmute};
107 use stdarch_test::simd_test;
108
109 const F16_ONE: i16 = 0x3c00;
110 const F16_TWO: i16 = 0x4000;
111 const F16_THREE: i16 = 0x4200;
112 const F16_FOUR: i16 = 0x4400;
113 const F16_FIVE: i16 = 0x4500;
114 const F16_SIX: i16 = 0x4600;
115 const F16_SEVEN: i16 = 0x4700;
116 const F16_EIGHT: i16 = 0x4800;
117
118 #[simd_test(enable = "f16c")]
119 unsafe fn test_mm_cvtph_ps() {
120 let a = _mm_set_epi16(0, 0, 0, 0, F16_ONE, F16_TWO, F16_THREE, F16_FOUR);
121 let r = _mm_cvtph_ps(a);
122 let e = _mm_set_ps(1.0, 2.0, 3.0, 4.0);
123 assert_eq_m128(r, e);
124 }
125
126 #[simd_test(enable = "f16c")]
127 unsafe fn test_mm256_cvtph_ps() {
128 let a = _mm_set_epi16(
129 F16_ONE, F16_TWO, F16_THREE, F16_FOUR, F16_FIVE, F16_SIX, F16_SEVEN, F16_EIGHT,
130 );
131 let r = _mm256_cvtph_ps(a);
132 let e = _mm256_set_ps(1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0);
133 assert_eq_m256(r, e);
134 }
135
136 #[simd_test(enable = "f16c")]
137 unsafe fn test_mm_cvtps_ph() {
138 let a = _mm_set_ps(1.0, 2.0, 3.0, 4.0);
139 let r = _mm_cvtps_ph::<_MM_FROUND_CUR_DIRECTION>(a);
140 let e = _mm_set_epi16(0, 0, 0, 0, F16_ONE, F16_TWO, F16_THREE, F16_FOUR);
141 assert_eq_m128i(r, e);
142 }
143
144 #[simd_test(enable = "f16c")]
145 unsafe fn test_mm256_cvtps_ph() {
146 let a = _mm256_set_ps(1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0);
147 let r = _mm256_cvtps_ph::<_MM_FROUND_CUR_DIRECTION>(a);
148 let e = _mm_set_epi16(
149 F16_ONE, F16_TWO, F16_THREE, F16_FOUR, F16_FIVE, F16_SIX, F16_SEVEN, F16_EIGHT,
150 );
151 assert_eq_m128i(r, e);
152 }
153}