Home | History | Annotate | Download | only in include
      1 /*===---- f16cintrin.h - F16C intrinsics ---------------------------------===
      2  *
      3  * Permission is hereby granted, free of charge, to any person obtaining a copy
      4  * of this software and associated documentation files (the "Software"), to deal
      5  * in the Software without restriction, including without limitation the rights
      6  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
      7  * copies of the Software, and to permit persons to whom the Software is
      8  * furnished to do so, subject to the following conditions:
      9  *
     10  * The above copyright notice and this permission notice shall be included in
     11  * all copies or substantial portions of the Software.
     12  *
     13  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     14  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     15  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
     16  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
     17  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
     18  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
     19  * THE SOFTWARE.
     20  *
     21  *===-----------------------------------------------------------------------===
     22  */
     23 
     24 #if !defined __X86INTRIN_H && !defined __IMMINTRIN_H
     25 #error "Never use <f16cintrin.h> directly; include <x86intrin.h> instead."
     26 #endif
     27 
     28 #ifndef __F16C__
     29 # error "F16C instruction is not enabled"
     30 #endif /* __F16C__ */
     31 
     32 #ifndef __F16CINTRIN_H
     33 #define __F16CINTRIN_H
     34 
     35 typedef float __v8sf __attribute__ ((__vector_size__ (32)));
     36 typedef float __m256 __attribute__ ((__vector_size__ (32)));
     37 
     38 #define _mm_cvtps_ph(a, imm) __extension__ ({ \
     39   __m128 __a = (a); \
     40  (__m128i)__builtin_ia32_vcvtps2ph((__v4sf)__a, (imm)); })
     41 
     42 #define _mm256_cvtps_ph(a, imm) __extension__ ({ \
     43   __m256 __a = (a); \
     44  (__m128i)__builtin_ia32_vcvtps2ph256((__v8sf)__a, (imm)); })
     45 
     46 static __inline __m128 __attribute__((__always_inline__, __nodebug__))
     47 _mm_cvtph_ps(__m128i __a)
     48 {
     49   return (__m128)__builtin_ia32_vcvtph2ps((__v8hi)__a);
     50 }
     51 
     52 static __inline __m256 __attribute__((__always_inline__, __nodebug__))
     53 _mm256_cvtph_ps(__m128i __a)
     54 {
     55   return (__m256)__builtin_ia32_vcvtph2ps256((__v8hi)__a);
     56 }
     57 
     58 #endif /* __F16CINTRIN_H */
     59