81 lines
1.3 KiB
C
81 lines
1.3 KiB
C
#ifndef _INTRIN_H_
|
|
#define _INTRIN_H_
|
|
|
|
#if defined(_MSC_VER)
|
|
#define BLAS_INLINE __inline
|
|
#elif defined(__GNUC__)
|
|
#if defined(__STRICT_ANSI__)
|
|
#define BLAS_INLINE __inline__
|
|
#else
|
|
#define BLAS_INLINE inline
|
|
#endif
|
|
#else
|
|
#define BLAS_INLINE
|
|
#endif
|
|
|
|
#ifdef _MSC_VER
|
|
#define BLAS_FINLINE static __forceinline
|
|
#elif defined(__GNUC__)
|
|
#define BLAS_FINLINE static BLAS_INLINE __attribute__((always_inline))
|
|
#else
|
|
#define BLAS_FINLINE static
|
|
#endif
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
// include head
|
|
/** SSE **/
|
|
#ifdef HAVE_SSE
|
|
#include <xmmintrin.h>
|
|
#endif
|
|
/** SSE2 **/
|
|
#ifdef HAVE_SSE2
|
|
#include <emmintrin.h>
|
|
#endif
|
|
/** SSE3 **/
|
|
#ifdef HAVE_SSE3
|
|
#include <pmmintrin.h>
|
|
#endif
|
|
/** SSSE3 **/
|
|
#ifdef HAVE_SSSE3
|
|
#include <tmmintrin.h>
|
|
#endif
|
|
/** SSE41 **/
|
|
#ifdef HAVE_SSE4_1
|
|
#include <smmintrin.h>
|
|
#endif
|
|
|
|
/** AVX **/
|
|
#if defined(HAVE_AVX) || defined(HAVE_FMA3)
|
|
#include <immintrin.h>
|
|
#endif
|
|
|
|
/** NEON **/
|
|
#ifdef HAVE_NEON
|
|
#include <arm_neon.h>
|
|
#endif
|
|
|
|
// distribute
|
|
#if defined(HAVE_AVX512VL) || defined(HAVE_AVX512BF16)
|
|
#include "intrin_avx512.h"
|
|
#elif defined(HAVE_AVX2)
|
|
#include "intrin_avx.h"
|
|
#elif defined(HAVE_SSE2)
|
|
#include "intrin_sse.h"
|
|
#endif
|
|
|
|
#ifdef HAVE_NEON
|
|
#include "intrin_neon.h"
|
|
#endif
|
|
|
|
#ifndef V_SIMD
|
|
#define V_SIMD 0
|
|
#define V_SIMD_F64 0
|
|
#endif
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
#endif // _INTRIN_H_
|