diff --git a/include/clang/Basic/BuiltinsX86.def b/include/clang/Basic/BuiltinsX86.def index 832b4163206bbc55570330f5f21057fc8771b126..2a73310954747c1157c2a43e3245634e7a5fd16a 100644 --- a/include/clang/Basic/BuiltinsX86.def +++ b/include/clang/Basic/BuiltinsX86.def @@ -426,9 +426,9 @@ BUILTIN(__builtin_ia32_vperm2f128_pd256, "V4dV4dV4dIc", "") BUILTIN(__builtin_ia32_vperm2f128_ps256, "V8fV8fV8fIc", "") BUILTIN(__builtin_ia32_vperm2f128_si256, "V8iV8iV8iIc", "") BUILTIN(__builtin_ia32_vpermilpd, "V2dV2dIc", "") -BUILTIN(__builtin_ia32_vpermilps, "V4fV4fc", "") +BUILTIN(__builtin_ia32_vpermilps, "V4fV4fIc", "") BUILTIN(__builtin_ia32_vpermilpd256, "V4dV4dIc", "") -BUILTIN(__builtin_ia32_vpermilps256, "V8fV8fc", "") +BUILTIN(__builtin_ia32_vpermilps256, "V8fV8fIc", "") BUILTIN(__builtin_ia32_vinsertf128_pd256, "V4dV4dV2dIc", "") BUILTIN(__builtin_ia32_vinsertf128_ps256, "V8fV8fV4fIc", "") BUILTIN(__builtin_ia32_vinsertf128_si256, "V8iV8iV4iIc", "") diff --git a/lib/Headers/avxintrin.h b/lib/Headers/avxintrin.h index 64ab67b5859c8245a639dcc1d8a70c3c76e13435..d33a07639260d3cc1288c6834604e858691dddb6 100644 --- a/lib/Headers/avxintrin.h +++ b/lib/Headers/avxintrin.h @@ -266,17 +266,13 @@ _mm256_permutevar_ps(__m256 a, __m256i c) __m256d __A = (A); \ (__m256d)__builtin_ia32_vpermilpd256((__v4df)__A, C); }) -static __inline __m128 __attribute__((__always_inline__, __nodebug__)) -_mm_permute_ps(__m128 a, const int c) -{ - return (__m128)__builtin_ia32_vpermilps((__v4sf)a, c); -} +#define _mm_permute_ps(A, C) __extension__ ({ \ + __m128 __A = (A); \ + (__m128)__builtin_ia32_vpermilps((__v4sf)__A, C); }) -static __inline __m256 __attribute__((__always_inline__, __nodebug__)) -_mm256_permute_ps(__m256 a, const int c) -{ - return (__m256)__builtin_ia32_vpermilps256((__v8sf)a, c); -} +#define _mm256_permute_ps(A, C) __extension__ ({ \ + __m256 __A = (A); \ + (__m256)__builtin_ia32_vpermilps256((__v8sf)__A, C); }) #define _mm256_permute2f128_pd(V1, V2, M) __extension__ ({ \ __m256d __V1 = (V1); \