[babl/wip/msvc: 6/6] build: Enable F16C intrinsics on Visual Studio
- From: Chun-wei Fan <fanchunwei src gnome org>
- To: commits-list gnome org
- Cc:
- Subject: [babl/wip/msvc: 6/6] build: Enable F16C intrinsics on Visual Studio
- Date: Tue, 21 Jan 2020 10:20:10 +0000 (UTC)
commit e03fc5b1f5e3f754b20f90741427eb38de061c30
Author: Chun-wei Fan <fanchunwei src gnome org>
Date: Tue Jan 21 18:18:11 2020 +0800
build: Enable F16C intrinsics on Visual Studio
The Visual Studio versions that we support are capable of building F16C
intrinsics, so enable that support in the build. Also update the
code so that we avoid using GCC-specific intrinsics implementations.
extensions/sse-half.c | 16 ++++++++--------
meson.build | 4 ++++
2 files changed, 12 insertions(+), 8 deletions(-)
---
diff --git a/extensions/sse-half.c b/extensions/sse-half.c
index cee397555..dc9e39f0f 100644
--- a/extensions/sse-half.c
+++ b/extensions/sse-half.c
@@ -36,17 +36,17 @@ conv_yHalf_yF (const Babl *conversion,
long samples)
{
const uint64_t *s_vec;
- __v4sf *d_vec;
+ __m128 *d_vec;
long n = samples;
s_vec = (const uint64_t *)src;
- d_vec = (__v4sf *)dst;
+ d_vec = (__m128 *)dst;
while (n >= 4)
{
- __m128i in_val = _mm_insert_epi64((__m128i)_mm_setzero_ps(), *s_vec++, 0);
- __v4sf out_val = (__v4sf)_mm_cvtph_ps(in_val);
+ __m128i in_val = _mm_insert_epi64(_mm_castps_si128(_mm_setzero_ps()), *s_vec++, 0);
+ __m128 out_val = _mm_cvtph_ps(in_val);
_mm_storeu_ps((float *)d_vec++, out_val);
n -= 4;
}
@@ -56,8 +56,8 @@ conv_yHalf_yF (const Babl *conversion,
while (n)
{
- __m128i in_val = _mm_insert_epi16((__m128i)_mm_setzero_ps(), *src++, 0);
- __v4sf out_val = (__v4sf)_mm_cvtph_ps(in_val);
+ __m128i in_val = _mm_insert_epi16(_mm_castps_si128(_mm_setzero_ps()), *src++, 0);
+ __m128 out_val = _mm_cvtph_ps(in_val);
_mm_store_ss(dst++, out_val);
n -= 1;
}
@@ -96,12 +96,12 @@ conv_yF_yHalf (const Babl *conversion,
uint16_t *dst,
long samples)
{
- const __v4sf *s_vec;
+ const __m128 *s_vec;
uint64_t *d_vec;
long n = samples;
- s_vec = (const __v4sf *)src;
+ s_vec = (const __m128 *)src;
d_vec = (uint64_t *)dst;
while (n >= 4)
diff --git a/meson.build b/meson.build
index 248aa0792..fed45711c 100644
--- a/meson.build
+++ b/meson.build
@@ -306,6 +306,10 @@ if cc.get_id() == 'msvc' and have_x86
endif
endif
endif
+ if get_option('enable-f16c')
+ conf.set('USE_F16C', 1, description:
+ 'Define to 1 if f16c intrinsics are available.')
+ endif
endif
endif
[
Date Prev][
Date Next] [
Thread Prev][
Thread Next]
[
Thread Index]
[
Date Index]
[
Author Index]