From 5de29aeef00f6adf4b9ef278415d8f753283ef03 Mon Sep 17 00:00:00 2001 From: Brian Paul Date: Wed, 17 Aug 2016 10:41:30 -0600 Subject: util: try to use SSE instructions with MSVC and 32-bit gcc MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit The lrint() and lrintf() functions are pretty slow and make some texture transfers very inefficient. This patch makes a better effort at using the SSE intrinsics for 32-bit gcc and MSVC. Note, this patch doesn't address the use of SSE4.1 with MSVC. v2: get rid of the ROUND_WITH_SSE symbol, per Matt. Reviewed-by: José Fonseca Reviewed-by: Matt Turner --- src/util/rounding.h | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/src/util/rounding.h b/src/util/rounding.h index afb38fb..dfc691e 100644 --- a/src/util/rounding.h +++ b/src/util/rounding.h @@ -29,7 +29,8 @@ #include <limits.h> #include <stdint.h> -#ifdef __x86_64__ +#if defined(__SSE__) || defined(_MSC_VER) +/* MSVC always has SSE nowadays */ #include <xmmintrin.h> #include <emmintrin.h> #endif @@ -95,7 +96,7 @@ _mesa_roundeven(double x) static inline long _mesa_lroundevenf(float x) { -#ifdef __x86_64__ +#if defined(__SSE__) || defined(_MSC_VER) #if LONG_MAX == INT64_MAX return _mm_cvtss_si64(_mm_load_ss(&x)); #elif LONG_MAX == INT32_MAX @@ -115,7 +116,7 @@ _mesa_lroundevenf(float x) static inline long _mesa_lroundeven(double x) { -#ifdef __x86_64__ +#if defined(__SSE__) || defined(_MSC_VER) #if LONG_MAX == INT64_MAX return _mm_cvtsd_si64(_mm_load_sd(&x)); #elif LONG_MAX == INT32_MAX -- cgit v1.1