mirror of
https://git.ffmpeg.org/ffmpeg.git
synced 2024-12-24 08:12:44 +00:00
x86/intmath: add sse optimized av_clipf and av_clipd
Reviewed-by: Michael Niedermayer <michael@niedermayer.cc> Reviewed-by: Ronald S. Bultje <rsbultje@gmail.com> Signed-off-by: James Almer <jamrial@gmail.com>
This commit is contained in:
parent
9f17d4ae7e
commit
f4c1a48483
@ -22,6 +22,7 @@
|
||||
#define AVUTIL_X86_INTMATH_H
|
||||
|
||||
#include <stdint.h>
|
||||
#include <stdlib.h>
|
||||
#if HAVE_FAST_CLZ
|
||||
#if defined(_MSC_VER)
|
||||
#include <intrin.h>
|
||||
@ -98,6 +99,38 @@ static av_always_inline av_const unsigned av_mod_uintp2_bmi2(unsigned a, unsigne
|
||||
|
||||
#endif /* __BMI2__ */
|
||||
|
||||
#if defined(__SSE2__)
|
||||
|
||||
#define av_clipd av_clipd_sse2
|
||||
static av_always_inline av_const double av_clipd_sse2(double a, double amin, double amax)
|
||||
{
|
||||
#if defined(ASSERT_LEVEL) && ASSERT_LEVEL >= 2
|
||||
if (amin > amax) abort();
|
||||
#endif
|
||||
__asm__ ("minsd %2, %0 \n\t"
|
||||
"maxsd %1, %0 \n\t"
|
||||
: "+x"(a) : "xm"(amin), "xm"(amax));
|
||||
return a;
|
||||
}
|
||||
|
||||
#endif /* __SSE2__ */
|
||||
|
||||
#if defined(__SSE__)
|
||||
|
||||
#define av_clipf av_clipf_sse
|
||||
static av_always_inline av_const float av_clipf_sse(float a, float amin, float amax)
|
||||
{
|
||||
#if defined(ASSERT_LEVEL) && ASSERT_LEVEL >= 2
|
||||
if (amin > amax) abort();
|
||||
#endif
|
||||
__asm__ ("minss %2, %0 \n\t"
|
||||
"maxss %1, %0 \n\t"
|
||||
: "+x"(a) : "xm"(amin), "xm"(amax));
|
||||
return a;
|
||||
}
|
||||
|
||||
#endif /* __SSE__ */
|
||||
|
||||
#endif /* __GNUC__ */
|
||||
|
||||
#endif /* AVUTIL_X86_INTMATH_H */
|
||||
|
Loading…
Reference in New Issue
Block a user