2013-03-12 14:28:11 +00:00
|
|
|
# Objects appended to OBJS unconditionally (no CONFIG_ guard on this list).
# The final entry intentionally carries no trailing backslash: a dangling
# continuation would splice whatever line comes next into this value.
OBJS += x86/constants.o \
    x86/fmtconvert_init.o
|
2012-10-05 17:54:10 +00:00
|
|
|
|
|
|
|
# Per-option object lists: each line appends to the variable whose name is
# "OBJS-" followed by the expansion of the given CONFIG_ variable.
# How those variables are turned into the final link list is decided by the
# build files that include this one; that logic is not visible here.
# NOTE(review): a few objects are listed under more than one option
# (x86/mlpdsp.o, x86/proresdsp_init.o, x86/rv34dsp_init.o, x86/vp8dsp_init.o);
# presumably the consumer de-duplicates the combined list -- confirm.
OBJS-$(CONFIG_AAC_DECODER) += x86/sbrdsp_init.o
OBJS-$(CONFIG_AC3DSP) += x86/ac3dsp_init.o
OBJS-$(CONFIG_CAVS_DECODER) += x86/cavsdsp.o
OBJS-$(CONFIG_DCT) += x86/dct_init.o
OBJS-$(CONFIG_DNXHD_ENCODER) += x86/dnxhdenc.o
OBJS-$(CONFIG_DSPUTIL) += x86/dsputil_init.o
OBJS-$(CONFIG_ENCODERS) += x86/dsputilenc_mmx.o \
    x86/motion_est.o
OBJS-$(CONFIG_FFT) += x86/fft_init.o
OBJS-$(CONFIG_H264CHROMA) += x86/h264chroma_init.o
OBJS-$(CONFIG_H264DSP) += x86/h264dsp_init.o
OBJS-$(CONFIG_H264PRED) += x86/h264_intrapred_init.o
OBJS-$(CONFIG_H264QPEL) += x86/h264_qpel.o
OBJS-$(CONFIG_HPELDSP) += x86/hpeldsp_init.o
OBJS-$(CONFIG_LPC) += x86/lpc.o
OBJS-$(CONFIG_MLP_DECODER) += x86/mlpdsp.o
OBJS-$(CONFIG_MPEGAUDIODSP) += x86/mpegaudiodsp.o
OBJS-$(CONFIG_MPEGVIDEO) += x86/mpegvideo.o
OBJS-$(CONFIG_MPEGVIDEOENC) += x86/mpegvideoenc.o
OBJS-$(CONFIG_PNG_DECODER) += x86/pngdsp_init.o
OBJS-$(CONFIG_PRORES_DECODER) += x86/proresdsp_init.o
OBJS-$(CONFIG_PRORES_LGPL_DECODER) += x86/proresdsp_init.o
OBJS-$(CONFIG_RV30_DECODER) += x86/rv34dsp_init.o
OBJS-$(CONFIG_RV40_DECODER) += x86/rv34dsp_init.o \
    x86/rv40dsp_init.o
OBJS-$(CONFIG_V210_DECODER) += x86/v210-init.o
OBJS-$(CONFIG_TRUEHD_DECODER) += x86/mlpdsp.o
OBJS-$(CONFIG_VC1_DECODER) += x86/vc1dsp_init.o
OBJS-$(CONFIG_VIDEODSP) += x86/videodsp_init.o
OBJS-$(CONFIG_VORBIS_DECODER) += x86/vorbisdsp_init.o
OBJS-$(CONFIG_VP3DSP) += x86/vp3dsp_init.o
OBJS-$(CONFIG_VP6_DECODER) += x86/vp6dsp_init.o
OBJS-$(CONFIG_VP8_DECODER) += x86/vp8dsp_init.o
OBJS-$(CONFIG_WEBP_DECODER) += x86/vp8dsp_init.o
OBJS-$(CONFIG_XMM_CLOBBER_TEST) += x86/w64xmmtest.o
|
2010-03-16 21:22:59 +00:00
|
|
|
|
2012-10-12 17:57:25 +00:00
|
|
|
# Per-option lists appended to "MMX-OBJS-<expansion of CONFIG_xxx>".
# The condition under which MMX-OBJS-* lists are actually built is defined by
# the including build files and is not visible in this fragment.
# NOTE(review): x86/fpel_mmx.o and x86/rnd_mmx.o appear in both the DSPUTIL
# and HPELDSP lists, and x86/snowdsp.o in both SNOW lists; presumably the
# consumer de-duplicates -- confirm.
MMX-OBJS-$(CONFIG_DSPUTIL) += x86/dsputil_mmx.o \
    x86/fdct.o \
    x86/fpel_mmx.o \
    x86/idct_mmx_xvid.o \
    x86/idct_sse2_xvid.o \
    x86/rnd_mmx.o \
    x86/simple_idct.o
MMX-OBJS-$(CONFIG_DIRAC_DECODER) += x86/dirac_dwt.o
MMX-OBJS-$(CONFIG_HPELDSP) += x86/fpel_mmx.o \
    x86/hpeldsp_mmx.o \
    x86/rnd_mmx.o
MMX-OBJS-$(CONFIG_SNOW_DECODER) += x86/snowdsp.o
MMX-OBJS-$(CONFIG_SNOW_ENCODER) += x86/snowdsp.o
MMX-OBJS-$(CONFIG_VC1_DECODER) += x86/vc1dsp_mmx.o
|
|
|
|
|
2013-05-29 21:15:17 +00:00
|
|
|
# Objects appended to YASM-OBJS unconditionally (no CONFIG_ guard on this list).
# The final entry intentionally carries no trailing backslash: a dangling
# continuation would splice whatever line comes next into this value.
YASM-OBJS += x86/deinterlace.o \
    x86/fmtconvert.o
|
|
|
|
|
2012-02-02 22:55:57 +00:00
|
|
|
# Per-option lists appended to "YASM-OBJS-<expansion of CONFIG_xxx>"
# (AAC_DECODER through RV30_DECODER).
# The condition under which YASM-OBJS-* lists are actually built is defined by
# the including build files and is not visible in this fragment.
# NOTE(review): x86/fpel.o and x86/qpel.o are listed under several options,
# as are x86/h263_loopfilter.o and x86/proresdsp.o; presumably the consumer
# de-duplicates the combined list -- confirm.
YASM-OBJS-$(CONFIG_AAC_DECODER) += x86/sbrdsp.o
YASM-OBJS-$(CONFIG_AC3DSP) += x86/ac3dsp.o
YASM-OBJS-$(CONFIG_DCT) += x86/dct32.o
YASM-OBJS-$(CONFIG_DIRAC_DECODER) += x86/diracdsp_mmx.o \
    x86/diracdsp_yasm.o \
    x86/dwt_yasm.o
YASM-OBJS-$(CONFIG_DSPUTIL) += x86/dsputil.o \
    x86/fpel.o \
    x86/mpeg4qpel.o \
    x86/qpel.o
YASM-OBJS-$(CONFIG_ENCODERS) += x86/dsputilenc.o
YASM-OBJS-$(CONFIG_FFT) += x86/fft.o
YASM-OBJS-$(CONFIG_H263_DECODER) += x86/h263_loopfilter.o
YASM-OBJS-$(CONFIG_H263_ENCODER) += x86/h263_loopfilter.o
YASM-OBJS-$(CONFIG_H264CHROMA) += x86/h264_chromamc.o \
    x86/h264_chromamc_10bit.o
YASM-OBJS-$(CONFIG_H264DSP) += x86/h264_deblock.o \
    x86/h264_deblock_10bit.o \
    x86/h264_idct.o \
    x86/h264_idct_10bit.o \
    x86/h264_weight.o \
    x86/h264_weight_10bit.o
YASM-OBJS-$(CONFIG_H264PRED) += x86/h264_intrapred.o \
    x86/h264_intrapred_10bit.o
YASM-OBJS-$(CONFIG_H264QPEL) += x86/h264_qpel_8bit.o \
    x86/h264_qpel_10bit.o \
    x86/fpel.o \
    x86/qpel.o
YASM-OBJS-$(CONFIG_HPELDSP) += x86/fpel.o \
    x86/hpeldsp.o
YASM-OBJS-$(CONFIG_MPEGAUDIODSP) += x86/imdct36.o
YASM-OBJS-$(CONFIG_PNG_DECODER) += x86/pngdsp.o
YASM-OBJS-$(CONFIG_PRORES_DECODER) += x86/proresdsp.o
YASM-OBJS-$(CONFIG_PRORES_LGPL_DECODER) += x86/proresdsp.o
YASM-OBJS-$(CONFIG_RV30_DECODER) += x86/rv34dsp.o
|
rv40: x86 SIMD for biweight
Provide MMX, SSE2 and SSSE3 versions, with a fast-path when the weights are
multiples of 512 (which is often the case when the values round up nicely).
*_TIMER report for the 16x16 and 8x8 cases:
C:
9015 decicycles in 16, 524257 runs, 31 skips
2656 decicycles in 8, 524271 runs, 17 skips
MMX:
4156 decicycles in 16, 262090 runs, 54 skips
1206 decicycles in 8, 262131 runs, 13 skips
MMX on fast-path:
2760 decicycles in 16, 524222 runs, 66 skips
995 decicycles in 8, 524252 runs, 36 skips
SSE2:
2163 decicycles in 16, 262131 runs, 13 skips
832 decicycles in 8, 262137 runs, 7 skips
SSE2 with fast path:
1783 decicycles in 16, 524276 runs, 12 skips
711 decicycles in 8, 524283 runs, 5 skips
SSSE3:
2117 decicycles in 16, 262136 runs, 8 skips
814 decicycles in 8, 262143 runs, 1 skips
SSSE3 with fast path:
1315 decicycles in 16, 524285 runs, 3 skips
578 decicycles in 8, 524286 runs, 2 skips
This means around a 4% speedup for some sequences.
Signed-off-by: Diego Biurrun <diego@biurrun.de>
2012-01-11 23:11:15 +00:00
|
|
|
# Per-option lists appended to "YASM-OBJS-<expansion of CONFIG_xxx>"
# (RV40_DECODER through WEBP_DECODER).
# The condition under which YASM-OBJS-* lists are actually built is defined by
# the including build files and is not visible in this fragment.
# NOTE(review): x86/vp8dsp.o is listed for both VP8_DECODER and WEBP_DECODER;
# presumably the consumer de-duplicates the combined list -- confirm.
YASM-OBJS-$(CONFIG_RV40_DECODER) += x86/rv34dsp.o \
    x86/rv40dsp.o
YASM-OBJS-$(CONFIG_V210_DECODER) += x86/v210.o
YASM-OBJS-$(CONFIG_VC1_DECODER) += x86/vc1dsp.o
YASM-OBJS-$(CONFIG_VIDEODSP) += x86/videodsp.o
YASM-OBJS-$(CONFIG_VORBIS_DECODER) += x86/vorbisdsp.o
YASM-OBJS-$(CONFIG_VP3DSP) += x86/vp3dsp.o
YASM-OBJS-$(CONFIG_VP6_DECODER) += x86/vp6dsp.o
YASM-OBJS-$(CONFIG_VP8_DECODER) += x86/vp8dsp.o
YASM-OBJS-$(CONFIG_WEBP_DECODER) += x86/vp8dsp.o
|