ffmpeg/libavutil
Ronald S. Bultje f0a2b6249b vp9: add 16x16 idct avx2 (8-bit).
checkasm --bench, 10k runs, for *_add_${bpc}_${sub_idct}_${opt}, shows
that it's about 1.65x as fast as the AVX version for the full IDCT, and
similar speedups for the sub-IDCTs:

nop: 24.6
vp9_inv_dct_dct_16x16_add_8_1_c: 6444.8
vp9_inv_dct_dct_16x16_add_8_1_sse2: 638.6
vp9_inv_dct_dct_16x16_add_8_1_ssse3: 484.4
vp9_inv_dct_dct_16x16_add_8_1_avx: 661.2
vp9_inv_dct_dct_16x16_add_8_1_avx2: 311.5
vp9_inv_dct_dct_16x16_add_8_2_c: 6665.7
vp9_inv_dct_dct_16x16_add_8_2_sse2: 646.9
vp9_inv_dct_dct_16x16_add_8_2_ssse3: 455.2
vp9_inv_dct_dct_16x16_add_8_2_avx: 521.9
vp9_inv_dct_dct_16x16_add_8_2_avx2: 304.3
vp9_inv_dct_dct_16x16_add_8_4_c: 7022.7
vp9_inv_dct_dct_16x16_add_8_4_sse2: 647.4
vp9_inv_dct_dct_16x16_add_8_4_ssse3: 467.1
vp9_inv_dct_dct_16x16_add_8_4_avx: 446.1
vp9_inv_dct_dct_16x16_add_8_4_avx2: 297.0
vp9_inv_dct_dct_16x16_add_8_8_c: 6800.4
vp9_inv_dct_dct_16x16_add_8_8_sse2: 598.6
vp9_inv_dct_dct_16x16_add_8_8_ssse3: 465.7
vp9_inv_dct_dct_16x16_add_8_8_avx: 440.9
vp9_inv_dct_dct_16x16_add_8_8_avx2: 290.2
vp9_inv_dct_dct_16x16_add_8_16_c: 6626.6
vp9_inv_dct_dct_16x16_add_8_16_sse2: 599.5
vp9_inv_dct_dct_16x16_add_8_16_ssse3: 475.0
vp9_inv_dct_dct_16x16_add_8_16_avx: 469.9
vp9_inv_dct_dct_16x16_add_8_16_avx2: 286.4
2016-07-11 10:14:58 -04:00
..
aarch64
arm
avr32 Merge commit '41ed7ab45fc693f7d7fc35664c0233f4c32d69bb' 2016-06-21 21:55:34 +02:00
bfin
mips
ppc
sh4
tests Merge commit 'ded4a6543dfb5a2f1d9f7fb8d3ab27a1872c22b3' 2016-06-24 11:16:52 +02:00
tomi
x86 vp9: add 16x16 idct avx2 (8-bit). 2016-07-11 10:14:58 -04:00
.gitignore Merge commit '257f00ec1ab06a2a161f535036c6512f3fc8e801' 2016-06-22 11:28:51 +02:00
Makefile Merge commit 'c46db38cde8e8fd8ecb1c6602f10ec0e002f29a8' 2016-06-22 22:38:49 +02:00
adler32.c
adler32.h
aes.c
aes.h
aes_ctr.c
aes_ctr.h
aes_internal.h
atomic.c
atomic.h
atomic_gcc.h
atomic_suncc.h
atomic_win32.h
attributes.h
audio_fifo.c
audio_fifo.h
avassert.h Merge commit '41ed7ab45fc693f7d7fc35664c0233f4c32d69bb' 2016-06-21 21:55:34 +02:00
avstring.c
avstring.h
avutil.h Merge commit '41ed7ab45fc693f7d7fc35664c0233f4c32d69bb' 2016-06-21 21:55:34 +02:00
avutilres.rc
base64.c
base64.h
blowfish.c
blowfish.h
bprint.c
bprint.h
bswap.h
buffer.c
buffer.h
buffer_internal.h
camellia.c
camellia.h
cast5.c
cast5.h
channel_layout.c
channel_layout.h
color_utils.c
color_utils.h
colorspace.h Merge commit '1f77e634bb838f71ff21923b5e9fe3104c831c52' 2016-06-21 22:16:16 +02:00
common.h
cpu.c
cpu.h
cpu_internal.h
crc.c
crc.h
des.c Merge commit 'a6a750c7ef240b72ce01e9653343a0ddf247d196' 2016-06-22 13:44:34 +02:00
des.h
dict.c
dict.h
display.c
display.h
downmix_info.c
downmix_info.h
dynarray.h
error.c
error.h
eval.c
eval.h
ffmath.h
fifo.c
fifo.h
file.c
file.h
file_open.c lavu/file_open: Use current directory for temporary files also on Android. 2016-06-11 22:41:18 +02:00
fixed_dsp.c
fixed_dsp.h
float_dsp.c
float_dsp.h
frame.c
frame.h avutil/frame: Move new field to the end of AVFrame 2016-06-30 17:43:01 +02:00
hash.c
hash.h
hmac.c
hmac.h
hwcontext.c Merge commit '1c9e8616c535ef496e7ee8a5cbc5e9e972a6977d' 2016-06-26 15:23:24 +02:00
hwcontext.h Merge commit '1c9e8616c535ef496e7ee8a5cbc5e9e972a6977d' 2016-06-26 15:23:24 +02:00
hwcontext_cuda.c Merge commit '2e219b491bcc0845248345fdad31231b081e06d1' 2016-06-26 15:25:12 +02:00
hwcontext_cuda.h
hwcontext_dxva2.c hwcontext_dxva2: Use GetDesktopWindow instead of GetShellWindow 2016-06-26 15:34:40 +02:00
hwcontext_dxva2.h Merge commit 'c46db38cde8e8fd8ecb1c6602f10ec0e002f29a8' 2016-06-22 22:38:49 +02:00
hwcontext_internal.h Merge commit '1c9e8616c535ef496e7ee8a5cbc5e9e972a6977d' 2016-06-26 15:23:24 +02:00
hwcontext_vaapi.c Merge commit 'b8bf9194af602cf3a4bcd19a5e278e3d6d69f8fa' 2016-06-26 15:25:38 +02:00
hwcontext_vaapi.h
hwcontext_vdpau.c Merge commit '38392b2af815898b8716826c4e29d95c04fb2647' 2016-06-26 15:24:53 +02:00
hwcontext_vdpau.h
imgutils.c
imgutils.h
integer.c
integer.h
internal.h
intfloat.h
intmath.c
intmath.h
intreadwrite.h
lfg.c
lfg.h
libavutil.v
libm.h
lls.c
lls.h
log.c
log.h
log2_tab.c
lzo.c
lzo.h
macros.h
mastering_display_metadata.c
mastering_display_metadata.h
mathematics.c
mathematics.h
md5.c Merge commit '41ed7ab45fc693f7d7fc35664c0233f4c32d69bb' 2016-06-21 21:55:34 +02:00
md5.h
mem.c
mem.h
mem_internal.h
motion_vector.h
murmur3.c
murmur3.h
opencl.c
opencl.h
opencl_internal.c
opencl_internal.h
opt.c
opt.h Merge commit '41ed7ab45fc693f7d7fc35664c0233f4c32d69bb' 2016-06-21 21:55:34 +02:00
parseutils.c avutil/parseutils: dont assume standard time when parsing a timestamp 2016-07-11 01:06:23 +02:00
parseutils.h
pca.c
pca.h
pixdesc.c Merge commit 'bcc07e2576cb723007bea1238afd019ae2d1b005' 2016-07-09 14:21:01 +02:00
pixdesc.h
pixelutils.c
pixelutils.h
pixfmt.h lavc: add mediacodec hwaccel support 2016-07-08 17:02:37 +02:00
qsort.h
random_seed.c
random_seed.h
rational.c
rational.h
rc4.c
rc4.h
replaygain.h
reverse.c
ripemd.c
ripemd.h
samplefmt.c
samplefmt.h
sha.c
sha.h
sha512.c
sha512.h
softfloat.h
softfloat_tables.h
stereo3d.c Merge commit '0c4468dc185fa8b9e7d6add914595c5e928b24fd' 2016-06-23 12:38:51 +02:00
stereo3d.h Merge commit '0c4468dc185fa8b9e7d6add914595c5e928b24fd' 2016-06-23 12:38:51 +02:00
tablegen.h
tea.c
tea.h
thread.h
threadmessage.c
threadmessage.h avutil/threadmessage.h: Fix swapped comments 2016-06-16 23:54:51 +02:00
time.c
time.h
time_internal.h
timecode.c
timecode.h
timer.h
timestamp.h
tree.c
tree.h
twofish.c
twofish.h
utils.c
version.h avutil/frame: Move new field to the end of AVFrame 2016-06-30 17:43:01 +02:00
wchar_filename.h
xga_font_data.c
xga_font_data.h
xtea.c
xtea.h