mirror of https://git.ffmpeg.org/ffmpeg.git
0d7caa5b09
This commit adds new code paths for vscale when filterSize is 2, 4, or 8. By using specialized code with unrolling to match the filterSize, we can improve performance. On AWS c7g (Graviton 3, Neoverse V1) instances (before → after): yuv2yuvX_2_0_512_accurate_neon: 558.8 → 268.9; yuv2yuvX_4_0_512_accurate_neon: 637.5 → 434.9; yuv2yuvX_8_0_512_accurate_neon: 1144.8 → 806.2; yuv2yuvX_16_0_512_accurate_neon: 2080.5 → 1853.7. Signed-off-by: Jonathan Swinney <jswinney@amazon.com> Signed-off-by: Martin Storsjö <martin@martin.st> |
||
---|---|---|
.. | ||
aarch64 | ||
arm | ||
ppc | ||
tests | ||
x86 | ||
Makefile | ||
alphablend.c | ||
bayer_template.c | ||
gamma.c | ||
hscale.c | ||
hscale_fast_bilinear.c | ||
input.c | ||
libswscale.v | ||
log2_tab.c | ||
options.c | ||
output.c | ||
rgb2rgb.c | ||
rgb2rgb.h | ||
rgb2rgb_template.c | ||
slice.c | ||
swscale.c | ||
swscale.h | ||
swscale_internal.h | ||
swscale_unscaled.c | ||
swscaleres.rc | ||
utils.c | ||
version.c | ||
version.h | ||
version_major.h | ||
vscale.c | ||
yuv2rgb.c |