mirror of
https://git.ffmpeg.org/ffmpeg.git
synced 2025-02-19 21:36:54 +00:00
lavc/vp9dsp: R-V V ipred hor
C908:
vp9_hor_8x8_8bpp_c: 74.7
vp9_hor_8x8_8bpp_rvv_i32: 35.7
vp9_hor_16x16_8bpp_c: 175.5
vp9_hor_16x16_8bpp_rvv_i32: 80.2
vp9_hor_32x32_8bpp_c: 510.2
vp9_hor_32x32_8bpp_rvv_i32: 264.0

Signed-off-by: Rémi Denis-Courmont <remi@remlab.net>
This commit is contained in:
parent
b82d9f55d1
commit
0cc8661499
@ -117,3 +117,59 @@ func_dc dc_left 8 left 3 0 zve64x
|
||||
func_dc dc_top 32 top 5 1 zve32x
|
||||
func_dc dc_top 16 top 4 1 zve32x
|
||||
func_dc dc_top 8 top 3 0 zve64x
|
||||
|
||||
// Horizontal intra prediction for a 32x32 block of 8-bit pixels.
// Register roles, matching the C prototype's argument order under the
// standard RISC-V calling convention:
//   a0 = dst    (advanced by a1 after every stored row)
//   a1 = stride (byte distance between consecutive rows)
//   a2 = l      (left-edge pixels, consumed from l[31] down to l[0])
// a3 (the `a` argument) is never read. t0 and t1 are scratch.
// Each output row is one left-edge byte replicated across the whole row.
func ff_h_32x32_rvv, zve32x
|
||||
li t0, 32
|
||||
// Start at the last left-edge byte; rows are produced while walking backwards.
addi a2, a2, 31
|
||||
// Request vl = 32 elements of 8 bits with LMUL = 2, tail/mask agnostic.
// NOTE(review): a full 32-element row is only granted when VLMAX >= 32
// (VLEN >= 128 at e8/m2); presumably guaranteed by the init code - confirm.
vsetvli zero, t0, e8, m2, ta, ma
|
||||
|
||||
// Two passes of 16 rows each: 16 register groups are filled, then stored.
.rept 2
|
||||
// LMUL = 2 makes each operand a pair of registers, hence even numbers only.
.irp n 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30
|
||||
// Fetch one left-edge byte, step the pointer back, broadcast the byte.
lbu t1, (a2)
|
||||
addi a2, a2, -1
|
||||
vmv.v.x v\n, t1
|
||||
.endr
|
||||
.irp n 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30
|
||||
// Write one row, then move dst down by one stride.
vse8.v v\n, (a0)
|
||||
add a0, a0, a1
|
||||
.endr
|
||||
.endr
|
||||
|
||||
ret
|
||||
endfunc
|
||||
|
||||
// Horizontal intra prediction for a 16x16 block of 8-bit pixels.
// Register roles, matching the C prototype's argument order under the
// standard RISC-V calling convention:
//   a0 = dst    (advanced by a1 between rows)
//   a1 = stride (byte distance between consecutive rows)
//   a2 = l      (left-edge pixels, consumed from l[15] down to l[0])
// a3 (the `a` argument) is never read. t1 is scratch.
// Each output row is one left-edge byte replicated across the whole row.
func ff_h_16x16_rvv, zve32x
|
||||
// Start at the last left-edge byte; rows are produced while walking backwards.
addi a2, a2, 15
|
||||
// vl = 16 elements of 8 bits, LMUL = 1, tail/mask agnostic.
// NOTE(review): needs VLEN >= 128 for a full 16-byte row in one register;
// presumably guaranteed by the init code - confirm.
vsetivli zero, 16, e8, m1, ta, ma
|
||||
|
||||
// One vector register per row: v8..v23 hold the 16 broadcast rows.
.irp n 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23
|
||||
// Fetch one left-edge byte, step the pointer back, broadcast the byte.
lbu t1, (a2)
|
||||
addi a2, a2, -1
|
||||
vmv.v.x v\n, t1
|
||||
.endr
|
||||
// Store rows 0..14, advancing dst after each one.
.irp n 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22
|
||||
vse8.v v\n, (a0)
|
||||
add a0, a0, a1
|
||||
.endr
|
||||
// Final row is stored outside the loop so no pointer increment follows it.
vse8.v v23, (a0)
|
||||
|
||||
ret
|
||||
endfunc
|
||||
|
||||
// Horizontal intra prediction for an 8x8 block of 8-bit pixels.
// Register roles, matching the C prototype's argument order under the
// standard RISC-V calling convention:
//   a0 = dst    (advanced by a1 between rows)
//   a1 = stride (byte distance between consecutive rows)
//   a2 = l      (left-edge pixels, consumed from l[7] down to l[0])
// a3 (the `a` argument) is never read. t1 is scratch.
// Each output row is one left-edge byte replicated across the whole row.
func ff_h_8x8_rvv, zve32x
|
||||
// Start at the last left-edge byte; rows are produced while walking backwards.
addi a2, a2, 7
|
||||
// vl = 8 elements of 8 bits, fractional LMUL = 1/2, tail/mask agnostic.
// NOTE(review): needs VLEN >= 128 for 8 elements at e8/mf2; presumably
// guaranteed by the init code - confirm.
vsetivli zero, 8, e8, mf2, ta, ma
|
||||
|
||||
// One vector register per row: v8..v15 hold the 8 broadcast rows.
.irp n 8, 9, 10, 11, 12, 13, 14, 15
|
||||
// Fetch one left-edge byte, step the pointer back, broadcast the byte.
lbu t1, (a2)
|
||||
addi a2, a2, -1
|
||||
vmv.v.x v\n, t1
|
||||
.endr
|
||||
// Store rows 0..6, advancing dst after each one.
.irp n 8, 9, 10, 11, 12, 13, 14
|
||||
vse8.v v\n, (a0)
|
||||
add a0, a0, a1
|
||||
.endr
|
||||
// Final row is stored outside the loop so no pointer increment follows it.
vse8.v v15, (a0)
|
||||
|
||||
ret
|
||||
endfunc
|
||||
|
@ -66,6 +66,12 @@ void ff_v_16x16_rvi(uint8_t *dst, ptrdiff_t stride, const uint8_t *l,
|
||||
const uint8_t *a);
|
||||
void ff_v_8x8_rvi(uint8_t *dst, ptrdiff_t stride, const uint8_t *l,
|
||||
const uint8_t *a);
|
||||
/*
 * Horizontal intra predictors implemented in RISC-V Vector assembly.
 * Each one fills an NxN block of 8-bit pixels at dst, with rows `stride`
 * bytes apart; every row is a single byte of `l` replicated across the row.
 * The assembly reads `l` from its last byte (l[N-1], first row) backwards to
 * l[0] (last row) and never reads `a`.
 */
void ff_h_32x32_rvv(uint8_t *dst, ptrdiff_t stride, const uint8_t *l,
|
||||
const uint8_t *a);
|
||||
void ff_h_16x16_rvv(uint8_t *dst, ptrdiff_t stride, const uint8_t *l,
|
||||
const uint8_t *a);
|
||||
void ff_h_8x8_rvv(uint8_t *dst, ptrdiff_t stride, const uint8_t *l,
|
||||
const uint8_t *a);
|
||||
|
||||
#define VP9_8TAP_RISCV_RVV_FUNC(SIZE, type, type_idx) \
|
||||
void ff_put_8tap_##type##_##SIZE##h_rvv(uint8_t *dst, ptrdiff_t dststride, \
|
||||
|
@ -86,6 +86,9 @@ static av_cold void vp9dsp_intrapred_init_riscv(VP9DSPContext *dsp, int bpp)
|
||||
dsp->intra_pred[TX_16X16][DC_129_PRED] = ff_dc_129_16x16_rvv;
|
||||
dsp->intra_pred[TX_32X32][TOP_DC_PRED] = ff_dc_top_32x32_rvv;
|
||||
dsp->intra_pred[TX_16X16][TOP_DC_PRED] = ff_dc_top_16x16_rvv;
|
||||
dsp->intra_pred[TX_32X32][HOR_PRED] = ff_h_32x32_rvv;
|
||||
dsp->intra_pred[TX_16X16][HOR_PRED] = ff_h_16x16_rvv;
|
||||
dsp->intra_pred[TX_8X8][HOR_PRED] = ff_h_8x8_rvv;
|
||||
}
|
||||
#endif
|
||||
#endif
|
||||
|
Loading…
Reference in New Issue
Block a user