/* * Copyright © 2022-2024 Rémi Denis-Courmont. * * This file is part of FFmpeg. * * FFmpeg is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * FFmpeg is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with FFmpeg; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA */ #ifndef AVUTIL_RISCV_INTMATH_H #define AVUTIL_RISCV_INTMATH_H #include #include "config.h" #include "libavutil/attributes.h" #include "libavutil/riscv/cpu.h" /* * The compiler is forced to sign-extend the result anyhow, so it is faster to * compute it explicitly and use it. */ #define av_clip_int8 av_clip_int8_rvi static av_always_inline av_const int8_t av_clip_int8_rvi(int a) { union { uint8_t u; int8_t s; } u = { .u = a }; if (a != u.s) a = ((a >> 31) ^ 0x7F); return a; } #define av_clip_int16 av_clip_int16_rvi static av_always_inline av_const int16_t av_clip_int16_rvi(int a) { union { uint16_t u; int16_t s; } u = { .u = a }; if (a != u.s) a = ((a >> 31) ^ 0x7FFF); return a; } #define av_clipl_int32 av_clipl_int32_rvi static av_always_inline av_const int32_t av_clipl_int32_rvi(int64_t a) { union { uint32_t u; int32_t s; } u = { .u = a }; if (a != u.s) a = ((a >> 63) ^ 0x7FFFFFFF); return a; } #define av_clip_intp2 av_clip_intp2_rvi static av_always_inline av_const int av_clip_intp2_rvi(int a, int p) { const int shift = 31 - p; int b = ((int)(((unsigned)a) << shift)) >> shift; if (a != b) b = (a >> 31) ^ ((1 << p) - 1); return b; } #if defined (__GNUC__) || defined (__clang__) static inline av_const int ff_ctz_rv(int x) { #if HAVE_RV && !defined(__riscv_zbb) if (!__builtin_constant_p(x) && __builtin_expect(ff_rv_zbb_support(), true)) { int y; __asm__ ( ".option push\n" ".option arch, +zbb\n" #if __riscv_xlen >= 64 "ctzw %0, %1\n" #else "ctz %0, %1\n" #endif ".option pop" : "=r" (y) : "r" (x)); if (y > 32) __builtin_unreachable(); return y; } #endif return __builtin_ctz(x); } #define ff_ctz ff_ctz_rv static inline av_const int ff_ctzll_rv(long long x) { #if HAVE_RV && !defined(__riscv_zbb) && __riscv_xlen == 64 if (!__builtin_constant_p(x) && __builtin_expect(ff_rv_zbb_support(), true)) { int y; __asm__ ( ".option push\n" ".option arch, +zbb\n" "ctz %0, %1\n" ".option pop" : "=r" (y) : "r" (x)); if (y > 64) __builtin_unreachable(); return y; } #endif return __builtin_ctzll(x); } #define ff_ctzll ff_ctzll_rv static inline av_const int ff_clz_rv(int x) { #if HAVE_RV && !defined(__riscv_zbb) if (!__builtin_constant_p(x) && __builtin_expect(ff_rv_zbb_support(), true)) { int y; __asm__ ( ".option push\n" ".option arch, +zbb\n" #if __riscv_xlen >= 64 "clzw %0, %1\n" #else "clz %0, %1\n" #endif ".option pop" : "=r" (y) : "r" (x)); if (y > 32) __builtin_unreachable(); return y; } #endif return __builtin_clz(x); } #define ff_clz ff_clz_rv #if __riscv_xlen == 64 static inline av_const int ff_clzll_rv(long long x) { #if HAVE_RV && !defined(__riscv_zbb) if (!__builtin_constant_p(x) && __builtin_expect(ff_rv_zbb_support(), true)) { int y; __asm__ ( ".option push\n" ".option arch, +zbb\n" "clz %0, %1\n" ".option pop" : "=r" (y) : "r" (x)); if (y > 64) __builtin_unreachable(); return y; } #endif return __builtin_clzll(x); } #define ff_clz ff_clz_rv #endif static inline av_const int ff_log2_rv(unsigned int x) { return 31 - ff_clz_rv(x | 1); } #define ff_log2 ff_log2_rv #define ff_log2_16bit ff_log2_rv static inline av_const int av_popcount_rv(unsigned int x) { #if HAVE_RV && !defined(__riscv_zbb) if (!__builtin_constant_p(x) && __builtin_expect(ff_rv_zbb_support(), true)) { int y; __asm__ ( ".option push\n" ".option arch, +zbb\n" #if __riscv_xlen >= 64 "cpopw %0, %1\n" #else "cpop %0, %1\n" #endif ".option pop" : "=r" (y) : "r" (x)); if (y > 32) __builtin_unreachable(); return y; } #endif return __builtin_popcount(x); } #define av_popcount av_popcount_rv static inline av_const int av_popcount64_rv(uint64_t x) { #if HAVE_RV && !defined(__riscv_zbb) && __riscv_xlen >= 64 if (!__builtin_constant_p(x) && __builtin_expect(ff_rv_zbb_support(), true)) { int y; __asm__ ( ".option push\n" ".option arch, +zbb\n" "cpop %0, %1\n" ".option pop" : "=r" (y) : "r" (x)); if (y > 64) __builtin_unreachable(); return y; } #endif return __builtin_popcountl(x); } #define av_popcount64 av_popcount64_rv static inline av_const int av_parity_rv(unsigned int x) { #if HAVE_RV && !defined(__riscv_zbb) if (!__builtin_constant_p(x) && __builtin_expect(ff_rv_zbb_support(), true)) { int y; __asm__ ( ".option push\n" ".option arch, +zbb\n" #if __riscv_xlen >= 64 "cpopw %0, %1\n" #else "cpop %0, %1\n" #endif ".option pop" : "=r" (y) : "r" (x)); return y & 1; } #endif return __builtin_parity(x); } #define av_parity av_parity_rv #endif #endif /* AVUTIL_RISCV_INTMATH_H */