/*
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "libavutil/cpu.h"
#include "libavutil/cpu_internal.h"
#include "config.h"

/*
 * Runtime feature detection.
 *
 * Exactly one of the branches below provides detect_flags(), which returns
 * the AV_CPU_FLAG_* bits for the optional extensions (DOTPROD, I8MM, SVE,
 * SVE2) that the running system reports. Which extensions can be reported
 * differs per branch; the fallback branch reports none.
 */
#if HAVE_GETAUXVAL || HAVE_ELF_AUX_INFO
#include <stdint.h>
#include <sys/auxv.h>

/*
 * Bit masks tested against the AT_HWCAP and AT_HWCAP2 auxiliary vector
 * values. They are defined here rather than taken from system headers.
 */
#define HWCAP_AARCH64_ASIMDDP (1 << 20)
#define HWCAP_AARCH64_SVE     (1 << 22)
#define HWCAP2_AARCH64_SVE2   (1 << 1)
#define HWCAP2_AARCH64_I8MM   (1 << 13)

/**
 * Detect optional extensions from the auxiliary vector hwcap words.
 *
 * @return a combination of AV_CPU_FLAG_DOTPROD, AV_CPU_FLAG_SVE,
 *         AV_CPU_FLAG_SVE2 and AV_CPU_FLAG_I8MM, or 0 if none is reported
 */
static int detect_flags(void)
{
    int flags = 0;

    /* ff_getauxval() is not defined in this file; presumably declared by
     * cpu_internal.h as a wrapper over getauxval()/elf_aux_info(). */
    unsigned long hwcap  = ff_getauxval(AT_HWCAP);
    unsigned long hwcap2 = ff_getauxval(AT_HWCAP2);

    if (hwcap & HWCAP_AARCH64_ASIMDDP)
        flags |= AV_CPU_FLAG_DOTPROD;
    if (hwcap & HWCAP_AARCH64_SVE)
        flags |= AV_CPU_FLAG_SVE;
    if (hwcap2 & HWCAP2_AARCH64_SVE2)
        flags |= AV_CPU_FLAG_SVE2;
    if (hwcap2 & HWCAP2_AARCH64_I8MM)
        flags |= AV_CPU_FLAG_I8MM;

    return flags;
}

#elif defined(__APPLE__) && HAVE_SYSCTLBYNAME
#include <stdint.h>
#include <sys/sysctl.h>

/**
 * Query a numeric sysctl by name.
 *
 * @param feature sysctl name to look up, e.g. "hw.optional.arm.FEAT_DotProd"
 * @return the value stored by sysctlbyname() when the call succeeds,
 *         0 when the call fails (value is then left at its initial 0)
 */
static int have_feature(const char *feature)
{
    uint32_t value = 0;
    size_t size = sizeof(value);

    if (!sysctlbyname(feature, &value, &size, NULL, 0))
        return value;
    return 0;
}

/**
 * Detect optional extensions through the hw.optional.arm.* sysctls.
 *
 * @return a combination of AV_CPU_FLAG_DOTPROD and AV_CPU_FLAG_I8MM,
 *         or 0 if neither is reported
 */
static int detect_flags(void)
{
    int flags = 0;

    if (have_feature("hw.optional.arm.FEAT_DotProd"))
        flags |= AV_CPU_FLAG_DOTPROD;
    if (have_feature("hw.optional.arm.FEAT_I8MM"))
        flags |= AV_CPU_FLAG_I8MM;

    return flags;
}

#elif defined(__OpenBSD__)
#include <machine/armreg.h>
#include <machine/cpu.h>
#include <sys/types.h>
#include <sys/sysctl.h>

/**
 * Detect optional extensions from the ID_AA64ISAR0/ID_AA64ISAR1 values
 * exposed through the CTL_MACHDEP sysctl tree.
 *
 * @return a combination of AV_CPU_FLAG_DOTPROD and AV_CPU_FLAG_I8MM;
 *         0 if nothing is reported, a sysctl() call fails, or
 *         CPU_ID_AA64ISAR0 is not defined by the system headers
 */
static int detect_flags(void)
{
    int flags = 0;

#ifdef CPU_ID_AA64ISAR0
    int mib[2];
    uint64_t isar0;
    uint64_t isar1;
    size_t len;

    mib[0] = CTL_MACHDEP;
    mib[1] = CPU_ID_AA64ISAR0;
    len = sizeof(isar0);
    if (sysctl(mib, 2, &isar0, &len, NULL, 0) != -1) {
        if (ID_AA64ISAR0_DP(isar0) >= ID_AA64ISAR0_DP_IMPL)
            flags |= AV_CPU_FLAG_DOTPROD;
    }

    mib[0] = CTL_MACHDEP;
    mib[1] = CPU_ID_AA64ISAR1;
    len = sizeof(isar1);
    if (sysctl(mib, 2, &isar1, &len, NULL, 0) != -1) {
        /* The I8MM field macros are only used when the headers define them. */
#ifdef ID_AA64ISAR1_I8MM_IMPL
        if (ID_AA64ISAR1_I8MM(isar1) >= ID_AA64ISAR1_I8MM_IMPL)
            flags |= AV_CPU_FLAG_I8MM;
#endif
    }
#endif

    return flags;
}

#elif defined(_WIN32)
#include <windows.h>

/**
 * Detect optional extensions with IsProcessorFeaturePresent().
 *
 * Each query is compiled in only when the corresponding PF_* constant is
 * defined by the headers in use.
 *
 * @return a combination of AV_CPU_FLAG_DOTPROD, AV_CPU_FLAG_I8MM,
 *         AV_CPU_FLAG_SVE and AV_CPU_FLAG_SVE2, or 0 if none is reported
 */
static int detect_flags(void)
{
    int flags = 0;

#ifdef PF_ARM_V82_DP_INSTRUCTIONS_AVAILABLE
    if (IsProcessorFeaturePresent(PF_ARM_V82_DP_INSTRUCTIONS_AVAILABLE))
        flags |= AV_CPU_FLAG_DOTPROD;
#endif
#ifdef PF_ARM_SVE_I8MM_INSTRUCTIONS_AVAILABLE
    /* There's no PF_* flag that indicates whether plain I8MM is available
     * or not. But if SVE_I8MM is available, that also implies that
     * regular I8MM is available. */
    if (IsProcessorFeaturePresent(PF_ARM_SVE_I8MM_INSTRUCTIONS_AVAILABLE))
        flags |= AV_CPU_FLAG_I8MM;
#endif
#ifdef PF_ARM_SVE_INSTRUCTIONS_AVAILABLE
    if (IsProcessorFeaturePresent(PF_ARM_SVE_INSTRUCTIONS_AVAILABLE))
        flags |= AV_CPU_FLAG_SVE;
#endif
#ifdef PF_ARM_SVE2_INSTRUCTIONS_AVAILABLE
    if (IsProcessorFeaturePresent(PF_ARM_SVE2_INSTRUCTIONS_AVAILABLE))
        flags |= AV_CPU_FLAG_SVE2;
#endif

    return flags;
}

#else

/**
 * Fallback used when no runtime detection branch applies.
 *
 * @return always 0
 */
static int detect_flags(void)
{
    return 0;
}

#endif

/**
 * Compute the CPU flags for AArch64.
 *
 * The result is the union of three sources:
 *  - baseline flags enabled by the HAVE_ARMV8 / HAVE_NEON configuration
 *    macros,
 *  - flags for extensions the compiler was told to target, as shown by
 *    the __ARM_FEATURE_* predefined macros,
 *  - flags reported at runtime by detect_flags().
 *
 * @return a combination of AV_CPU_FLAG_* values
 */
int ff_get_cpu_flags_aarch64(void)
{
    /* Multiplying by the HAVE_* macro keeps or drops the flag; this assumes
     * the macros expand to 0 or 1 (defined outside this file). */
    int flags = (AV_CPU_FLAG_ARMV8 * HAVE_ARMV8) |
                (AV_CPU_FLAG_NEON  * HAVE_NEON);

#ifdef __ARM_FEATURE_DOTPROD
    flags |= AV_CPU_FLAG_DOTPROD;
#endif
#ifdef __ARM_FEATURE_MATMUL_INT8
    flags |= AV_CPU_FLAG_I8MM;
#endif
#ifdef __ARM_FEATURE_SVE
    flags |= AV_CPU_FLAG_SVE;
#endif
#ifdef __ARM_FEATURE_SVE2
    flags |= AV_CPU_FLAG_SVE2;
#endif

    flags |= detect_flags();

    return flags;
}

/**
 * Report the maximum alignment for AArch64.
 *
 * @return 16 when av_get_cpu_flags() includes AV_CPU_FLAG_NEON, 8 otherwise
 */
size_t ff_get_cpu_max_align_aarch64(void)
{
    int flags = av_get_cpu_flags();

    if (flags & AV_CPU_FLAG_NEON)
        return 16;

    return 8;
}