mirror of
https://chromium.googlesource.com/libyuv/libyuv
synced 2026-05-01 03:19:18 +08:00
Removed all SSE functions, macros, dispatching logic, and related unit tests across the repository to reduce code size and complexity. Left cpuid detection intact. Supported architectures like AVX2, NEON, SVE, etc. are unaffected. R=rrwinterton@gmail.com Bug: None Test: Build and run libyuv_unittest Change-Id: Id19608dba35b79c4c8fc31f920a6a968883d300f
421 lines
13 KiB
C++
421 lines
13 KiB
C++
/*
|
|
* Copyright 2012 The LibYuv Project Authors. All rights reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
|
|
#ifdef __linux__
|
|
#include <ctype.h>
|
|
#include <sys/utsname.h>
|
|
#endif
|
|
|
|
#include "../unit_test/unit_test.h"
|
|
#include "libyuv/basic_types.h"
|
|
#include "libyuv/cpu_id.h"
|
|
#include "libyuv/version.h"
|
|
|
|
namespace libyuv {
|
|
|
|
#if defined(__i386__) || defined(__x86_64__) || defined(_M_IX86) || \
|
|
defined(_M_X64)
|
|
TEST_F(LibYUVBaseTest, TestCpuId) {
|
|
int has_x86 = TestCpuFlag(kCpuHasX86);
|
|
if (has_x86) {
|
|
int cpu_info[4];
|
|
// Vendor ID:
|
|
// AuthenticAMD AMD processor
|
|
// CentaurHauls Centaur processor
|
|
// CyrixInstead Cyrix processor
|
|
// GenuineIntel Intel processor
|
|
// GenuineTMx86 Transmeta processor
|
|
// Geode by NSC National Semiconductor processor
|
|
// NexGenDriven NexGen processor
|
|
// RiseRiseRise Rise Technology processor
|
|
// SiS SiS SiS SiS processor
|
|
// UMC UMC UMC UMC processor
|
|
CpuId(0, 0, cpu_info);
|
|
cpu_info[0] = cpu_info[1]; // Reorder output
|
|
cpu_info[1] = cpu_info[3];
|
|
cpu_info[3] = 0;
|
|
printf("Cpu Vendor: %s 0x%x 0x%x 0x%x\n",
|
|
reinterpret_cast<char*>(&cpu_info[0]), cpu_info[0], cpu_info[1],
|
|
cpu_info[2]);
|
|
EXPECT_EQ(12u, strlen(reinterpret_cast<char*>(&cpu_info[0])));
|
|
|
|
// CPU Family and Model
|
|
// 3:0 - Stepping
|
|
// 7:4 - Model
|
|
// 11:8 - Family
|
|
// 13:12 - Processor Type
|
|
// 19:16 - Extended Model
|
|
// 27:20 - Extended Family
|
|
CpuId(1, 0, cpu_info);
|
|
int family = ((cpu_info[0] >> 8) & 0x0f) | ((cpu_info[0] >> 16) & 0xff0);
|
|
int model = ((cpu_info[0] >> 4) & 0x0f) | ((cpu_info[0] >> 12) & 0xf0);
|
|
printf("Cpu Family %d (0x%x), Model %d (0x%x)\n", family, family, model,
|
|
model);
|
|
}
|
|
}
|
|
#endif
|
|
|
|
#ifdef __linux__
|
|
static void KernelVersion(int* version) {
|
|
struct utsname buffer;
|
|
int i = 0;
|
|
|
|
version[0] = version[1] = 0;
|
|
if (uname(&buffer) == 0) {
|
|
char* v = buffer.release;
|
|
for (i = 0; *v && i < 2; ++v) {
|
|
if (isdigit(*v)) {
|
|
version[i++] = (int)strtol(v, &v, 10);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
#endif
|
|
|
|
TEST_F(LibYUVBaseTest, TestCpuHas) {
|
|
#if defined(__linux__)
|
|
{
|
|
int kernelversion[2];
|
|
KernelVersion(kernelversion);
|
|
printf("Kernel Version %d.%d\n", kernelversion[0], kernelversion[1]);
|
|
}
|
|
#endif // defined(__linux__)
|
|
|
|
#if defined(__arm__) || defined(__aarch64__)
|
|
int has_arm = TestCpuFlag(kCpuHasARM);
|
|
if (has_arm) {
|
|
int has_neon = TestCpuFlag(kCpuHasNEON);
|
|
int has_neon_dotprod = TestCpuFlag(kCpuHasNeonDotProd);
|
|
int has_neon_i8mm = TestCpuFlag(kCpuHasNeonI8MM);
|
|
int has_sve = TestCpuFlag(kCpuHasSVE);
|
|
int has_sve2 = TestCpuFlag(kCpuHasSVE2);
|
|
int has_sve_f32mm = TestCpuFlag(kCpuHasSVEF32MM);
|
|
int has_sme = TestCpuFlag(kCpuHasSME);
|
|
int has_sme2 = TestCpuFlag(kCpuHasSME2);
|
|
printf("Has Arm 0x%x\n", has_arm);
|
|
printf("Has Neon 0x%x\n", has_neon);
|
|
printf("Has Neon DotProd 0x%x\n", has_neon_dotprod);
|
|
printf("Has Neon I8MM 0x%x\n", has_neon_i8mm);
|
|
printf("Has SVE 0x%x\n", has_sve);
|
|
printf("Has SVE2 0x%x\n", has_sve2);
|
|
printf("Has SVE F32MM 0x%x\n", has_sve_f32mm);
|
|
printf("Has SME 0x%x\n", has_sme);
|
|
printf("Has SME2 0x%x\n", has_sme2);
|
|
|
|
#if defined(__aarch64__)
|
|
// Read and print the SVE and SME vector lengths.
|
|
if (has_sve) {
|
|
int sve_vl;
|
|
asm(".inst 0x04bf5020 \n" // rdvl x0, #1
|
|
"mov %w[sve_vl], w0 \n"
|
|
: [sve_vl] "=r"(sve_vl) // %[sve_vl]
|
|
:
|
|
: "x0");
|
|
printf("SVE vector length: %d bytes\n", sve_vl);
|
|
}
|
|
if (has_sme) {
|
|
int sme_vl;
|
|
asm(".inst 0x04bf5820 \n" // rdsvl x0, #1
|
|
"mov %w[sme_vl], w0 \n"
|
|
: [sme_vl] "=r"(sme_vl) // %[sme_vl]
|
|
:
|
|
: "x0");
|
|
printf("SME vector length: %d bytes\n", sme_vl);
|
|
}
|
|
#endif // defined(__aarch64__)
|
|
}
|
|
#endif // if defined(__arm__) || defined(__aarch64__)
|
|
|
|
#if defined(__riscv)
|
|
int has_riscv = TestCpuFlag(kCpuHasRISCV);
|
|
if (has_riscv) {
|
|
int has_rvv = TestCpuFlag(kCpuHasRVV);
|
|
printf("Has RISCV 0x%x\n", has_riscv);
|
|
printf("Has RVV 0x%x\n", has_rvv);
|
|
|
|
// Read and print the RVV vector length.
|
|
if (has_rvv) {
|
|
register uint32_t vlenb __asm__("t0");
|
|
__asm__(".word 0xC22022F3" /* CSRR t0, vlenb */ : "=r"(vlenb));
|
|
printf("RVV vector length: %d bytes\n", vlenb);
|
|
}
|
|
}
|
|
#endif // defined(__riscv)
|
|
|
|
#if defined(__loongarch__)
|
|
int has_loongarch = TestCpuFlag(kCpuHasLOONGARCH);
|
|
if (has_loongarch) {
|
|
int has_lsx = TestCpuFlag(kCpuHasLSX);
|
|
int has_lasx = TestCpuFlag(kCpuHasLASX);
|
|
printf("Has LOONGARCH 0x%x\n", has_loongarch);
|
|
printf("Has LSX 0x%x\n", has_lsx);
|
|
printf("Has LASX 0x%x\n", has_lasx);
|
|
}
|
|
#endif // defined(__loongarch__)
|
|
|
|
#if defined(__i386__) || defined(__x86_64__) || defined(_M_IX86) || \
|
|
defined(_M_X64)
|
|
int has_x86 = TestCpuFlag(kCpuHasX86);
|
|
if (has_x86) {
|
|
int has_avx = TestCpuFlag(kCpuHasAVX);
|
|
int has_avx2 = TestCpuFlag(kCpuHasAVX2);
|
|
int has_erms = TestCpuFlag(kCpuHasERMS);
|
|
int has_fsmr = TestCpuFlag(kCpuHasFSMR);
|
|
int has_fma3 = TestCpuFlag(kCpuHasFMA3);
|
|
int has_f16c = TestCpuFlag(kCpuHasF16C);
|
|
int has_avx512bw = TestCpuFlag(kCpuHasAVX512BW);
|
|
int has_avx512vl = TestCpuFlag(kCpuHasAVX512VL);
|
|
int has_avx512vnni = TestCpuFlag(kCpuHasAVX512VNNI);
|
|
int has_avx512vbmi = TestCpuFlag(kCpuHasAVX512VBMI);
|
|
int has_avx512vbmi2 = TestCpuFlag(kCpuHasAVX512VBMI2);
|
|
int has_avx512vbitalg = TestCpuFlag(kCpuHasAVX512VBITALG);
|
|
int has_avx10 = TestCpuFlag(kCpuHasAVX10);
|
|
int has_avx10_2 = TestCpuFlag(kCpuHasAVX10_2);
|
|
int has_avxvnni = TestCpuFlag(kCpuHasAVXVNNI);
|
|
int has_avxvnniint8 = TestCpuFlag(kCpuHasAVXVNNIINT8);
|
|
int has_amxint8 = TestCpuFlag(kCpuHasAMXINT8);
|
|
printf("Has X86 0x%x\n", has_x86);
|
|
printf("Has SSSE3 0x%x\n", has_ssse3);
|
|
printf("Has AVX 0x%x\n", has_avx);
|
|
printf("Has AVX2 0x%x\n", has_avx2);
|
|
printf("Has ERMS 0x%x\n", has_erms);
|
|
printf("Has FSMR 0x%x\n", has_fsmr);
|
|
printf("Has FMA3 0x%x\n", has_fma3);
|
|
printf("Has F16C 0x%x\n", has_f16c);
|
|
printf("Has AVX512BW 0x%x\n", has_avx512bw);
|
|
printf("Has AVX512VL 0x%x\n", has_avx512vl);
|
|
printf("Has AVX512VNNI 0x%x\n", has_avx512vnni);
|
|
printf("Has AVX512VBMI 0x%x\n", has_avx512vbmi);
|
|
printf("Has AVX512VBMI2 0x%x\n", has_avx512vbmi2);
|
|
printf("Has AVX512VBITALG 0x%x\n", has_avx512vbitalg);
|
|
printf("Has AVX10 0x%x\n", has_avx10);
|
|
printf("Has AVX10_2 0x%x\n", has_avx10_2);
|
|
printf("HAS AVXVNNI 0x%x\n", has_avxvnni);
|
|
printf("Has AVXVNNIINT8 0x%x\n", has_avxvnniint8);
|
|
printf("Has AMXINT8 0x%x\n", has_amxint8);
|
|
}
|
|
#endif // defined(__i386__) || defined(__x86_64__) || defined(_M_IX86) ||
|
|
// defined(_M_X64)
|
|
}
|
|
|
|
TEST_F(LibYUVBaseTest, TestCompilerMacros) {
|
|
// Tests all macros used in public headers.
|
|
#ifdef __ATOMIC_RELAXED
|
|
printf("__ATOMIC_RELAXED %d\n", __ATOMIC_RELAXED);
|
|
#endif
|
|
#ifdef __cplusplus
|
|
printf("__cplusplus %ld\n", __cplusplus);
|
|
#endif
|
|
#ifdef __clang_major__
|
|
printf("__clang_major__ %d\n", __clang_major__);
|
|
#endif
|
|
#ifdef __clang_minor__
|
|
printf("__clang_minor__ %d\n", __clang_minor__);
|
|
#endif
|
|
#ifdef __GNUC__
|
|
printf("__GNUC__ %d\n", __GNUC__);
|
|
#endif
|
|
#ifdef __GNUC_MINOR__
|
|
printf("__GNUC_MINOR__ %d\n", __GNUC_MINOR__);
|
|
#endif
|
|
#ifdef __i386__
|
|
printf("__i386__ %d\n", __i386__);
|
|
#endif
|
|
#ifdef __x86_64__
|
|
printf("__x86_64__ %d\n", __x86_64__);
|
|
#endif
|
|
#ifdef _M_IX86
|
|
printf("_M_IX86 %d\n", _M_IX86);
|
|
#endif
|
|
#ifdef _M_X64
|
|
printf("_M_X64 %d\n", _M_X64);
|
|
#endif
|
|
#ifdef _MSC_VER
|
|
printf("_MSC_VER %d\n", _MSC_VER);
|
|
#endif
|
|
#ifdef __aarch64__
|
|
printf("__aarch64__ %d\n", __aarch64__);
|
|
#endif
|
|
#ifdef __arm__
|
|
printf("__arm__ %d\n", __arm__);
|
|
#endif
|
|
#ifdef __riscv
|
|
printf("__riscv %d\n", __riscv);
|
|
#endif
|
|
#ifdef __riscv_vector
|
|
printf("__riscv_vector %d\n", __riscv_vector);
|
|
#endif
|
|
#ifdef __riscv_v_intrinsic
|
|
printf("__riscv_v_intrinsic %d\n", __riscv_v_intrinsic);
|
|
#endif
|
|
#ifdef __riscv_zve64x
|
|
printf("__riscv_zve64x %d\n", __riscv_zve64x);
|
|
#endif
|
|
#ifdef __APPLE__
|
|
printf("__APPLE__ %d\n", __APPLE__);
|
|
#endif
|
|
#ifdef __clang__
|
|
printf("__clang__ %d\n", __clang__);
|
|
#endif
|
|
#ifdef __CLR_VER
|
|
printf("__CLR_VER %d\n", __CLR_VER);
|
|
#endif
|
|
#ifdef __CYGWIN__
|
|
printf("__CYGWIN__ %d\n", __CYGWIN__);
|
|
#endif
|
|
#ifdef __llvm__
|
|
printf("__llvm__ %d\n", __llvm__);
|
|
#endif
|
|
#ifdef __loongarch__
|
|
printf("__loongarch__ %d\n", __loongarch__);
|
|
#endif
|
|
#ifdef _WIN32
|
|
printf("_WIN32 %d\n", _WIN32);
|
|
#endif
|
|
#ifdef __native_client__
|
|
printf("__native_client__ %d\n", __native_client__);
|
|
#endif
|
|
#ifdef __pic__
|
|
printf("__pic__ %d\n", __pic__);
|
|
#endif
|
|
#ifdef __pnacl__
|
|
printf("__pnacl__ %d\n", __pnacl__);
|
|
#endif
|
|
#ifdef GG_LONGLONG
|
|
printf("GG_LONGLONG %lld\n", GG_LONGLONG(1));
|
|
#endif
|
|
#ifdef INT_TYPES_DEFINED
|
|
printf("INT_TYPES_DEFINED\n");
|
|
#endif
|
|
#ifdef __has_feature
|
|
printf("__has_feature\n");
|
|
#if __has_feature(memory_sanitizer)
|
|
printf("__has_feature(memory_sanitizer) %d\n",
|
|
__has_feature(memory_sanitizer));
|
|
#endif
|
|
#endif
|
|
}
|
|
|
|
static int FileExists(const char* file_name) {
|
|
FILE* f = fopen(file_name, "r");
|
|
if (!f) {
|
|
return 0;
|
|
}
|
|
fclose(f);
|
|
return 1;
|
|
}
|
|
|
|
TEST_F(LibYUVBaseTest, DISABLED_TestLinuxArm) {
|
|
if (FileExists("../../unit_test/testdata/arm_v7.txt")) {
|
|
printf("Note: testing to load \"../../unit_test/testdata/arm_v7.txt\"\n");
|
|
|
|
EXPECT_EQ(0, ArmCpuCaps("../../unit_test/testdata/arm_v7.txt"));
|
|
EXPECT_EQ(kCpuHasNEON, ArmCpuCaps("../../unit_test/testdata/tegra3.txt"));
|
|
} else {
|
|
printf("WARNING: unable to load \"../../unit_test/testdata/arm_v7.txt\"\n");
|
|
}
|
|
#if defined(__linux__) && defined(__ARM_NEON__) && !defined(__aarch64__)
|
|
if (FileExists("/proc/cpuinfo")) {
|
|
if (kCpuHasNEON != ArmCpuCaps("/proc/cpuinfo")) {
|
|
// This can happen on Arm emulator but /proc/cpuinfo is from host.
|
|
printf("WARNING: Neon build enabled but CPU does not have Neon\n");
|
|
}
|
|
} else {
|
|
printf("WARNING: unable to load \"/proc/cpuinfo\"\n");
|
|
}
|
|
#endif
|
|
}
|
|
|
|
#if defined(__linux__) && defined(__aarch64__)
|
|
TEST_F(LibYUVBaseTest, TestLinuxAArch64) {
|
|
// Values taken from a Cortex-A57 machine, only Neon available.
|
|
EXPECT_EQ(kCpuHasNEON, AArch64CpuCaps(0xffU, 0x0U));
|
|
|
|
// Values taken from a Google Pixel 7.
|
|
int expected = kCpuHasNEON | kCpuHasNeonDotProd;
|
|
EXPECT_EQ(expected, AArch64CpuCaps(0x119fffU, 0x0U));
|
|
|
|
// Values taken from a Google Pixel 8.
|
|
expected = kCpuHasNEON | kCpuHasNeonDotProd | kCpuHasNeonI8MM | kCpuHasSVE |
|
|
kCpuHasSVE2;
|
|
EXPECT_EQ(expected, AArch64CpuCaps(0x3fffffffU, 0x2f33fU));
|
|
|
|
// Values taken from a Neoverse N2 machine.
|
|
EXPECT_EQ(expected, AArch64CpuCaps(0x3fffffffU, 0x2f3ffU));
|
|
|
|
// Check for SME feature detection.
|
|
expected |= kCpuHasSME;
|
|
EXPECT_EQ(expected, AArch64CpuCaps(0x3fffffffU, 0x82f3ffU));
|
|
|
|
// TODO: Check for SME2 feature detection from Apple M4
|
|
}
|
|
#endif
|
|
|
|
TEST_F(LibYUVBaseTest, DISABLED_TestLinuxRVV) {
|
|
if (FileExists("../../unit_test/testdata/riscv64.txt")) {
|
|
printf("Note: testing to load \"../../unit_test/testdata/riscv64.txt\"\n");
|
|
|
|
EXPECT_EQ(0, RiscvCpuCaps("../../unit_test/testdata/riscv64.txt"));
|
|
EXPECT_EQ(kCpuHasRVV,
|
|
RiscvCpuCaps("../../unit_test/testdata/riscv64_rvv.txt"));
|
|
EXPECT_EQ(kCpuHasRVV | kCpuHasRVVZVFH,
|
|
RiscvCpuCaps("../../unit_test/testdata/riscv64_rvv_zvfh.txt"));
|
|
} else {
|
|
printf(
|
|
"WARNING: unable to load "
|
|
"\"../../unit_test/testdata/riscv64.txt\"\n");
|
|
}
|
|
#if defined(__linux__) && defined(__riscv)
|
|
if (FileExists("/proc/cpuinfo")) {
|
|
if (!(kCpuHasRVV & RiscvCpuCaps("/proc/cpuinfo"))) {
|
|
// This can happen on RVV emulator but /proc/cpuinfo is from host.
|
|
printf("WARNING: RVV build enabled but CPU does not have RVV\n");
|
|
}
|
|
} else {
|
|
printf("WARNING: unable to load \"/proc/cpuinfo\"\n");
|
|
}
|
|
#endif
|
|
}
|
|
|
|
#ifdef _WIN32
|
|
// This doesn't pass on Windows CQ.
|
|
#define MAYBE_TestSetCpuFlags DISABLED_TestSetCpuFlags
|
|
#else
|
|
#define MAYBE_TestSetCpuFlags TestSetCpuFlags
|
|
#endif
|
|
TEST_F(LibYUVBaseTest, MAYBE_TestSetCpuFlags) {
|
|
// Reset any masked flags that may have been set so auto init is enabled.
|
|
MaskCpuFlags(0);
|
|
|
|
int original_cpu_flags = TestCpuFlag(-1);
|
|
|
|
// Test setting different CPU configurations.
|
|
int cpu_flags = kCpuHasARM | kCpuHasNEON | kCpuInitialized;
|
|
SetCpuFlags(cpu_flags);
|
|
EXPECT_EQ(cpu_flags, TestCpuFlag(-1));
|
|
|
|
cpu_flags = kCpuHasX86 | kCpuInitialized;
|
|
SetCpuFlags(cpu_flags);
|
|
EXPECT_EQ(cpu_flags, TestCpuFlag(-1));
|
|
|
|
// Test that setting 0 turns auto-init back on.
|
|
SetCpuFlags(0);
|
|
EXPECT_EQ(original_cpu_flags, TestCpuFlag(-1));
|
|
|
|
// Restore the CPU flag mask.
|
|
MaskCpuFlags(benchmark_cpu_info_);
|
|
}
|
|
|
|
} // namespace libyuv
|