| /*! |
| * \copy |
| * Copyright (c) 2009-2013, Cisco Systems |
| * All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * |
| * * Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * |
| * * Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in |
| * the documentation and/or other materials provided with the |
| * distribution. |
| * |
| * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS |
| * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE |
| * COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, |
| * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, |
| * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |
| * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER |
| * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT |
| * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN |
| * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
| * POSSIBILITY OF SUCH DAMAGE. |
| * |
| * |
| * \file cpu.cpp |
| * |
| * \brief CPU compatibility detection |
| * |
| * \date 04/29/2009 Created |
| * |
| ************************************************************************************* |
| */ |
| #include <string.h> |
| #include <stdio.h> |
| #ifdef ANDROID_NDK |
| #include <cpu-features.h> |
| #endif |
| #include "cpu.h" |
| #include "cpu_core.h" |
| |
| |
| |
| #define CPU_Vendor_AMD "AuthenticAMD" |
| #define CPU_Vendor_INTEL "GenuineIntel" |
| #define CPU_Vendor_CYRIX "CyrixInstead" |
| |
| #if defined(X86_ASM) |
| |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| uint32_t uiCPU = 0; |
| uint32_t uiFeatureA = 0, uiFeatureB = 0, uiFeatureC = 0, uiFeatureD = 0; |
| int32_t CacheLineSize = 0; |
| int8_t chVendorName[16] = { 0 }; |
| uint32_t uiMaxCpuidLevel = 0; |
| |
| if (!WelsCPUIdVerify()) { |
| /* cpuid is not supported in cpu */ |
| return 0; |
| } |
| |
| WelsCPUId (0, &uiFeatureA, (uint32_t*)&chVendorName[0], (uint32_t*)&chVendorName[8], (uint32_t*)&chVendorName[4]); |
| uiMaxCpuidLevel = uiFeatureA; |
| if (uiMaxCpuidLevel == 0) { |
| /* maximum input value for basic cpuid information */ |
| return 0; |
| } |
| |
| WelsCPUId (1, &uiFeatureA, &uiFeatureB, &uiFeatureC, &uiFeatureD); |
| if ((uiFeatureD & 0x00800000) == 0) { |
| /* Basic MMX technology is not support in cpu, mean nothing for us so return here */ |
| return 0; |
| } |
| |
| uiCPU = WELS_CPU_MMX; |
| if (uiFeatureD & 0x02000000) { |
| /* SSE technology is identical to AMD MMX extensions */ |
| uiCPU |= WELS_CPU_MMXEXT | WELS_CPU_SSE; |
| } |
| if (uiFeatureD & 0x04000000) { |
| /* SSE2 support here */ |
| uiCPU |= WELS_CPU_SSE2; |
| } |
| if (uiFeatureD & 0x00000001) { |
| /* x87 FPU on-chip checking */ |
| uiCPU |= WELS_CPU_FPU; |
| } |
| if (uiFeatureD & 0x00008000) { |
| /* CMOV instruction checking */ |
| uiCPU |= WELS_CPU_CMOV; |
| } |
| if ((!strcmp ((const char*)chVendorName, CPU_Vendor_INTEL)) || |
| (!strcmp ((const char*)chVendorName, CPU_Vendor_AMD))) { // confirmed_safe_unsafe_usage |
| if (uiFeatureD & 0x10000000) { |
| /* Multi-Threading checking: contains of multiple logic processors */ |
| uiCPU |= WELS_CPU_HTT; |
| } |
| } |
| |
| if (uiFeatureC & 0x00000001) { |
| /* SSE3 support here */ |
| uiCPU |= WELS_CPU_SSE3; |
| } |
| if (uiFeatureC & 0x00000200) { |
| /* SSSE3 support here */ |
| uiCPU |= WELS_CPU_SSSE3; |
| } |
| if (uiFeatureC & 0x00080000) { |
| /* SSE4.1 support here, 45nm Penryn processor */ |
| uiCPU |= WELS_CPU_SSE41; |
| } |
| if (uiFeatureC & 0x00100000) { |
| /* SSE4.2 support here, next generation Nehalem processor */ |
| uiCPU |= WELS_CPU_SSE42; |
| } |
| if (WelsCPUSupportAVX (uiFeatureA, uiFeatureC)) { |
| /* AVX supported */ |
| uiCPU |= WELS_CPU_AVX; |
| } |
| if (WelsCPUSupportFMA (uiFeatureA, uiFeatureC)) { |
| /* AVX FMA supported */ |
| uiCPU |= WELS_CPU_FMA; |
| } |
| if (uiFeatureC & 0x02000000) { |
| /* AES checking */ |
| uiCPU |= WELS_CPU_AES; |
| } |
| if (uiFeatureC & 0x00400000) { |
| /* MOVBE checking */ |
| uiCPU |= WELS_CPU_MOVBE; |
| } |
| |
| if (uiMaxCpuidLevel >= 7) { |
| uiFeatureC = 0; |
| WelsCPUId (7, &uiFeatureA, &uiFeatureB, &uiFeatureC, &uiFeatureD); |
| if ((uiCPU & WELS_CPU_AVX) && (uiFeatureB & 0x00000020)) { |
| /* AVX2 supported */ |
| uiCPU |= WELS_CPU_AVX2; |
| } |
| } |
| |
| if (uiMaxCpuidLevel >= 7) { |
| uiFeatureC = WelsCPUDetectAVX512(); |
| if (uiFeatureC & 0x10000) uiCPU |= WELS_CPU_AVX512F; |
| if (uiFeatureC & 0x10000000) uiCPU |= WELS_CPU_AVX512CD; |
| if (uiFeatureC & 0x20000) uiCPU |= WELS_CPU_AVX512DQ; |
| if (uiFeatureC & 0x40000000) uiCPU |= WELS_CPU_AVX512BW; |
| if (uiFeatureC & 0x80000000) uiCPU |= WELS_CPU_AVX512VL; |
| } |
| |
| if (pNumberOfLogicProcessors != NULL) { |
| if (uiCPU & WELS_CPU_HTT) { |
| *pNumberOfLogicProcessors = (uiFeatureB & 0x00ff0000) >> 16; // feature bits: 23-16 on returned EBX |
| } else { |
| *pNumberOfLogicProcessors = 0; |
| } |
| if (!strcmp ((const char*)chVendorName, CPU_Vendor_INTEL)) { |
| if (uiMaxCpuidLevel >= 4) { |
| uiFeatureC = 0; |
| WelsCPUId (0x4, &uiFeatureA, &uiFeatureB, &uiFeatureC, &uiFeatureD); |
| if (uiFeatureA != 0) { |
| *pNumberOfLogicProcessors = ((uiFeatureA & 0xfc000000) >> 26) + 1; |
| } |
| } |
| } |
| } |
| |
| WelsCPUId (0x80000000, &uiFeatureA, &uiFeatureB, &uiFeatureC, &uiFeatureD); |
| |
| if ((!strcmp ((const char*)chVendorName, CPU_Vendor_AMD)) |
| && (uiFeatureA >= 0x80000001)) { // confirmed_safe_unsafe_usage |
| WelsCPUId (0x80000001, &uiFeatureA, &uiFeatureB, &uiFeatureC, &uiFeatureD); |
| if (uiFeatureD & 0x00400000) { |
| uiCPU |= WELS_CPU_MMXEXT; |
| } |
| if (uiFeatureD & 0x80000000) { |
| uiCPU |= WELS_CPU_3DNOW; |
| } |
| } |
| |
| if (!strcmp ((const char*)chVendorName, CPU_Vendor_INTEL)) { // confirmed_safe_unsafe_usage |
| int32_t family, model; |
| |
| WelsCPUId (1, &uiFeatureA, &uiFeatureB, &uiFeatureC, &uiFeatureD); |
| family = ((uiFeatureA >> 8) & 0xf) + ((uiFeatureA >> 20) & 0xff); |
| model = ((uiFeatureA >> 4) & 0xf) + ((uiFeatureA >> 12) & 0xf0); |
| |
| if ((family == 6) && (model == 9 || model == 13 || model == 14)) { |
| uiCPU &= ~ (WELS_CPU_SSE2 | WELS_CPU_SSE3); |
| } |
| } |
| |
| // get cache line size |
| if ((!strcmp ((const char*)chVendorName, CPU_Vendor_INTEL)) |
| || ! (strcmp ((const char*)chVendorName, CPU_Vendor_CYRIX))) { // confirmed_safe_unsafe_usage |
| WelsCPUId (1, &uiFeatureA, &uiFeatureB, &uiFeatureC, &uiFeatureD); |
| |
| CacheLineSize = (uiFeatureB & 0xff00) >> |
| 5; // ((clflush_line_size >> 8) << 3), CLFLUSH_line_size * 8 = CacheLineSize_in_byte |
| |
| if (CacheLineSize == 128) { |
| uiCPU |= WELS_CPU_CACHELINE_128; |
| } else if (CacheLineSize == 64) { |
| uiCPU |= WELS_CPU_CACHELINE_64; |
| } else if (CacheLineSize == 32) { |
| uiCPU |= WELS_CPU_CACHELINE_32; |
| } else if (CacheLineSize == 16) { |
| uiCPU |= WELS_CPU_CACHELINE_16; |
| } |
| } |
| |
| return uiCPU; |
| } |
| |
| |
| void WelsCPURestore (const uint32_t kuiCPU) { |
| if (kuiCPU & (WELS_CPU_MMX | WELS_CPU_MMXEXT | WELS_CPU_3DNOW | WELS_CPU_3DNOWEXT)) { |
| WelsEmms(); |
| } |
| } |
| |
| #elif defined(HAVE_NEON) //For supporting both android platform and iOS platform |
| #if defined(ANDROID_NDK) |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| uint32_t uiCPU = 0; |
| AndroidCpuFamily cpuFamily = ANDROID_CPU_FAMILY_UNKNOWN; |
| uint64_t uiFeatures = 0; |
| cpuFamily = android_getCpuFamily(); |
| if (cpuFamily == ANDROID_CPU_FAMILY_ARM) { |
| uiFeatures = android_getCpuFeatures(); |
| if (uiFeatures & ANDROID_CPU_ARM_FEATURE_ARMv7) { |
| uiCPU |= WELS_CPU_ARMv7; |
| } |
| if (uiFeatures & ANDROID_CPU_ARM_FEATURE_VFPv3) { |
| uiCPU |= WELS_CPU_VFPv3; |
| } |
| if (uiFeatures & ANDROID_CPU_ARM_FEATURE_NEON) { |
| uiCPU |= WELS_CPU_NEON; |
| } |
| } |
| |
| if (pNumberOfLogicProcessors != NULL) { |
| *pNumberOfLogicProcessors = android_getCpuCount(); |
| } |
| |
| return uiCPU; |
| } |
| |
| #elif defined(__APPLE__) |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| uint32_t uiCPU = 0; |
| |
| #if defined(__ARM_NEON__) |
| uiCPU |= WELS_CPU_ARMv7; |
| uiCPU |= WELS_CPU_VFPv3; |
| uiCPU |= WELS_CPU_NEON; |
| #endif |
| return uiCPU; |
| } |
| #elif defined(__linux__) |
| |
| /* Generic arm/linux cpu feature detection */ |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| int flags = 0; |
| FILE* f = fopen ("/proc/cpuinfo", "r"); |
| |
| #if defined(__chromeos__) |
| flags |= WELS_CPU_NEON; |
| #endif |
| |
| if (!f) { |
| return flags; |
| } |
| |
| char buf[200]; |
| while (fgets (buf, sizeof (buf), f)) { |
| if (!strncmp (buf, "Features", strlen ("Features"))) { |
| // The asimd and fp features are listed on 64 bit ARMv8 kernels |
| if (strstr (buf, " neon ") || strstr (buf, " asimd ")) |
| flags |= WELS_CPU_NEON; |
| if (strstr (buf, " vfpv3 ") || strstr (buf, " fp ")) |
| flags |= WELS_CPU_VFPv3; |
| break; |
| } |
| } |
| fclose (f); |
| return flags; |
| } |
| |
| #else /* HAVE_NEON enabled but no runtime detection */ |
| |
| /* No runtime feature detection available, but built with HAVE_NEON - assume |
| * that NEON and all associated features are available. */ |
| |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| return WELS_CPU_ARMv7 | |
| WELS_CPU_VFPv3 | |
| WELS_CPU_NEON; |
| } |
| #endif |
| #elif defined(HAVE_NEON_AARCH64) |
| |
| /* For AArch64, no runtime detection actually is necessary for now, since |
| * NEON and VFPv3 is mandatory on all such CPUs. (/proc/cpuinfo doesn't |
| * contain neon, and the android cpufeatures library doesn't return it |
| * either.) */ |
| |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| return WELS_CPU_VFPv3 | |
| WELS_CPU_NEON; |
| } |
| |
| #elif defined(mips) |
| /* Get cpu features from cpuinfo. */ |
| static uint32_t get_cpu_flags_from_cpuinfo(void) |
| { |
| uint32_t flags = 0; |
| |
| # ifdef __linux__ |
| FILE* fp = fopen("/proc/cpuinfo", "r"); |
| if (!fp) |
| return flags; |
| |
| char buf[200]; |
| memset(buf, 0, sizeof(buf)); |
| while (fgets(buf, sizeof(buf), fp)) { |
| if (!strncmp(buf, "model name", strlen("model name"))) { |
| if (strstr(buf, "Loongson-3A") || strstr(buf, "Loongson-3B") || |
| strstr(buf, "Loongson-2K")) { |
| flags |= WELS_CPU_MMI; |
| } |
| break; |
| } |
| } |
| while (fgets(buf, sizeof(buf), fp)) { |
| if(!strncmp(buf, "ASEs implemented", strlen("ASEs implemented"))) { |
| if (strstr(buf, "loongson-mmi") && strstr(buf, "loongson-ext")) { |
| flags |= WELS_CPU_MMI; |
| } |
| if (strstr(buf, "msa")) { |
| flags |= WELS_CPU_MSA; |
| } |
| break; |
| } |
| } |
| fclose(fp); |
| # endif |
| |
| return flags; |
| } |
| |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| return get_cpu_flags_from_cpuinfo(); |
| } |
| |
| #elif defined(__loongarch__) && defined(__linux__) |
| /* The getauxval is used to dynamically identify the characteristics |
| * of the loongarch in the running processor during software execution. */ |
| #include <sys/auxv.h> |
| #define LA_HWCAP_LSX (1 << 4) |
| #define LA_HWCAP_LASX (1 << 5) |
| |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| uint32_t flags = 0; |
| uint32_t flag = (uint32_t)getauxval(AT_HWCAP); |
| if (flag & LA_HWCAP_LSX) |
| flags |= WELS_CPU_LSX; |
| if (flag & LA_HWCAP_LASX) |
| flags |= WELS_CPU_LASX; |
| return flags; |
| } |
| |
| #else /* Neither X86_ASM, HAVE_NEON, HAVE_NEON_AARCH64, loongarch nor mips */ |
| |
| uint32_t WelsCPUFeatureDetect (int32_t* pNumberOfLogicProcessors) { |
| return 0; |
| } |
| |
| #endif |