/*
 * Copyright 2019 The libgav1 Authors
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef LIBGAV1_SRC_UTILS_CPU_H_
#define LIBGAV1_SRC_UTILS_CPU_H_

#include <cstdint>

namespace libgav1 {

// Compile-time instruction set configuration.
//
// After this header is processed, each of LIBGAV1_ENABLE_SSE4_1,
// LIBGAV1_ENABLE_AVX2, LIBGAV1_ENABLE_NEON, LIBGAV1_TARGETING_SSE4_1 and
// LIBGAV1_TARGETING_AVX2 is defined, so they can be tested with a plain
// #if. The macros are defined while namespace libgav1 is open, but
// preprocessor macros are not scoped by namespaces.

// LIBGAV1_X86 is a helper that is only meaningful inside this header; it is
// #undef'd further down. LIBGAV1_X86_MSVC is additionally set when the x86
// target was recognized via the Visual Studio macros.
#if defined(__i386__) || defined(__x86_64__)
#define LIBGAV1_X86
#elif defined(_MSC_VER) && (defined(_M_IX86) || defined(_M_X64))
#define LIBGAV1_X86
#define LIBGAV1_X86_MSVC
#endif

#if defined(LIBGAV1_X86)

// SSE4.1 defaults to enabled on x86 unless LIBGAV1_ENABLE_SSE4_1 was already
// defined before this point.
#if !defined(LIBGAV1_ENABLE_SSE4_1)
#define LIBGAV1_ENABLE_SSE4_1 1
#endif

#if LIBGAV1_ENABLE_SSE4_1
// AVX2 defaults to enabled whenever SSE4.1 is enabled, unless
// LIBGAV1_ENABLE_AVX2 was already defined before this point.
#if !defined(LIBGAV1_ENABLE_AVX2)
#define LIBGAV1_ENABLE_AVX2 1
#endif  // !defined(LIBGAV1_ENABLE_AVX2)
#else   // !LIBGAV1_ENABLE_SSE4_1
// Disable AVX2 when SSE4.1 is disabled as it may rely on shared components.
#undef LIBGAV1_ENABLE_AVX2
#define LIBGAV1_ENABLE_AVX2 0
#endif  // LIBGAV1_ENABLE_SSE4_1

#else  // !LIBGAV1_X86

// Not an x86 target: force both x86 instruction sets off, overriding any
// earlier definition of these macros.
#undef LIBGAV1_ENABLE_AVX2
#define LIBGAV1_ENABLE_AVX2 0
#undef LIBGAV1_ENABLE_SSE4_1
#define LIBGAV1_ENABLE_SSE4_1 0

#endif  // LIBGAV1_X86

// For x86 LIBGAV1_TARGETING_* indicate the source being built is targeting
// (at least) that instruction set. This prevents disabling other instruction
// sets if the current instruction set isn't a global target, e.g., building
// *_avx2.cc w/-mavx2, but the remaining files without the flag.
#if LIBGAV1_ENABLE_AVX2 && defined(__AVX2__)
#define LIBGAV1_TARGETING_AVX2 1
#else
#define LIBGAV1_TARGETING_AVX2 0
#endif

// Note: LIBGAV1_X86_MSVC isn't completely correct for Visual Studio, but there
// is no equivalent to __SSE4_1__. LIBGAV1_ENABLE_ALL_DSP_FUNCTIONS will be
// enabled in dsp.h to compensate for this.
#if LIBGAV1_ENABLE_SSE4_1 && (defined(__SSE4_1__) || defined(LIBGAV1_X86_MSVC))
#define LIBGAV1_TARGETING_SSE4_1 1
#else
#define LIBGAV1_TARGETING_SSE4_1 0
#endif

// LIBGAV1_X86 is not visible to code that includes this header.
// LIBGAV1_X86_MSVC is intentionally left defined.
#undef LIBGAV1_X86

// NEON is enabled based on the compiler's target macros unless
// LIBGAV1_ENABLE_NEON was already defined before this point.
#if !defined(LIBGAV1_ENABLE_NEON)
// TODO(jzern): add support for _M_ARM64.
#if defined(__ARM_NEON__) || defined(__aarch64__) || \
    (defined(_MSC_VER) && defined(_M_ARM))
#define LIBGAV1_ENABLE_NEON 1
#else
#define LIBGAV1_ENABLE_NEON 0
#endif
#endif  // !defined(LIBGAV1_ENABLE_NEON)

// Single-bit flags, one per instruction set extension. Every enumerator is
// paired with a LIBGAV1_CPU_* macro that expands to the same value, which
// makes the flag values available to the preprocessor as well.
enum CpuFeatures : uint8_t {
  kSSE2 = 1 << 0,
#define LIBGAV1_CPU_SSE2 (1 << 0)
  kSSSE3 = 1 << 1,
#define LIBGAV1_CPU_SSSE3 (1 << 1)
  kSSE4_1 = 1 << 2,
#define LIBGAV1_CPU_SSE4_1 (1 << 2)
  kAVX = 1 << 3,
#define LIBGAV1_CPU_AVX (1 << 3)
  kAVX2 = 1 << 4,
#define LIBGAV1_CPU_AVX2 (1 << 4)
  kNEON = 1 << 5,
#define LIBGAV1_CPU_NEON (1 << 5)
};

// Returns a bit-wise OR of CpuFeatures supported by this platform.
// Note that the return type (uint32_t) is wider than the underlying type of
// CpuFeatures (uint8_t).
uint32_t GetCpuInfo();

}  // namespace libgav1

#endif  // LIBGAV1_SRC_UTILS_CPU_H_