xref: /aosp_15_r20/external/libdav1d/src/x86/cpu.c (revision c09093415860a1c2373dacd84c4fde00c507cdfd)
/*
 * Copyright © 2018, VideoLAN and dav1d authors
 * Copyright © 2018, Two Orioles, LLC
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 *    list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 *    this list of conditions and the following disclaimer in the documentation
 *    and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
27*c0909341SAndroid Build Coastguard Worker 
28*c0909341SAndroid Build Coastguard Worker #include "config.h"
29*c0909341SAndroid Build Coastguard Worker 
30*c0909341SAndroid Build Coastguard Worker #include <stdint.h>
31*c0909341SAndroid Build Coastguard Worker #include <string.h>
32*c0909341SAndroid Build Coastguard Worker 
33*c0909341SAndroid Build Coastguard Worker #include "common/attributes.h"
34*c0909341SAndroid Build Coastguard Worker 
35*c0909341SAndroid Build Coastguard Worker #include "src/cpu.h"
36*c0909341SAndroid Build Coastguard Worker #include "src/x86/cpu.h"
37*c0909341SAndroid Build Coastguard Worker 
/*
 * Register values produced by a single CPUID query.
 *
 * The field order (eax, ebx, edx, ecx) is load-bearing and must not be
 * changed: dav1d_get_cpu_flags_x86() overlays this struct with
 * { uint32_t max_leaf; char vendor[12]; } so that, for leaf 0, the
 * ebx/edx/ecx fields can be read back as one contiguous 12-byte vendor string.
 * NOTE(review): the out-of-file dav1d_cpu_cpuid() implementation presumably
 * stores the registers using this same layout - confirm before touching it.
 */
typedef struct {
    uint32_t eax, ebx, edx, ecx;
} CpuidRegisters;
41*c0909341SAndroid Build Coastguard Worker 
42*c0909341SAndroid Build Coastguard Worker void dav1d_cpu_cpuid(CpuidRegisters *regs, unsigned leaf, unsigned subleaf);
43*c0909341SAndroid Build Coastguard Worker uint64_t dav1d_cpu_xgetbv(unsigned xcr);
44*c0909341SAndroid Build Coastguard Worker 
/* Evaluates to 1 when every bit set in `mask` is also set in `reg`, else 0.
 * `mask` is expanded twice, so only pass side-effect-free expressions. */
#define X(reg, mask) (((reg) & (mask)) == (mask))
46*c0909341SAndroid Build Coastguard Worker 
dav1d_get_cpu_flags_x86(void)47*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_x86(void) {
48*c0909341SAndroid Build Coastguard Worker     union {
49*c0909341SAndroid Build Coastguard Worker         CpuidRegisters r;
50*c0909341SAndroid Build Coastguard Worker         struct {
51*c0909341SAndroid Build Coastguard Worker             uint32_t max_leaf;
52*c0909341SAndroid Build Coastguard Worker             char vendor[12];
53*c0909341SAndroid Build Coastguard Worker         };
54*c0909341SAndroid Build Coastguard Worker     } cpu;
55*c0909341SAndroid Build Coastguard Worker     dav1d_cpu_cpuid(&cpu.r, 0, 0);
56*c0909341SAndroid Build Coastguard Worker     unsigned flags = dav1d_get_default_cpu_flags();
57*c0909341SAndroid Build Coastguard Worker 
58*c0909341SAndroid Build Coastguard Worker     if (cpu.max_leaf >= 1) {
59*c0909341SAndroid Build Coastguard Worker         CpuidRegisters r;
60*c0909341SAndroid Build Coastguard Worker         dav1d_cpu_cpuid(&r, 1, 0);
61*c0909341SAndroid Build Coastguard Worker         const unsigned family = ((r.eax >> 8) & 0x0f) + ((r.eax >> 20) & 0xff);
62*c0909341SAndroid Build Coastguard Worker 
63*c0909341SAndroid Build Coastguard Worker         if (X(r.edx, 0x06008000)) /* CMOV/SSE/SSE2 */ {
64*c0909341SAndroid Build Coastguard Worker             flags |= DAV1D_X86_CPU_FLAG_SSE2;
65*c0909341SAndroid Build Coastguard Worker             if (X(r.ecx, 0x00000201)) /* SSE3/SSSE3 */ {
66*c0909341SAndroid Build Coastguard Worker                 flags |= DAV1D_X86_CPU_FLAG_SSSE3;
67*c0909341SAndroid Build Coastguard Worker                 if (X(r.ecx, 0x00080000)) /* SSE4.1 */
68*c0909341SAndroid Build Coastguard Worker                     flags |= DAV1D_X86_CPU_FLAG_SSE41;
69*c0909341SAndroid Build Coastguard Worker             }
70*c0909341SAndroid Build Coastguard Worker         }
71*c0909341SAndroid Build Coastguard Worker #if ARCH_X86_64
72*c0909341SAndroid Build Coastguard Worker         /* We only support >128-bit SIMD on x86-64. */
73*c0909341SAndroid Build Coastguard Worker         if (X(r.ecx, 0x18000000)) /* OSXSAVE/AVX */ {
74*c0909341SAndroid Build Coastguard Worker             const uint64_t xcr0 = dav1d_cpu_xgetbv(0);
75*c0909341SAndroid Build Coastguard Worker             if (X(xcr0, 0x00000006)) /* XMM/YMM */ {
76*c0909341SAndroid Build Coastguard Worker                 if (cpu.max_leaf >= 7) {
77*c0909341SAndroid Build Coastguard Worker                     dav1d_cpu_cpuid(&r, 7, 0);
78*c0909341SAndroid Build Coastguard Worker                     if (X(r.ebx, 0x00000128)) /* BMI1/BMI2/AVX2 */ {
79*c0909341SAndroid Build Coastguard Worker                         flags |= DAV1D_X86_CPU_FLAG_AVX2;
80*c0909341SAndroid Build Coastguard Worker                         if (X(xcr0, 0x000000e0)) /* ZMM/OPMASK */ {
81*c0909341SAndroid Build Coastguard Worker                             if (X(r.ebx, 0xd0230000) && X(r.ecx, 0x00005f42))
82*c0909341SAndroid Build Coastguard Worker                                 flags |= DAV1D_X86_CPU_FLAG_AVX512ICL;
83*c0909341SAndroid Build Coastguard Worker                         }
84*c0909341SAndroid Build Coastguard Worker                     }
85*c0909341SAndroid Build Coastguard Worker                 }
86*c0909341SAndroid Build Coastguard Worker             }
87*c0909341SAndroid Build Coastguard Worker         }
88*c0909341SAndroid Build Coastguard Worker #endif
89*c0909341SAndroid Build Coastguard Worker         if (!memcmp(cpu.vendor, "AuthenticAMD", sizeof(cpu.vendor))) {
90*c0909341SAndroid Build Coastguard Worker             if ((flags & DAV1D_X86_CPU_FLAG_AVX2) && family <= 0x19) {
91*c0909341SAndroid Build Coastguard Worker                 /* Excavator, Zen, Zen+, Zen 2, Zen 3, Zen 3+, Zen 4 */
92*c0909341SAndroid Build Coastguard Worker                 flags |= DAV1D_X86_CPU_FLAG_SLOW_GATHER;
93*c0909341SAndroid Build Coastguard Worker             }
94*c0909341SAndroid Build Coastguard Worker         }
95*c0909341SAndroid Build Coastguard Worker     }
96*c0909341SAndroid Build Coastguard Worker 
97*c0909341SAndroid Build Coastguard Worker     return flags;
98*c0909341SAndroid Build Coastguard Worker }
99