1*c0909341SAndroid Build Coastguard Worker /*
2*c0909341SAndroid Build Coastguard Worker * Copyright © 2018, VideoLAN and dav1d authors
3*c0909341SAndroid Build Coastguard Worker * Copyright © 2018, Two Orioles, LLC
4*c0909341SAndroid Build Coastguard Worker * All rights reserved.
5*c0909341SAndroid Build Coastguard Worker *
6*c0909341SAndroid Build Coastguard Worker * Redistribution and use in source and binary forms, with or without
7*c0909341SAndroid Build Coastguard Worker * modification, are permitted provided that the following conditions are met:
8*c0909341SAndroid Build Coastguard Worker *
9*c0909341SAndroid Build Coastguard Worker * 1. Redistributions of source code must retain the above copyright notice, this
10*c0909341SAndroid Build Coastguard Worker * list of conditions and the following disclaimer.
11*c0909341SAndroid Build Coastguard Worker *
12*c0909341SAndroid Build Coastguard Worker * 2. Redistributions in binary form must reproduce the above copyright notice,
13*c0909341SAndroid Build Coastguard Worker * this list of conditions and the following disclaimer in the documentation
14*c0909341SAndroid Build Coastguard Worker * and/or other materials provided with the distribution.
15*c0909341SAndroid Build Coastguard Worker *
16*c0909341SAndroid Build Coastguard Worker * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17*c0909341SAndroid Build Coastguard Worker * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18*c0909341SAndroid Build Coastguard Worker * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19*c0909341SAndroid Build Coastguard Worker * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
20*c0909341SAndroid Build Coastguard Worker * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21*c0909341SAndroid Build Coastguard Worker * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22*c0909341SAndroid Build Coastguard Worker * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23*c0909341SAndroid Build Coastguard Worker * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24*c0909341SAndroid Build Coastguard Worker * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25*c0909341SAndroid Build Coastguard Worker * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26*c0909341SAndroid Build Coastguard Worker */
27*c0909341SAndroid Build Coastguard Worker
28*c0909341SAndroid Build Coastguard Worker #include "config.h"
29*c0909341SAndroid Build Coastguard Worker
30*c0909341SAndroid Build Coastguard Worker #include <stdint.h>
31*c0909341SAndroid Build Coastguard Worker #include <string.h>
32*c0909341SAndroid Build Coastguard Worker
33*c0909341SAndroid Build Coastguard Worker #include "common/attributes.h"
34*c0909341SAndroid Build Coastguard Worker
35*c0909341SAndroid Build Coastguard Worker #include "src/cpu.h"
36*c0909341SAndroid Build Coastguard Worker #include "src/x86/cpu.h"
37*c0909341SAndroid Build Coastguard Worker
/*
 * Output registers of a single CPUID query.
 *
 * The member order (eax, ebx, edx, ecx) is significant:
 * dav1d_get_cpu_flags_x86() overlays this struct with
 * { uint32_t max_leaf; char vendor[12]; }, so eax lines up with max_leaf and
 * ebx, edx, ecx (in that order) line up with the 12 vendor bytes.
 */
typedef struct {
    uint32_t eax;
    uint32_t ebx;
    uint32_t edx;
    uint32_t ecx;
} CpuidRegisters;
41*c0909341SAndroid Build Coastguard Worker
/*
 * Queries CPUID for the given leaf/subleaf and writes the resulting registers
 * to *regs. Only declared here; the definition lives outside this file
 * (NOTE(review): presumably in the x86 assembly sources - confirm).
 */
void dav1d_cpu_cpuid(CpuidRegisters *regs, unsigned leaf, unsigned subleaf);
/*
 * Returns the 64-bit value of extended control register `xcr`. In this file it
 * is only called with xcr = 0, and only after CPUID leaf 1 reported
 * OSXSAVE/AVX. Defined outside this file as well.
 */
uint64_t dav1d_cpu_xgetbv(unsigned xcr);
44*c0909341SAndroid Build Coastguard Worker
/*
 * Non-zero iff every bit set in `bits` is also set in `value`.
 * `bits` is expanded twice, so pass side-effect-free expressions only.
 */
#define X(value, bits) ((bits) == ((value) & (bits)))
46*c0909341SAndroid Build Coastguard Worker
dav1d_get_cpu_flags_x86(void)47*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_x86(void) {
48*c0909341SAndroid Build Coastguard Worker union {
49*c0909341SAndroid Build Coastguard Worker CpuidRegisters r;
50*c0909341SAndroid Build Coastguard Worker struct {
51*c0909341SAndroid Build Coastguard Worker uint32_t max_leaf;
52*c0909341SAndroid Build Coastguard Worker char vendor[12];
53*c0909341SAndroid Build Coastguard Worker };
54*c0909341SAndroid Build Coastguard Worker } cpu;
55*c0909341SAndroid Build Coastguard Worker dav1d_cpu_cpuid(&cpu.r, 0, 0);
56*c0909341SAndroid Build Coastguard Worker unsigned flags = dav1d_get_default_cpu_flags();
57*c0909341SAndroid Build Coastguard Worker
58*c0909341SAndroid Build Coastguard Worker if (cpu.max_leaf >= 1) {
59*c0909341SAndroid Build Coastguard Worker CpuidRegisters r;
60*c0909341SAndroid Build Coastguard Worker dav1d_cpu_cpuid(&r, 1, 0);
61*c0909341SAndroid Build Coastguard Worker const unsigned family = ((r.eax >> 8) & 0x0f) + ((r.eax >> 20) & 0xff);
62*c0909341SAndroid Build Coastguard Worker
63*c0909341SAndroid Build Coastguard Worker if (X(r.edx, 0x06008000)) /* CMOV/SSE/SSE2 */ {
64*c0909341SAndroid Build Coastguard Worker flags |= DAV1D_X86_CPU_FLAG_SSE2;
65*c0909341SAndroid Build Coastguard Worker if (X(r.ecx, 0x00000201)) /* SSE3/SSSE3 */ {
66*c0909341SAndroid Build Coastguard Worker flags |= DAV1D_X86_CPU_FLAG_SSSE3;
67*c0909341SAndroid Build Coastguard Worker if (X(r.ecx, 0x00080000)) /* SSE4.1 */
68*c0909341SAndroid Build Coastguard Worker flags |= DAV1D_X86_CPU_FLAG_SSE41;
69*c0909341SAndroid Build Coastguard Worker }
70*c0909341SAndroid Build Coastguard Worker }
71*c0909341SAndroid Build Coastguard Worker #if ARCH_X86_64
72*c0909341SAndroid Build Coastguard Worker /* We only support >128-bit SIMD on x86-64. */
73*c0909341SAndroid Build Coastguard Worker if (X(r.ecx, 0x18000000)) /* OSXSAVE/AVX */ {
74*c0909341SAndroid Build Coastguard Worker const uint64_t xcr0 = dav1d_cpu_xgetbv(0);
75*c0909341SAndroid Build Coastguard Worker if (X(xcr0, 0x00000006)) /* XMM/YMM */ {
76*c0909341SAndroid Build Coastguard Worker if (cpu.max_leaf >= 7) {
77*c0909341SAndroid Build Coastguard Worker dav1d_cpu_cpuid(&r, 7, 0);
78*c0909341SAndroid Build Coastguard Worker if (X(r.ebx, 0x00000128)) /* BMI1/BMI2/AVX2 */ {
79*c0909341SAndroid Build Coastguard Worker flags |= DAV1D_X86_CPU_FLAG_AVX2;
80*c0909341SAndroid Build Coastguard Worker if (X(xcr0, 0x000000e0)) /* ZMM/OPMASK */ {
81*c0909341SAndroid Build Coastguard Worker if (X(r.ebx, 0xd0230000) && X(r.ecx, 0x00005f42))
82*c0909341SAndroid Build Coastguard Worker flags |= DAV1D_X86_CPU_FLAG_AVX512ICL;
83*c0909341SAndroid Build Coastguard Worker }
84*c0909341SAndroid Build Coastguard Worker }
85*c0909341SAndroid Build Coastguard Worker }
86*c0909341SAndroid Build Coastguard Worker }
87*c0909341SAndroid Build Coastguard Worker }
88*c0909341SAndroid Build Coastguard Worker #endif
89*c0909341SAndroid Build Coastguard Worker if (!memcmp(cpu.vendor, "AuthenticAMD", sizeof(cpu.vendor))) {
90*c0909341SAndroid Build Coastguard Worker if ((flags & DAV1D_X86_CPU_FLAG_AVX2) && family <= 0x19) {
91*c0909341SAndroid Build Coastguard Worker /* Excavator, Zen, Zen+, Zen 2, Zen 3, Zen 3+, Zen 4 */
92*c0909341SAndroid Build Coastguard Worker flags |= DAV1D_X86_CPU_FLAG_SLOW_GATHER;
93*c0909341SAndroid Build Coastguard Worker }
94*c0909341SAndroid Build Coastguard Worker }
95*c0909341SAndroid Build Coastguard Worker }
96*c0909341SAndroid Build Coastguard Worker
97*c0909341SAndroid Build Coastguard Worker return flags;
98*c0909341SAndroid Build Coastguard Worker }
99