xref: /aosp_15_r20/external/libdav1d/src/arm/cpu.c (revision c09093415860a1c2373dacd84c4fde00c507cdfd)
1*c0909341SAndroid Build Coastguard Worker /*
2*c0909341SAndroid Build Coastguard Worker  * Copyright © 2018, VideoLAN and dav1d authors
3*c0909341SAndroid Build Coastguard Worker  * Copyright © 2018, Janne Grunau
4*c0909341SAndroid Build Coastguard Worker  * All rights reserved.
5*c0909341SAndroid Build Coastguard Worker  *
6*c0909341SAndroid Build Coastguard Worker  * Redistribution and use in source and binary forms, with or without
7*c0909341SAndroid Build Coastguard Worker  * modification, are permitted provided that the following conditions are met:
8*c0909341SAndroid Build Coastguard Worker  *
9*c0909341SAndroid Build Coastguard Worker  * 1. Redistributions of source code must retain the above copyright notice, this
10*c0909341SAndroid Build Coastguard Worker  *    list of conditions and the following disclaimer.
11*c0909341SAndroid Build Coastguard Worker  *
12*c0909341SAndroid Build Coastguard Worker  * 2. Redistributions in binary form must reproduce the above copyright notice,
13*c0909341SAndroid Build Coastguard Worker  *    this list of conditions and the following disclaimer in the documentation
14*c0909341SAndroid Build Coastguard Worker  *    and/or other materials provided with the distribution.
15*c0909341SAndroid Build Coastguard Worker  *
16*c0909341SAndroid Build Coastguard Worker  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17*c0909341SAndroid Build Coastguard Worker  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18*c0909341SAndroid Build Coastguard Worker  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19*c0909341SAndroid Build Coastguard Worker  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
20*c0909341SAndroid Build Coastguard Worker  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21*c0909341SAndroid Build Coastguard Worker  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22*c0909341SAndroid Build Coastguard Worker  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23*c0909341SAndroid Build Coastguard Worker  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24*c0909341SAndroid Build Coastguard Worker  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25*c0909341SAndroid Build Coastguard Worker  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26*c0909341SAndroid Build Coastguard Worker  */
27*c0909341SAndroid Build Coastguard Worker 
28*c0909341SAndroid Build Coastguard Worker #include "config.h"
29*c0909341SAndroid Build Coastguard Worker 
30*c0909341SAndroid Build Coastguard Worker #include "common/attributes.h"
31*c0909341SAndroid Build Coastguard Worker 
32*c0909341SAndroid Build Coastguard Worker #include "src/cpu.h"
33*c0909341SAndroid Build Coastguard Worker #include "src/arm/cpu.h"
34*c0909341SAndroid Build Coastguard Worker 
35*c0909341SAndroid Build Coastguard Worker #if HAVE_GETAUXVAL || HAVE_ELF_AUX_INFO
36*c0909341SAndroid Build Coastguard Worker #include <sys/auxv.h>
37*c0909341SAndroid Build Coastguard Worker 
38*c0909341SAndroid Build Coastguard Worker #if ARCH_AARCH64
39*c0909341SAndroid Build Coastguard Worker 
40*c0909341SAndroid Build Coastguard Worker #define HWCAP_AARCH64_ASIMDDP (1 << 20)
41*c0909341SAndroid Build Coastguard Worker #define HWCAP_AARCH64_SVE     (1 << 22)
42*c0909341SAndroid Build Coastguard Worker #define HWCAP2_AARCH64_SVE2   (1 << 1)
43*c0909341SAndroid Build Coastguard Worker #define HWCAP2_AARCH64_I8MM   (1 << 13)
44*c0909341SAndroid Build Coastguard Worker 
dav1d_get_cpu_flags_arm(void)45*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_arm(void) {
46*c0909341SAndroid Build Coastguard Worker #if HAVE_GETAUXVAL
47*c0909341SAndroid Build Coastguard Worker     unsigned long hw_cap = getauxval(AT_HWCAP);
48*c0909341SAndroid Build Coastguard Worker     unsigned long hw_cap2 = getauxval(AT_HWCAP2);
49*c0909341SAndroid Build Coastguard Worker #else
50*c0909341SAndroid Build Coastguard Worker     unsigned long hw_cap = 0;
51*c0909341SAndroid Build Coastguard Worker     unsigned long hw_cap2 = 0;
52*c0909341SAndroid Build Coastguard Worker     elf_aux_info(AT_HWCAP, &hw_cap, sizeof(hw_cap));
53*c0909341SAndroid Build Coastguard Worker     elf_aux_info(AT_HWCAP2, &hw_cap2, sizeof(hw_cap2));
54*c0909341SAndroid Build Coastguard Worker #endif
55*c0909341SAndroid Build Coastguard Worker 
56*c0909341SAndroid Build Coastguard Worker     unsigned flags = dav1d_get_default_cpu_flags();
57*c0909341SAndroid Build Coastguard Worker     flags |= (hw_cap & HWCAP_AARCH64_ASIMDDP) ? DAV1D_ARM_CPU_FLAG_DOTPROD : 0;
58*c0909341SAndroid Build Coastguard Worker     flags |= (hw_cap2 & HWCAP2_AARCH64_I8MM) ? DAV1D_ARM_CPU_FLAG_I8MM : 0;
59*c0909341SAndroid Build Coastguard Worker     flags |= (hw_cap & HWCAP_AARCH64_SVE) ? DAV1D_ARM_CPU_FLAG_SVE : 0;
60*c0909341SAndroid Build Coastguard Worker     flags |= (hw_cap2 & HWCAP2_AARCH64_SVE2) ? DAV1D_ARM_CPU_FLAG_SVE2 : 0;
61*c0909341SAndroid Build Coastguard Worker     return flags;
62*c0909341SAndroid Build Coastguard Worker }
63*c0909341SAndroid Build Coastguard Worker #else  /* !ARCH_AARCH64 */
64*c0909341SAndroid Build Coastguard Worker 
65*c0909341SAndroid Build Coastguard Worker #ifndef HWCAP_ARM_NEON
66*c0909341SAndroid Build Coastguard Worker #define HWCAP_ARM_NEON    (1 << 12)
67*c0909341SAndroid Build Coastguard Worker #endif
68*c0909341SAndroid Build Coastguard Worker #define HWCAP_ARM_ASIMDDP (1 << 24)
69*c0909341SAndroid Build Coastguard Worker #define HWCAP_ARM_I8MM    (1 << 27)
70*c0909341SAndroid Build Coastguard Worker 
dav1d_get_cpu_flags_arm(void)71*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_arm(void) {
72*c0909341SAndroid Build Coastguard Worker #if HAVE_GETAUXVAL
73*c0909341SAndroid Build Coastguard Worker     unsigned long hw_cap = getauxval(AT_HWCAP);
74*c0909341SAndroid Build Coastguard Worker #else
75*c0909341SAndroid Build Coastguard Worker     unsigned long hw_cap = 0;
76*c0909341SAndroid Build Coastguard Worker     elf_aux_info(AT_HWCAP, &hw_cap, sizeof(hw_cap));
77*c0909341SAndroid Build Coastguard Worker #endif
78*c0909341SAndroid Build Coastguard Worker 
79*c0909341SAndroid Build Coastguard Worker     unsigned flags = dav1d_get_default_cpu_flags();
80*c0909341SAndroid Build Coastguard Worker     flags |= (hw_cap & HWCAP_ARM_NEON) ? DAV1D_ARM_CPU_FLAG_NEON : 0;
81*c0909341SAndroid Build Coastguard Worker     flags |= (hw_cap & HWCAP_ARM_ASIMDDP) ? DAV1D_ARM_CPU_FLAG_DOTPROD : 0;
82*c0909341SAndroid Build Coastguard Worker     flags |= (hw_cap & HWCAP_ARM_I8MM) ? DAV1D_ARM_CPU_FLAG_I8MM : 0;
83*c0909341SAndroid Build Coastguard Worker     return flags;
84*c0909341SAndroid Build Coastguard Worker }
85*c0909341SAndroid Build Coastguard Worker #endif /* ARCH_AARCH64 */
86*c0909341SAndroid Build Coastguard Worker 
87*c0909341SAndroid Build Coastguard Worker #elif defined(__APPLE__)
88*c0909341SAndroid Build Coastguard Worker #include <sys/sysctl.h>
89*c0909341SAndroid Build Coastguard Worker 
have_feature(const char * feature)90*c0909341SAndroid Build Coastguard Worker static int have_feature(const char *feature) {
91*c0909341SAndroid Build Coastguard Worker     int supported = 0;
92*c0909341SAndroid Build Coastguard Worker     size_t size = sizeof(supported);
93*c0909341SAndroid Build Coastguard Worker     if (sysctlbyname(feature, &supported, &size, NULL, 0) != 0) {
94*c0909341SAndroid Build Coastguard Worker         return 0;
95*c0909341SAndroid Build Coastguard Worker     }
96*c0909341SAndroid Build Coastguard Worker     return supported;
97*c0909341SAndroid Build Coastguard Worker }
98*c0909341SAndroid Build Coastguard Worker 
dav1d_get_cpu_flags_arm(void)99*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_arm(void) {
100*c0909341SAndroid Build Coastguard Worker     unsigned flags = dav1d_get_default_cpu_flags();
101*c0909341SAndroid Build Coastguard Worker     if (have_feature("hw.optional.arm.FEAT_DotProd"))
102*c0909341SAndroid Build Coastguard Worker         flags |= DAV1D_ARM_CPU_FLAG_DOTPROD;
103*c0909341SAndroid Build Coastguard Worker     if (have_feature("hw.optional.arm.FEAT_I8MM"))
104*c0909341SAndroid Build Coastguard Worker         flags |= DAV1D_ARM_CPU_FLAG_I8MM;
105*c0909341SAndroid Build Coastguard Worker     /* No SVE and SVE2 feature detection available on Apple platforms. */
106*c0909341SAndroid Build Coastguard Worker     return flags;
107*c0909341SAndroid Build Coastguard Worker }
108*c0909341SAndroid Build Coastguard Worker 
109*c0909341SAndroid Build Coastguard Worker #elif defined(__OpenBSD__) && ARCH_AARCH64
110*c0909341SAndroid Build Coastguard Worker #include <machine/armreg.h>
111*c0909341SAndroid Build Coastguard Worker #include <machine/cpu.h>
112*c0909341SAndroid Build Coastguard Worker #include <sys/types.h>
113*c0909341SAndroid Build Coastguard Worker #include <sys/sysctl.h>
114*c0909341SAndroid Build Coastguard Worker 
dav1d_get_cpu_flags_arm(void)115*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_arm(void) {
116*c0909341SAndroid Build Coastguard Worker      unsigned flags = dav1d_get_default_cpu_flags();
117*c0909341SAndroid Build Coastguard Worker 
118*c0909341SAndroid Build Coastguard Worker #ifdef CPU_ID_AA64ISAR0
119*c0909341SAndroid Build Coastguard Worker      int mib[2];
120*c0909341SAndroid Build Coastguard Worker      uint64_t isar0;
121*c0909341SAndroid Build Coastguard Worker      uint64_t isar1;
122*c0909341SAndroid Build Coastguard Worker      size_t len;
123*c0909341SAndroid Build Coastguard Worker 
124*c0909341SAndroid Build Coastguard Worker      mib[0] = CTL_MACHDEP;
125*c0909341SAndroid Build Coastguard Worker      mib[1] = CPU_ID_AA64ISAR0;
126*c0909341SAndroid Build Coastguard Worker      len = sizeof(isar0);
127*c0909341SAndroid Build Coastguard Worker      if (sysctl(mib, 2, &isar0, &len, NULL, 0) != -1) {
128*c0909341SAndroid Build Coastguard Worker          if (ID_AA64ISAR0_DP(isar0) >= ID_AA64ISAR0_DP_IMPL)
129*c0909341SAndroid Build Coastguard Worker              flags |= DAV1D_ARM_CPU_FLAG_DOTPROD;
130*c0909341SAndroid Build Coastguard Worker      }
131*c0909341SAndroid Build Coastguard Worker 
132*c0909341SAndroid Build Coastguard Worker      mib[0] = CTL_MACHDEP;
133*c0909341SAndroid Build Coastguard Worker      mib[1] = CPU_ID_AA64ISAR1;
134*c0909341SAndroid Build Coastguard Worker      len = sizeof(isar1);
135*c0909341SAndroid Build Coastguard Worker      if (sysctl(mib, 2, &isar1, &len, NULL, 0) != -1) {
136*c0909341SAndroid Build Coastguard Worker #ifdef ID_AA64ISAR1_I8MM_IMPL
137*c0909341SAndroid Build Coastguard Worker          if (ID_AA64ISAR1_I8MM(isar1) >= ID_AA64ISAR1_I8MM_IMPL)
138*c0909341SAndroid Build Coastguard Worker              flags |= DAV1D_ARM_CPU_FLAG_I8MM;
139*c0909341SAndroid Build Coastguard Worker #endif
140*c0909341SAndroid Build Coastguard Worker      }
141*c0909341SAndroid Build Coastguard Worker #endif
142*c0909341SAndroid Build Coastguard Worker 
143*c0909341SAndroid Build Coastguard Worker      return flags;
144*c0909341SAndroid Build Coastguard Worker }
145*c0909341SAndroid Build Coastguard Worker 
146*c0909341SAndroid Build Coastguard Worker #elif defined(_WIN32)
147*c0909341SAndroid Build Coastguard Worker #include <windows.h>
148*c0909341SAndroid Build Coastguard Worker 
dav1d_get_cpu_flags_arm(void)149*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_arm(void) {
150*c0909341SAndroid Build Coastguard Worker     unsigned flags = dav1d_get_default_cpu_flags();
151*c0909341SAndroid Build Coastguard Worker #ifdef PF_ARM_V82_DP_INSTRUCTIONS_AVAILABLE
152*c0909341SAndroid Build Coastguard Worker     if (IsProcessorFeaturePresent(PF_ARM_V82_DP_INSTRUCTIONS_AVAILABLE))
153*c0909341SAndroid Build Coastguard Worker         flags |= DAV1D_ARM_CPU_FLAG_DOTPROD;
154*c0909341SAndroid Build Coastguard Worker #endif
155*c0909341SAndroid Build Coastguard Worker #ifdef PF_ARM_SVE_INSTRUCTIONS_AVAILABLE
156*c0909341SAndroid Build Coastguard Worker     if (IsProcessorFeaturePresent(PF_ARM_SVE_INSTRUCTIONS_AVAILABLE))
157*c0909341SAndroid Build Coastguard Worker         flags |= DAV1D_ARM_CPU_FLAG_SVE;
158*c0909341SAndroid Build Coastguard Worker #endif
159*c0909341SAndroid Build Coastguard Worker #ifdef PF_ARM_SVE2_INSTRUCTIONS_AVAILABLE
160*c0909341SAndroid Build Coastguard Worker     if (IsProcessorFeaturePresent(PF_ARM_SVE2_INSTRUCTIONS_AVAILABLE))
161*c0909341SAndroid Build Coastguard Worker         flags |= DAV1D_ARM_CPU_FLAG_SVE2;
162*c0909341SAndroid Build Coastguard Worker #endif
163*c0909341SAndroid Build Coastguard Worker #ifdef PF_ARM_SVE_I8MM_INSTRUCTIONS_AVAILABLE
164*c0909341SAndroid Build Coastguard Worker     /* There's no PF_* flag that indicates whether plain I8MM is available
165*c0909341SAndroid Build Coastguard Worker      * or not. But if SVE_I8MM is available, that also implies that
166*c0909341SAndroid Build Coastguard Worker      * regular I8MM is available. */
167*c0909341SAndroid Build Coastguard Worker     if (IsProcessorFeaturePresent(PF_ARM_SVE_I8MM_INSTRUCTIONS_AVAILABLE))
168*c0909341SAndroid Build Coastguard Worker         flags |= DAV1D_ARM_CPU_FLAG_I8MM;
169*c0909341SAndroid Build Coastguard Worker #endif
170*c0909341SAndroid Build Coastguard Worker     return flags;
171*c0909341SAndroid Build Coastguard Worker }
172*c0909341SAndroid Build Coastguard Worker 
173*c0909341SAndroid Build Coastguard Worker #elif defined(__ANDROID__)
174*c0909341SAndroid Build Coastguard Worker #include <ctype.h>
175*c0909341SAndroid Build Coastguard Worker #include <stdio.h>
176*c0909341SAndroid Build Coastguard Worker #include <string.h>
177*c0909341SAndroid Build Coastguard Worker 
parse_proc_cpuinfo(const char * flag)178*c0909341SAndroid Build Coastguard Worker static unsigned parse_proc_cpuinfo(const char *flag) {
179*c0909341SAndroid Build Coastguard Worker     FILE *file = fopen("/proc/cpuinfo", "r");
180*c0909341SAndroid Build Coastguard Worker     if (!file)
181*c0909341SAndroid Build Coastguard Worker         return 0;
182*c0909341SAndroid Build Coastguard Worker 
183*c0909341SAndroid Build Coastguard Worker     char line_buffer[120];
184*c0909341SAndroid Build Coastguard Worker     const char *line;
185*c0909341SAndroid Build Coastguard Worker 
186*c0909341SAndroid Build Coastguard Worker     size_t flaglen = strlen(flag);
187*c0909341SAndroid Build Coastguard Worker     while ((line = fgets(line_buffer, sizeof(line_buffer), file))) {
188*c0909341SAndroid Build Coastguard Worker         // check all occurances as whole words
189*c0909341SAndroid Build Coastguard Worker         const char *found = line;
190*c0909341SAndroid Build Coastguard Worker         while ((found = strstr(found, flag))) {
191*c0909341SAndroid Build Coastguard Worker             if ((found == line_buffer || !isgraph(found[-1])) &&
192*c0909341SAndroid Build Coastguard Worker                 (isspace(found[flaglen]) || feof(file))) {
193*c0909341SAndroid Build Coastguard Worker                 fclose(file);
194*c0909341SAndroid Build Coastguard Worker                 return 1;
195*c0909341SAndroid Build Coastguard Worker             }
196*c0909341SAndroid Build Coastguard Worker             found += flaglen;
197*c0909341SAndroid Build Coastguard Worker         }
198*c0909341SAndroid Build Coastguard Worker         // if line is incomplete seek back to avoid splitting the search
199*c0909341SAndroid Build Coastguard Worker         // string into two buffers
200*c0909341SAndroid Build Coastguard Worker         if (!strchr(line, '\n') && strlen(line) > flaglen) {
201*c0909341SAndroid Build Coastguard Worker             // use fseek since the 64 bit fseeko is only available since
202*c0909341SAndroid Build Coastguard Worker             // Android API level 24 and meson defines _FILE_OFFSET_BITS
203*c0909341SAndroid Build Coastguard Worker             // by default 64
204*c0909341SAndroid Build Coastguard Worker             if (fseek(file, -flaglen, SEEK_CUR))
205*c0909341SAndroid Build Coastguard Worker                 break;
206*c0909341SAndroid Build Coastguard Worker         }
207*c0909341SAndroid Build Coastguard Worker     }
208*c0909341SAndroid Build Coastguard Worker 
209*c0909341SAndroid Build Coastguard Worker     fclose(file);
210*c0909341SAndroid Build Coastguard Worker 
211*c0909341SAndroid Build Coastguard Worker     return 0;
212*c0909341SAndroid Build Coastguard Worker }
213*c0909341SAndroid Build Coastguard Worker 
dav1d_get_cpu_flags_arm(void)214*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_arm(void) {
215*c0909341SAndroid Build Coastguard Worker     unsigned flags = dav1d_get_default_cpu_flags();
216*c0909341SAndroid Build Coastguard Worker     flags |= parse_proc_cpuinfo("neon") ? DAV1D_ARM_CPU_FLAG_NEON : 0;
217*c0909341SAndroid Build Coastguard Worker     flags |= parse_proc_cpuinfo("asimd") ? DAV1D_ARM_CPU_FLAG_NEON : 0;
218*c0909341SAndroid Build Coastguard Worker     flags |= parse_proc_cpuinfo("asimddp") ? DAV1D_ARM_CPU_FLAG_DOTPROD : 0;
219*c0909341SAndroid Build Coastguard Worker     flags |= parse_proc_cpuinfo("i8mm") ? DAV1D_ARM_CPU_FLAG_I8MM : 0;
220*c0909341SAndroid Build Coastguard Worker #if ARCH_AARCH64
221*c0909341SAndroid Build Coastguard Worker     flags |= parse_proc_cpuinfo("sve") ? DAV1D_ARM_CPU_FLAG_SVE : 0;
222*c0909341SAndroid Build Coastguard Worker     flags |= parse_proc_cpuinfo("sve2") ? DAV1D_ARM_CPU_FLAG_SVE2 : 0;
223*c0909341SAndroid Build Coastguard Worker #endif /* ARCH_AARCH64 */
224*c0909341SAndroid Build Coastguard Worker     return flags;
225*c0909341SAndroid Build Coastguard Worker }
226*c0909341SAndroid Build Coastguard Worker 
227*c0909341SAndroid Build Coastguard Worker #else  /* Unsupported OS */
228*c0909341SAndroid Build Coastguard Worker 
dav1d_get_cpu_flags_arm(void)229*c0909341SAndroid Build Coastguard Worker COLD unsigned dav1d_get_cpu_flags_arm(void) {
230*c0909341SAndroid Build Coastguard Worker     return dav1d_get_default_cpu_flags();
231*c0909341SAndroid Build Coastguard Worker }
232*c0909341SAndroid Build Coastguard Worker 
233*c0909341SAndroid Build Coastguard Worker #endif
234