xref: /aosp_15_r20/external/libopus/celt/x86/x86cpu.c (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1 /* Copyright (c) 2014, Cisco Systems, INC
2    Written by XiangMingZhu WeiZhou MinPeng YanWang
3 
4    Redistribution and use in source and binary forms, with or without
5    modification, are permitted provided that the following conditions
6    are met:
7 
8    - Redistributions of source code must retain the above copyright
9    notice, this list of conditions and the following disclaimer.
10 
11    - Redistributions in binary form must reproduce the above copyright
12    notice, this list of conditions and the following disclaimer in the
13    documentation and/or other materials provided with the distribution.
14 
15    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
18    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
19    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
23    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
24    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26 */
27 
28 #ifdef HAVE_CONFIG_H
29 #include "config.h"
30 #endif
31 
32 #include "cpu_support.h"
33 #include "macros.h"
34 #include "main.h"
35 #include "pitch.h"
36 #include "x86cpu.h"
37 
38 #if defined(OPUS_HAVE_RTCD) && \
39   ((defined(OPUS_X86_MAY_HAVE_SSE) && !defined(OPUS_X86_PRESUME_SSE)) || \
40   (defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(OPUS_X86_PRESUME_SSE2)) || \
41   (defined(OPUS_X86_MAY_HAVE_SSE4_1) && !defined(OPUS_X86_PRESUME_SSE4_1)) || \
42   (defined(OPUS_X86_MAY_HAVE_AVX2) && !defined(OPUS_X86_PRESUME_AVX2)))
43 
44 #if defined(_MSC_VER)
45 
46 #include <intrin.h>
cpuid(unsigned int CPUInfo[4],unsigned int InfoType)47 static _inline void cpuid(unsigned int CPUInfo[4], unsigned int InfoType)
48 {
49     __cpuid((int*)CPUInfo, InfoType);
50 }
51 
52 #else
53 
54 #if defined(CPU_INFO_BY_C)
55 #include <cpuid.h>
56 #endif
57 
cpuid(unsigned int CPUInfo[4],unsigned int InfoType)58 static void cpuid(unsigned int CPUInfo[4], unsigned int InfoType)
59 {
60 #if defined(CPU_INFO_BY_ASM)
61 #if defined(__i386__) && defined(__PIC__)
62 /* %ebx is PIC register in 32-bit, so mustn't clobber it. */
63     __asm__ __volatile__ (
64         "xchg %%ebx, %1\n"
65         "cpuid\n"
66         "xchg %%ebx, %1\n":
67         "=a" (CPUInfo[0]),
68         "=r" (CPUInfo[1]),
69         "=c" (CPUInfo[2]),
70         "=d" (CPUInfo[3]) :
71         /* We clear ECX to avoid a valgrind false-positive prior to v3.17.0. */
72         "0" (InfoType), "2" (0)
73     );
74 #else
75     __asm__ __volatile__ (
76         "cpuid":
77         "=a" (CPUInfo[0]),
78         "=b" (CPUInfo[1]),
79         "=c" (CPUInfo[2]),
80         "=d" (CPUInfo[3]) :
81         /* We clear ECX to avoid a valgrind false-positive prior to v3.17.0. */
82         "0" (InfoType), "2" (0)
83     );
84 #endif
85 #elif defined(CPU_INFO_BY_C)
86     /* We use __get_cpuid_count to clear ECX to avoid a valgrind false-positive
87         prior to v3.17.0.*/
88     if (!__get_cpuid_count(InfoType, 0, &(CPUInfo[0]), &(CPUInfo[1]), &(CPUInfo[2]), &(CPUInfo[3]))) {
89         /* Our function cannot fail, but __get_cpuid{_count} can.
90            Returning all zeroes will effectively disable all SIMD, which is
91             what we want on CPUs that don't support CPUID. */
92         CPUInfo[3] = CPUInfo[2] = CPUInfo[1] = CPUInfo[0] = 0;
93     }
94 #else
95 # error "Configured to use x86 RTCD, but no CPU detection method available. " \
96  "Reconfigure with --disable-rtcd (or send patches)."
97 #endif
98 }
99 
100 #endif
101 
102 typedef struct CPU_Feature{
103     /*  SIMD: 128-bit */
104     int HW_SSE;
105     int HW_SSE2;
106     int HW_SSE41;
107     /*  SIMD: 256-bit */
108     int HW_AVX2;
109 } CPU_Feature;
110 
opus_cpu_feature_check(CPU_Feature * cpu_feature)111 static void opus_cpu_feature_check(CPU_Feature *cpu_feature)
112 {
113     unsigned int info[4];
114     unsigned int nIds = 0;
115 
116     cpuid(info, 0);
117     nIds = info[0];
118 
119     if (nIds >= 1){
120         cpuid(info, 1);
121         cpu_feature->HW_SSE = (info[3] & (1 << 25)) != 0;
122         cpu_feature->HW_SSE2 = (info[3] & (1 << 26)) != 0;
123         cpu_feature->HW_SSE41 = (info[2] & (1 << 19)) != 0;
124         cpu_feature->HW_AVX2 = (info[2] & (1 << 28)) != 0 && (info[2] & (1 << 12)) != 0;
125         if (cpu_feature->HW_AVX2 && nIds >= 7) {
126             cpuid(info, 7);
127             cpu_feature->HW_AVX2 = cpu_feature->HW_AVX2 && (info[1] & (1 << 5)) != 0;
128         } else {
129             cpu_feature->HW_AVX2 = 0;
130         }
131     }
132     else {
133         cpu_feature->HW_SSE = 0;
134         cpu_feature->HW_SSE2 = 0;
135         cpu_feature->HW_SSE41 = 0;
136         cpu_feature->HW_AVX2 = 0;
137     }
138 }
139 
opus_select_arch_impl(void)140 static int opus_select_arch_impl(void)
141 {
142     CPU_Feature cpu_feature;
143     int arch;
144 
145     opus_cpu_feature_check(&cpu_feature);
146 
147     arch = 0;
148     if (!cpu_feature.HW_SSE)
149     {
150        return arch;
151     }
152     arch++;
153 
154     if (!cpu_feature.HW_SSE2)
155     {
156        return arch;
157     }
158     arch++;
159 
160     if (!cpu_feature.HW_SSE41)
161     {
162         return arch;
163     }
164     arch++;
165 
166     if (!cpu_feature.HW_AVX2)
167     {
168         return arch;
169     }
170     arch++;
171 
172     return arch;
173 }
174 
opus_select_arch(void)175 int opus_select_arch(void) {
176     int arch = opus_select_arch_impl();
177 #ifdef FUZZING
178     /* Randomly downgrade the architecture. */
179     arch = rand()%(arch+1);
180 #endif
181     return arch;
182 }
183 
184 #endif
185