xref: /aosp_15_r20/external/llvm/test/CodeGen/X86/fma_patterns.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; NOTE: Assertions have been autogenerated by update_llc_test_checks.py
2*9880d681SAndroid Build Coastguard Worker; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
3*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx,+fma -fp-contract=fast | FileCheck %s --check-prefix=ALL --check-prefix=FMA
4*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx,+fma4,+fma -fp-contract=fast | FileCheck %s --check-prefix=ALL --check-prefix=FMA4
5*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx,+fma4 -fp-contract=fast | FileCheck %s --check-prefix=ALL --check-prefix=FMA4
6*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx512dq,+avx512vl -fp-contract=fast | FileCheck %s --check-prefix=ALL --check-prefix=AVX512
7*9880d681SAndroid Build Coastguard Worker
8*9880d681SAndroid Build Coastguard Worker;
9*9880d681SAndroid Build Coastguard Worker; Pattern: (fadd (fmul x, y), z) -> (fmadd x,y,z)
10*9880d681SAndroid Build Coastguard Worker;
11*9880d681SAndroid Build Coastguard Worker
12*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_fmadd(float %a0, float %a1, float %a2) {
13*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_fmadd:
14*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
15*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ss %xmm2, %xmm1, %xmm0
16*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
17*9880d681SAndroid Build Coastguard Worker;
18*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_fmadd:
19*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
20*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddss %xmm2, %xmm1, %xmm0, %xmm0
21*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
22*9880d681SAndroid Build Coastguard Worker;
23*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_fmadd:
24*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
25*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ss %xmm2, %xmm0, %xmm1
26*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
27*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
28*9880d681SAndroid Build Coastguard Worker  %x = fmul float %a0, %a1
29*9880d681SAndroid Build Coastguard Worker  %res = fadd float %x, %a2
30*9880d681SAndroid Build Coastguard Worker  ret float %res
31*9880d681SAndroid Build Coastguard Worker}
32*9880d681SAndroid Build Coastguard Worker
33*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fmadd(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) {
34*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fmadd:
35*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
36*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ps %xmm2, %xmm1, %xmm0
37*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
38*9880d681SAndroid Build Coastguard Worker;
39*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fmadd:
40*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
41*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %xmm2, %xmm1, %xmm0, %xmm0
42*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
43*9880d681SAndroid Build Coastguard Worker;
44*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fmadd:
45*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
46*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %xmm2, %xmm1, %xmm0
47*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
48*9880d681SAndroid Build Coastguard Worker  %x = fmul <4 x float> %a0, %a1
49*9880d681SAndroid Build Coastguard Worker  %res = fadd <4 x float> %x, %a2
50*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %res
51*9880d681SAndroid Build Coastguard Worker}
52*9880d681SAndroid Build Coastguard Worker
53*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_8f32_fmadd(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) {
54*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_8f32_fmadd:
55*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
56*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ps %ymm2, %ymm1, %ymm0
57*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
58*9880d681SAndroid Build Coastguard Worker;
59*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_8f32_fmadd:
60*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
61*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %ymm2, %ymm1, %ymm0, %ymm0
62*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
63*9880d681SAndroid Build Coastguard Worker;
64*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_8f32_fmadd:
65*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
66*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %ymm2, %ymm1, %ymm0
67*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
68*9880d681SAndroid Build Coastguard Worker  %x = fmul <8 x float> %a0, %a1
69*9880d681SAndroid Build Coastguard Worker  %res = fadd <8 x float> %x, %a2
70*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %res
71*9880d681SAndroid Build Coastguard Worker}
72*9880d681SAndroid Build Coastguard Worker
73*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fmadd(double %a0, double %a1, double %a2) {
74*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fmadd:
75*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
76*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213sd %xmm2, %xmm1, %xmm0
77*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
78*9880d681SAndroid Build Coastguard Worker;
79*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fmadd:
80*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
81*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddsd %xmm2, %xmm1, %xmm0, %xmm0
82*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
83*9880d681SAndroid Build Coastguard Worker;
84*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fmadd:
85*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
86*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213sd %xmm2, %xmm0, %xmm1
87*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
88*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
89*9880d681SAndroid Build Coastguard Worker  %x = fmul double %a0, %a1
90*9880d681SAndroid Build Coastguard Worker  %res = fadd double %x, %a2
91*9880d681SAndroid Build Coastguard Worker  ret double %res
92*9880d681SAndroid Build Coastguard Worker}
93*9880d681SAndroid Build Coastguard Worker
94*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fmadd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) {
95*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fmadd:
96*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
97*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213pd %xmm2, %xmm1, %xmm0
98*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
99*9880d681SAndroid Build Coastguard Worker;
100*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fmadd:
101*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
102*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddpd %xmm2, %xmm1, %xmm0, %xmm0
103*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
104*9880d681SAndroid Build Coastguard Worker;
105*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fmadd:
106*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
107*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213pd %xmm2, %xmm1, %xmm0
108*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
109*9880d681SAndroid Build Coastguard Worker  %x = fmul <2 x double> %a0, %a1
110*9880d681SAndroid Build Coastguard Worker  %res = fadd <2 x double> %x, %a2
111*9880d681SAndroid Build Coastguard Worker  ret <2 x double> %res
112*9880d681SAndroid Build Coastguard Worker}
113*9880d681SAndroid Build Coastguard Worker
114*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_4f64_fmadd(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) {
115*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f64_fmadd:
116*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
117*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213pd %ymm2, %ymm1, %ymm0
118*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
119*9880d681SAndroid Build Coastguard Worker;
120*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f64_fmadd:
121*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
122*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddpd %ymm2, %ymm1, %ymm0, %ymm0
123*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
124*9880d681SAndroid Build Coastguard Worker;
125*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f64_fmadd:
126*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
127*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213pd %ymm2, %ymm1, %ymm0
128*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
129*9880d681SAndroid Build Coastguard Worker  %x = fmul <4 x double> %a0, %a1
130*9880d681SAndroid Build Coastguard Worker  %res = fadd <4 x double> %x, %a2
131*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %res
132*9880d681SAndroid Build Coastguard Worker}
133*9880d681SAndroid Build Coastguard Worker
134*9880d681SAndroid Build Coastguard Worker;
135*9880d681SAndroid Build Coastguard Worker; Pattern: (fsub (fmul x, y), z) -> (fmsub x, y, z)
136*9880d681SAndroid Build Coastguard Worker;
137*9880d681SAndroid Build Coastguard Worker
138*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_fmsub(float %a0, float %a1, float %a2) {
139*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_fmsub:
140*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
141*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213ss %xmm2, %xmm1, %xmm0
142*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
143*9880d681SAndroid Build Coastguard Worker;
144*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_fmsub:
145*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
146*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubss %xmm2, %xmm1, %xmm0, %xmm0
147*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
148*9880d681SAndroid Build Coastguard Worker;
149*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_fmsub:
150*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
151*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213ss %xmm2, %xmm0, %xmm1
152*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
153*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
154*9880d681SAndroid Build Coastguard Worker  %x = fmul float %a0, %a1
155*9880d681SAndroid Build Coastguard Worker  %res = fsub float %x, %a2
156*9880d681SAndroid Build Coastguard Worker  ret float %res
157*9880d681SAndroid Build Coastguard Worker}
158*9880d681SAndroid Build Coastguard Worker
159*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fmsub(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) {
160*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fmsub:
161*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
162*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213ps %xmm2, %xmm1, %xmm0
163*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
164*9880d681SAndroid Build Coastguard Worker;
165*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fmsub:
166*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
167*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubps %xmm2, %xmm1, %xmm0, %xmm0
168*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
169*9880d681SAndroid Build Coastguard Worker;
170*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fmsub:
171*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
172*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213ps %xmm2, %xmm1, %xmm0
173*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
174*9880d681SAndroid Build Coastguard Worker  %x = fmul <4 x float> %a0, %a1
175*9880d681SAndroid Build Coastguard Worker  %res = fsub <4 x float> %x, %a2
176*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %res
177*9880d681SAndroid Build Coastguard Worker}
178*9880d681SAndroid Build Coastguard Worker
179*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_8f32_fmsub(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) {
180*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_8f32_fmsub:
181*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
182*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213ps %ymm2, %ymm1, %ymm0
183*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
184*9880d681SAndroid Build Coastguard Worker;
185*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_8f32_fmsub:
186*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
187*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubps %ymm2, %ymm1, %ymm0, %ymm0
188*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
189*9880d681SAndroid Build Coastguard Worker;
190*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_8f32_fmsub:
191*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
192*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213ps %ymm2, %ymm1, %ymm0
193*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
194*9880d681SAndroid Build Coastguard Worker  %x = fmul <8 x float> %a0, %a1
195*9880d681SAndroid Build Coastguard Worker  %res = fsub <8 x float> %x, %a2
196*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %res
197*9880d681SAndroid Build Coastguard Worker}
198*9880d681SAndroid Build Coastguard Worker
199*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fmsub(double %a0, double %a1, double %a2) {
200*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fmsub:
201*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
202*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213sd %xmm2, %xmm1, %xmm0
203*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
204*9880d681SAndroid Build Coastguard Worker;
205*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fmsub:
206*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
207*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubsd %xmm2, %xmm1, %xmm0, %xmm0
208*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
209*9880d681SAndroid Build Coastguard Worker;
210*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fmsub:
211*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
212*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213sd %xmm2, %xmm0, %xmm1
213*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
214*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
215*9880d681SAndroid Build Coastguard Worker  %x = fmul double %a0, %a1
216*9880d681SAndroid Build Coastguard Worker  %res = fsub double %x, %a2
217*9880d681SAndroid Build Coastguard Worker  ret double %res
218*9880d681SAndroid Build Coastguard Worker}
219*9880d681SAndroid Build Coastguard Worker
220*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fmsub(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) {
221*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fmsub:
222*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
223*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213pd %xmm2, %xmm1, %xmm0
224*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
225*9880d681SAndroid Build Coastguard Worker;
226*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fmsub:
227*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
228*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubpd %xmm2, %xmm1, %xmm0, %xmm0
229*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
230*9880d681SAndroid Build Coastguard Worker;
231*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fmsub:
232*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
233*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213pd %xmm2, %xmm1, %xmm0
234*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
235*9880d681SAndroid Build Coastguard Worker  %x = fmul <2 x double> %a0, %a1
236*9880d681SAndroid Build Coastguard Worker  %res = fsub <2 x double> %x, %a2
237*9880d681SAndroid Build Coastguard Worker  ret <2 x double> %res
238*9880d681SAndroid Build Coastguard Worker}
239*9880d681SAndroid Build Coastguard Worker
240*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_4f64_fmsub(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) {
241*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f64_fmsub:
242*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
243*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213pd %ymm2, %ymm1, %ymm0
244*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
245*9880d681SAndroid Build Coastguard Worker;
246*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f64_fmsub:
247*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
248*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubpd %ymm2, %ymm1, %ymm0, %ymm0
249*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
250*9880d681SAndroid Build Coastguard Worker;
251*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f64_fmsub:
252*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
253*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213pd %ymm2, %ymm1, %ymm0
254*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
255*9880d681SAndroid Build Coastguard Worker  %x = fmul <4 x double> %a0, %a1
256*9880d681SAndroid Build Coastguard Worker  %res = fsub <4 x double> %x, %a2
257*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %res
258*9880d681SAndroid Build Coastguard Worker}
259*9880d681SAndroid Build Coastguard Worker
260*9880d681SAndroid Build Coastguard Worker;
261*9880d681SAndroid Build Coastguard Worker; Pattern: (fsub z, (fmul x, y)) -> (fnmadd x, y, z)
262*9880d681SAndroid Build Coastguard Worker;
263*9880d681SAndroid Build Coastguard Worker
264*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_fnmadd(float %a0, float %a1, float %a2) {
265*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_fnmadd:
266*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
267*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213ss %xmm2, %xmm1, %xmm0
268*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
269*9880d681SAndroid Build Coastguard Worker;
270*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_fnmadd:
271*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
272*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddss %xmm2, %xmm1, %xmm0, %xmm0
273*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
274*9880d681SAndroid Build Coastguard Worker;
275*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_fnmadd:
276*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
277*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213ss %xmm2, %xmm0, %xmm1
278*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
279*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
280*9880d681SAndroid Build Coastguard Worker  %x = fmul float %a0, %a1
281*9880d681SAndroid Build Coastguard Worker  %res = fsub float %a2, %x
282*9880d681SAndroid Build Coastguard Worker  ret float %res
283*9880d681SAndroid Build Coastguard Worker}
284*9880d681SAndroid Build Coastguard Worker
285*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fnmadd(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) {
286*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fnmadd:
287*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
288*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213ps %xmm2, %xmm1, %xmm0
289*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
290*9880d681SAndroid Build Coastguard Worker;
291*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fnmadd:
292*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
293*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddps %xmm2, %xmm1, %xmm0, %xmm0
294*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
295*9880d681SAndroid Build Coastguard Worker;
296*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fnmadd:
297*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
298*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213ps %xmm2, %xmm1, %xmm0
299*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
300*9880d681SAndroid Build Coastguard Worker  %x = fmul <4 x float> %a0, %a1
301*9880d681SAndroid Build Coastguard Worker  %res = fsub <4 x float> %a2, %x
302*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %res
303*9880d681SAndroid Build Coastguard Worker}
304*9880d681SAndroid Build Coastguard Worker
305*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_8f32_fnmadd(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) {
306*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_8f32_fnmadd:
307*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
308*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213ps %ymm2, %ymm1, %ymm0
309*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
310*9880d681SAndroid Build Coastguard Worker;
311*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_8f32_fnmadd:
312*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
313*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddps %ymm2, %ymm1, %ymm0, %ymm0
314*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
315*9880d681SAndroid Build Coastguard Worker;
316*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_8f32_fnmadd:
317*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
318*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213ps %ymm2, %ymm1, %ymm0
319*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
320*9880d681SAndroid Build Coastguard Worker  %x = fmul <8 x float> %a0, %a1
321*9880d681SAndroid Build Coastguard Worker  %res = fsub <8 x float> %a2, %x
322*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %res
323*9880d681SAndroid Build Coastguard Worker}
324*9880d681SAndroid Build Coastguard Worker
325*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fnmadd(double %a0, double %a1, double %a2) {
326*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fnmadd:
327*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
328*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213sd %xmm2, %xmm1, %xmm0
329*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
330*9880d681SAndroid Build Coastguard Worker;
331*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fnmadd:
332*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
333*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddsd %xmm2, %xmm1, %xmm0, %xmm0
334*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
335*9880d681SAndroid Build Coastguard Worker;
336*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fnmadd:
337*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
338*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213sd %xmm2, %xmm0, %xmm1
339*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
340*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
341*9880d681SAndroid Build Coastguard Worker  %x = fmul double %a0, %a1
342*9880d681SAndroid Build Coastguard Worker  %res = fsub double %a2, %x
343*9880d681SAndroid Build Coastguard Worker  ret double %res
344*9880d681SAndroid Build Coastguard Worker}
345*9880d681SAndroid Build Coastguard Worker
346*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fnmadd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) {
347*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fnmadd:
348*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
349*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213pd %xmm2, %xmm1, %xmm0
350*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
351*9880d681SAndroid Build Coastguard Worker;
352*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fnmadd:
353*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
354*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddpd %xmm2, %xmm1, %xmm0, %xmm0
355*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
356*9880d681SAndroid Build Coastguard Worker;
357*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fnmadd:
358*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
359*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213pd %xmm2, %xmm1, %xmm0
360*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
361*9880d681SAndroid Build Coastguard Worker  %x = fmul <2 x double> %a0, %a1
362*9880d681SAndroid Build Coastguard Worker  %res = fsub <2 x double> %a2, %x
363*9880d681SAndroid Build Coastguard Worker  ret <2 x double> %res
364*9880d681SAndroid Build Coastguard Worker}
365*9880d681SAndroid Build Coastguard Worker
366*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_4f64_fnmadd(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) {
367*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f64_fnmadd:
368*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
369*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213pd %ymm2, %ymm1, %ymm0
370*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
371*9880d681SAndroid Build Coastguard Worker;
372*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f64_fnmadd:
373*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
374*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddpd %ymm2, %ymm1, %ymm0, %ymm0
375*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
376*9880d681SAndroid Build Coastguard Worker;
377*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f64_fnmadd:
378*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
379*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213pd %ymm2, %ymm1, %ymm0
380*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
381*9880d681SAndroid Build Coastguard Worker  %x = fmul <4 x double> %a0, %a1
382*9880d681SAndroid Build Coastguard Worker  %res = fsub <4 x double> %a2, %x
383*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %res
384*9880d681SAndroid Build Coastguard Worker}
385*9880d681SAndroid Build Coastguard Worker
386*9880d681SAndroid Build Coastguard Worker;
387*9880d681SAndroid Build Coastguard Worker; Pattern: (fsub (fneg (fmul x, y)), z) -> (fnmsub x, y, z)
388*9880d681SAndroid Build Coastguard Worker;
389*9880d681SAndroid Build Coastguard Worker
390*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_fnmsub(float %a0, float %a1, float %a2) {
391*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_fnmsub:
392*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
393*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213ss %xmm2, %xmm1, %xmm0
394*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
395*9880d681SAndroid Build Coastguard Worker;
396*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_fnmsub:
397*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
398*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubss %xmm2, %xmm1, %xmm0, %xmm0
399*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
400*9880d681SAndroid Build Coastguard Worker;
401*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_fnmsub:
402*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
403*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213ss %xmm2, %xmm0, %xmm1
404*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
405*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
406*9880d681SAndroid Build Coastguard Worker  %x = fmul float %a0, %a1
407*9880d681SAndroid Build Coastguard Worker  %y = fsub float -0.000000e+00, %x
408*9880d681SAndroid Build Coastguard Worker  %res = fsub float %y, %a2
409*9880d681SAndroid Build Coastguard Worker  ret float %res
410*9880d681SAndroid Build Coastguard Worker}
411*9880d681SAndroid Build Coastguard Worker
412*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fnmsub(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) {
413*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fnmsub:
414*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
415*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213ps %xmm2, %xmm1, %xmm0
416*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
417*9880d681SAndroid Build Coastguard Worker;
418*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fnmsub:
419*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
420*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubps %xmm2, %xmm1, %xmm0, %xmm0
421*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
422*9880d681SAndroid Build Coastguard Worker;
423*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fnmsub:
424*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
425*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213ps %xmm2, %xmm1, %xmm0
426*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
427*9880d681SAndroid Build Coastguard Worker  %x = fmul <4 x float> %a0, %a1
428*9880d681SAndroid Build Coastguard Worker  %y = fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %x
429*9880d681SAndroid Build Coastguard Worker  %res = fsub <4 x float> %y, %a2
430*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %res
431*9880d681SAndroid Build Coastguard Worker}
432*9880d681SAndroid Build Coastguard Worker
433*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_8f32_fnmsub(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) {
434*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_8f32_fnmsub:
435*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
436*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213ps %ymm2, %ymm1, %ymm0
437*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
438*9880d681SAndroid Build Coastguard Worker;
439*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_8f32_fnmsub:
440*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
441*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubps %ymm2, %ymm1, %ymm0, %ymm0
442*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
443*9880d681SAndroid Build Coastguard Worker;
444*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_8f32_fnmsub:
445*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
446*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213ps %ymm2, %ymm1, %ymm0
447*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
448*9880d681SAndroid Build Coastguard Worker  %x = fmul <8 x float> %a0, %a1
449*9880d681SAndroid Build Coastguard Worker  %y = fsub <8 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %x
450*9880d681SAndroid Build Coastguard Worker  %res = fsub <8 x float> %y, %a2
451*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %res
452*9880d681SAndroid Build Coastguard Worker}
453*9880d681SAndroid Build Coastguard Worker
454*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fnmsub(double %a0, double %a1, double %a2) {
455*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fnmsub:
456*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
457*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213sd %xmm2, %xmm1, %xmm0
458*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
459*9880d681SAndroid Build Coastguard Worker;
460*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fnmsub:
461*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
462*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubsd %xmm2, %xmm1, %xmm0, %xmm0
463*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
464*9880d681SAndroid Build Coastguard Worker;
465*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fnmsub:
466*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
467*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213sd %xmm2, %xmm0, %xmm1
468*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
469*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
470*9880d681SAndroid Build Coastguard Worker  %x = fmul double %a0, %a1
471*9880d681SAndroid Build Coastguard Worker  %y = fsub double -0.000000e+00, %x
472*9880d681SAndroid Build Coastguard Worker  %res = fsub double %y, %a2
473*9880d681SAndroid Build Coastguard Worker  ret double %res
474*9880d681SAndroid Build Coastguard Worker}
475*9880d681SAndroid Build Coastguard Worker
476*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fnmsub(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) {
477*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fnmsub:
478*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
479*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213pd %xmm2, %xmm1, %xmm0
480*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
481*9880d681SAndroid Build Coastguard Worker;
482*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fnmsub:
483*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
484*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubpd %xmm2, %xmm1, %xmm0, %xmm0
485*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
486*9880d681SAndroid Build Coastguard Worker;
487*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fnmsub:
488*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
489*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213pd %xmm2, %xmm1, %xmm0
490*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
491*9880d681SAndroid Build Coastguard Worker  %x = fmul <2 x double> %a0, %a1
492*9880d681SAndroid Build Coastguard Worker  %y = fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %x
493*9880d681SAndroid Build Coastguard Worker  %res = fsub <2 x double> %y, %a2
494*9880d681SAndroid Build Coastguard Worker  ret <2 x double> %res
495*9880d681SAndroid Build Coastguard Worker}
496*9880d681SAndroid Build Coastguard Worker
497*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_4f64_fnmsub(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) {
498*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f64_fnmsub:
499*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
500*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213pd %ymm2, %ymm1, %ymm0
501*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
502*9880d681SAndroid Build Coastguard Worker;
503*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f64_fnmsub:
504*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
505*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubpd %ymm2, %ymm1, %ymm0, %ymm0
506*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
507*9880d681SAndroid Build Coastguard Worker;
508*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f64_fnmsub:
509*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
510*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213pd %ymm2, %ymm1, %ymm0
511*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
512*9880d681SAndroid Build Coastguard Worker  %x = fmul <4 x double> %a0, %a1
513*9880d681SAndroid Build Coastguard Worker  %y = fsub <4 x double> <double -0.000000e+00, double -0.000000e+00, double -0.000000e+00, double -0.000000e+00>, %x
514*9880d681SAndroid Build Coastguard Worker  %res = fsub <4 x double> %y, %a2
515*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %res
516*9880d681SAndroid Build Coastguard Worker}
517*9880d681SAndroid Build Coastguard Worker
518*9880d681SAndroid Build Coastguard Worker;
519*9880d681SAndroid Build Coastguard Worker; Load Folding Patterns
520*9880d681SAndroid Build Coastguard Worker;
521*9880d681SAndroid Build Coastguard Worker
522*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fmadd_load(<4 x float>* %a0, <4 x float> %a1, <4 x float> %a2) {
523*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fmadd_load:
524*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
525*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd132ps (%rdi), %xmm1, %xmm0
526*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
527*9880d681SAndroid Build Coastguard Worker;
528*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fmadd_load:
529*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
530*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %xmm1, (%rdi), %xmm0, %xmm0
531*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
532*9880d681SAndroid Build Coastguard Worker;
533*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fmadd_load:
534*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
535*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps (%rdi), %xmm2
536*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %xmm1, %xmm0, %xmm2
537*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm2, %zmm0
538*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
539*9880d681SAndroid Build Coastguard Worker  %x = load <4 x float>, <4 x float>* %a0
540*9880d681SAndroid Build Coastguard Worker  %y = fmul <4 x float> %x, %a1
541*9880d681SAndroid Build Coastguard Worker  %res = fadd <4 x float> %y, %a2
542*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %res
543*9880d681SAndroid Build Coastguard Worker}
544*9880d681SAndroid Build Coastguard Worker
545*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fmsub_load(<2 x double>* %a0, <2 x double> %a1, <2 x double> %a2) {
546*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fmsub_load:
547*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
548*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub132pd (%rdi), %xmm1, %xmm0
549*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
550*9880d681SAndroid Build Coastguard Worker;
551*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fmsub_load:
552*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
553*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubpd %xmm1, (%rdi), %xmm0, %xmm0
554*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
555*9880d681SAndroid Build Coastguard Worker;
556*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fmsub_load:
557*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
558*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovapd (%rdi), %xmm2
559*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213pd %xmm1, %xmm0, %xmm2
560*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm2, %zmm0
561*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
562*9880d681SAndroid Build Coastguard Worker  %x = load <2 x double>, <2 x double>* %a0
563*9880d681SAndroid Build Coastguard Worker  %y = fmul <2 x double> %x, %a1
564*9880d681SAndroid Build Coastguard Worker  %res = fsub <2 x double> %y, %a2
565*9880d681SAndroid Build Coastguard Worker  ret <2 x double> %res
566*9880d681SAndroid Build Coastguard Worker}
567*9880d681SAndroid Build Coastguard Worker
568*9880d681SAndroid Build Coastguard Worker;
569*9880d681SAndroid Build Coastguard Worker; Patterns (+ fneg variants): mul(add(1.0,x),y), mul(sub(1.0,x),y), mul(sub(x,1.0),y)
570*9880d681SAndroid Build Coastguard Worker;
571*9880d681SAndroid Build Coastguard Worker
572*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_add_x_one_y(<4 x float> %x, <4 x float> %y) {
573*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_add_x_one_y:
574*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
575*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ps %xmm1, %xmm1, %xmm0
576*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
577*9880d681SAndroid Build Coastguard Worker;
578*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_add_x_one_y:
579*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
580*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %xmm1, %xmm1, %xmm0, %xmm0
581*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
582*9880d681SAndroid Build Coastguard Worker;
583*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_add_x_one_y:
584*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
585*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %xmm1, %xmm1, %xmm0
586*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
587*9880d681SAndroid Build Coastguard Worker  %a = fadd <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0>
588*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %a, %y
589*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
590*9880d681SAndroid Build Coastguard Worker}
591*9880d681SAndroid Build Coastguard Worker
592*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_add_x_one(<4 x float> %x, <4 x float> %y) {
593*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_add_x_one:
594*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
595*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ps %xmm1, %xmm1, %xmm0
596*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
597*9880d681SAndroid Build Coastguard Worker;
598*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_add_x_one:
599*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
600*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %xmm1, %xmm1, %xmm0, %xmm0
601*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
602*9880d681SAndroid Build Coastguard Worker;
603*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_add_x_one:
604*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
605*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %xmm1, %xmm1, %xmm0
606*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
607*9880d681SAndroid Build Coastguard Worker  %a = fadd <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0>
608*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %y, %a
609*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
610*9880d681SAndroid Build Coastguard Worker}
611*9880d681SAndroid Build Coastguard Worker
612*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_add_x_negone_y(<4 x float> %x, <4 x float> %y) {
613*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_add_x_negone_y:
614*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
615*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213ps %xmm1, %xmm1, %xmm0
616*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
617*9880d681SAndroid Build Coastguard Worker;
618*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_add_x_negone_y:
619*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
620*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubps %xmm1, %xmm1, %xmm0, %xmm0
621*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
622*9880d681SAndroid Build Coastguard Worker;
623*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_add_x_negone_y:
624*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
625*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213ps %xmm1, %xmm1, %xmm0
626*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
627*9880d681SAndroid Build Coastguard Worker  %a = fadd <4 x float> %x, <float -1.0, float -1.0, float -1.0, float -1.0>
628*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %a, %y
629*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
630*9880d681SAndroid Build Coastguard Worker}
631*9880d681SAndroid Build Coastguard Worker
632*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_add_x_negone(<4 x float> %x, <4 x float> %y) {
633*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_add_x_negone:
634*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
635*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213ps %xmm1, %xmm1, %xmm0
636*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
637*9880d681SAndroid Build Coastguard Worker;
638*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_add_x_negone:
639*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
640*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubps %xmm1, %xmm1, %xmm0, %xmm0
641*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
642*9880d681SAndroid Build Coastguard Worker;
643*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_add_x_negone:
644*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
645*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213ps %xmm1, %xmm1, %xmm0
646*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
647*9880d681SAndroid Build Coastguard Worker  %a = fadd <4 x float> %x, <float -1.0, float -1.0, float -1.0, float -1.0>
648*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %y, %a
649*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
650*9880d681SAndroid Build Coastguard Worker}
651*9880d681SAndroid Build Coastguard Worker
652*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_sub_one_x_y(<4 x float> %x, <4 x float> %y) {
653*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_sub_one_x_y:
654*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
655*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213ps %xmm1, %xmm1, %xmm0
656*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
657*9880d681SAndroid Build Coastguard Worker;
658*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_sub_one_x_y:
659*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
660*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddps %xmm1, %xmm1, %xmm0, %xmm0
661*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
662*9880d681SAndroid Build Coastguard Worker;
663*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_sub_one_x_y:
664*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
665*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213ps %xmm1, %xmm1, %xmm0
666*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
667*9880d681SAndroid Build Coastguard Worker  %s = fsub <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, %x
668*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %s, %y
669*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
670*9880d681SAndroid Build Coastguard Worker}
671*9880d681SAndroid Build Coastguard Worker
672*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_sub_one_x(<4 x float> %x, <4 x float> %y) {
673*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_sub_one_x:
674*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
675*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213ps %xmm1, %xmm1, %xmm0
676*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
677*9880d681SAndroid Build Coastguard Worker;
678*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_sub_one_x:
679*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
680*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddps %xmm1, %xmm1, %xmm0, %xmm0
681*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
682*9880d681SAndroid Build Coastguard Worker;
683*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_sub_one_x:
684*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
685*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213ps %xmm1, %xmm1, %xmm0
686*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
687*9880d681SAndroid Build Coastguard Worker  %s = fsub <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, %x
688*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %y, %s
689*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
690*9880d681SAndroid Build Coastguard Worker}
691*9880d681SAndroid Build Coastguard Worker
692*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_sub_negone_x_y(<4 x float> %x, <4 x float> %y) {
693*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_sub_negone_x_y:
694*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
695*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213ps %xmm1, %xmm1, %xmm0
696*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
697*9880d681SAndroid Build Coastguard Worker;
698*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_sub_negone_x_y:
699*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
700*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubps %xmm1, %xmm1, %xmm0, %xmm0
701*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
702*9880d681SAndroid Build Coastguard Worker;
703*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_sub_negone_x_y:
704*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
705*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213ps %xmm1, %xmm1, %xmm0
706*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
707*9880d681SAndroid Build Coastguard Worker  %s = fsub <4 x float> <float -1.0, float -1.0, float -1.0, float -1.0>, %x
708*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %s, %y
709*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
710*9880d681SAndroid Build Coastguard Worker}
711*9880d681SAndroid Build Coastguard Worker
712*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_sub_negone_x(<4 x float> %x, <4 x float> %y) {
713*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_sub_negone_x:
714*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
715*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213ps %xmm1, %xmm1, %xmm0
716*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
717*9880d681SAndroid Build Coastguard Worker;
718*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_sub_negone_x:
719*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
720*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubps %xmm1, %xmm1, %xmm0, %xmm0
721*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
722*9880d681SAndroid Build Coastguard Worker;
723*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_sub_negone_x:
724*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
725*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213ps %xmm1, %xmm1, %xmm0
726*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
727*9880d681SAndroid Build Coastguard Worker  %s = fsub <4 x float> <float -1.0, float -1.0, float -1.0, float -1.0>, %x
728*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %y, %s
729*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
730*9880d681SAndroid Build Coastguard Worker}
731*9880d681SAndroid Build Coastguard Worker
732*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_sub_x_one_y(<4 x float> %x, <4 x float> %y) {
733*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_sub_x_one_y:
734*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
735*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213ps %xmm1, %xmm1, %xmm0
736*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
737*9880d681SAndroid Build Coastguard Worker;
738*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_sub_x_one_y:
739*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
740*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubps %xmm1, %xmm1, %xmm0, %xmm0
741*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
742*9880d681SAndroid Build Coastguard Worker;
743*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_sub_x_one_y:
744*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
745*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213ps %xmm1, %xmm1, %xmm0
746*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
747*9880d681SAndroid Build Coastguard Worker  %s = fsub <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0>
748*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %s, %y
749*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
750*9880d681SAndroid Build Coastguard Worker}
751*9880d681SAndroid Build Coastguard Worker
752*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_sub_x_one(<4 x float> %x, <4 x float> %y) {
753*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_sub_x_one:
754*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
755*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213ps %xmm1, %xmm1, %xmm0
756*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
757*9880d681SAndroid Build Coastguard Worker;
758*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_sub_x_one:
759*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
760*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubps %xmm1, %xmm1, %xmm0, %xmm0
761*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
762*9880d681SAndroid Build Coastguard Worker;
763*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_sub_x_one:
764*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
765*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213ps %xmm1, %xmm1, %xmm0
766*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
767*9880d681SAndroid Build Coastguard Worker  %s = fsub <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0>
768*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %y, %s
769*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
770*9880d681SAndroid Build Coastguard Worker}
771*9880d681SAndroid Build Coastguard Worker
772*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_sub_x_negone_y(<4 x float> %x, <4 x float> %y) {
773*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_sub_x_negone_y:
774*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
775*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ps %xmm1, %xmm1, %xmm0
776*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
777*9880d681SAndroid Build Coastguard Worker;
778*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_sub_x_negone_y:
779*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
780*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %xmm1, %xmm1, %xmm0, %xmm0
781*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
782*9880d681SAndroid Build Coastguard Worker;
783*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_sub_x_negone_y:
784*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
785*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %xmm1, %xmm1, %xmm0
786*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
787*9880d681SAndroid Build Coastguard Worker  %s = fsub <4 x float> %x, <float -1.0, float -1.0, float -1.0, float -1.0>
788*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %s, %y
789*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
790*9880d681SAndroid Build Coastguard Worker}
791*9880d681SAndroid Build Coastguard Worker
792*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_sub_x_negone(<4 x float> %x, <4 x float> %y) {
793*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_sub_x_negone:
794*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
795*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ps %xmm1, %xmm1, %xmm0
796*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
797*9880d681SAndroid Build Coastguard Worker;
798*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_sub_x_negone:
799*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
800*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %xmm1, %xmm1, %xmm0, %xmm0
801*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
802*9880d681SAndroid Build Coastguard Worker;
803*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_sub_x_negone:
804*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
805*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %xmm1, %xmm1, %xmm0
806*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
807*9880d681SAndroid Build Coastguard Worker  %s = fsub <4 x float> %x, <float -1.0, float -1.0, float -1.0, float -1.0>
808*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x float> %y, %s
809*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %m
810*9880d681SAndroid Build Coastguard Worker}
811*9880d681SAndroid Build Coastguard Worker
812*9880d681SAndroid Build Coastguard Worker;
813*9880d681SAndroid Build Coastguard Worker; Interpolation Patterns: add(mul(x,t),mul(sub(1.0,t),y))
814*9880d681SAndroid Build Coastguard Worker;
815*9880d681SAndroid Build Coastguard Worker
816*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_interp(float %x, float %y, float %t) {
817*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_interp:
818*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
819*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213ss %xmm1, %xmm2, %xmm1
820*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ss %xmm1, %xmm2, %xmm0
821*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
822*9880d681SAndroid Build Coastguard Worker;
823*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_interp:
824*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
825*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddss %xmm1, %xmm1, %xmm2, %xmm1
826*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddss %xmm1, %xmm2, %xmm0, %xmm0
827*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
828*9880d681SAndroid Build Coastguard Worker;
829*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_interp:
830*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
831*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213ss %xmm1, %xmm2, %xmm1
832*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ss %xmm1, %xmm0, %xmm2
833*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm2, %zmm0
834*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
835*9880d681SAndroid Build Coastguard Worker  %t1 = fsub float 1.0, %t
836*9880d681SAndroid Build Coastguard Worker  %tx = fmul float %x, %t
837*9880d681SAndroid Build Coastguard Worker  %ty = fmul float %y, %t1
838*9880d681SAndroid Build Coastguard Worker  %r = fadd float %tx, %ty
839*9880d681SAndroid Build Coastguard Worker  ret float %r
840*9880d681SAndroid Build Coastguard Worker}
841*9880d681SAndroid Build Coastguard Worker
842*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_interp(<4 x float> %x, <4 x float> %y, <4 x float> %t) {
843*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_interp:
844*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
845*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213ps %xmm1, %xmm2, %xmm1
846*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ps %xmm1, %xmm2, %xmm0
847*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
848*9880d681SAndroid Build Coastguard Worker;
849*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_interp:
850*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
851*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddps %xmm1, %xmm1, %xmm2, %xmm1
852*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %xmm1, %xmm2, %xmm0, %xmm0
853*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
854*9880d681SAndroid Build Coastguard Worker;
855*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_interp:
856*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
857*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm2, %zmm3
858*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213ps %xmm1, %xmm1, %xmm3
859*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %xmm3, %xmm2, %xmm0
860*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
861*9880d681SAndroid Build Coastguard Worker  %t1 = fsub <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, %t
862*9880d681SAndroid Build Coastguard Worker  %tx = fmul <4 x float> %x, %t
863*9880d681SAndroid Build Coastguard Worker  %ty = fmul <4 x float> %y, %t1
864*9880d681SAndroid Build Coastguard Worker  %r = fadd <4 x float> %tx, %ty
865*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %r
866*9880d681SAndroid Build Coastguard Worker}
867*9880d681SAndroid Build Coastguard Worker
868*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_v8f32_interp(<8 x float> %x, <8 x float> %y, <8 x float> %t) {
869*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v8f32_interp:
870*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
871*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213ps %ymm1, %ymm2, %ymm1
872*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213ps %ymm1, %ymm2, %ymm0
873*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
874*9880d681SAndroid Build Coastguard Worker;
875*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v8f32_interp:
876*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
877*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddps %ymm1, %ymm1, %ymm2, %ymm1
878*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %ymm1, %ymm2, %ymm0, %ymm0
879*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
880*9880d681SAndroid Build Coastguard Worker;
881*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v8f32_interp:
882*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
883*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm2, %zmm3
884*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213ps %ymm1, %ymm1, %ymm3
885*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213ps %ymm3, %ymm2, %ymm0
886*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
887*9880d681SAndroid Build Coastguard Worker  %t1 = fsub <8 x float> <float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0>, %t
888*9880d681SAndroid Build Coastguard Worker  %tx = fmul <8 x float> %x, %t
889*9880d681SAndroid Build Coastguard Worker  %ty = fmul <8 x float> %y, %t1
890*9880d681SAndroid Build Coastguard Worker  %r = fadd <8 x float> %tx, %ty
891*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %r
892*9880d681SAndroid Build Coastguard Worker}
893*9880d681SAndroid Build Coastguard Worker
894*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_interp(double %x, double %y, double %t) {
895*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_interp:
896*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
897*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213sd %xmm1, %xmm2, %xmm1
898*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213sd %xmm1, %xmm2, %xmm0
899*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
900*9880d681SAndroid Build Coastguard Worker;
901*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_interp:
902*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
903*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddsd %xmm1, %xmm1, %xmm2, %xmm1
904*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddsd %xmm1, %xmm2, %xmm0, %xmm0
905*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
906*9880d681SAndroid Build Coastguard Worker;
907*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_interp:
908*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
909*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213sd %xmm1, %xmm2, %xmm1
910*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213sd %xmm1, %xmm0, %xmm2
911*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm2, %zmm0
912*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
913*9880d681SAndroid Build Coastguard Worker  %t1 = fsub double 1.0, %t
914*9880d681SAndroid Build Coastguard Worker  %tx = fmul double %x, %t
915*9880d681SAndroid Build Coastguard Worker  %ty = fmul double %y, %t1
916*9880d681SAndroid Build Coastguard Worker  %r = fadd double %tx, %ty
917*9880d681SAndroid Build Coastguard Worker  ret double %r
918*9880d681SAndroid Build Coastguard Worker}
919*9880d681SAndroid Build Coastguard Worker
920*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_v2f64_interp(<2 x double> %x, <2 x double> %y, <2 x double> %t) {
921*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v2f64_interp:
922*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
923*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213pd %xmm1, %xmm2, %xmm1
924*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213pd %xmm1, %xmm2, %xmm0
925*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
926*9880d681SAndroid Build Coastguard Worker;
927*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v2f64_interp:
928*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
929*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddpd %xmm1, %xmm1, %xmm2, %xmm1
930*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddpd %xmm1, %xmm2, %xmm0, %xmm0
931*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
932*9880d681SAndroid Build Coastguard Worker;
933*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v2f64_interp:
934*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
935*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm2, %zmm3
936*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213pd %xmm1, %xmm1, %xmm3
937*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213pd %xmm3, %xmm2, %xmm0
938*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
939*9880d681SAndroid Build Coastguard Worker  %t1 = fsub <2 x double> <double 1.0, double 1.0>, %t
940*9880d681SAndroid Build Coastguard Worker  %tx = fmul <2 x double> %x, %t
941*9880d681SAndroid Build Coastguard Worker  %ty = fmul <2 x double> %y, %t1
942*9880d681SAndroid Build Coastguard Worker  %r = fadd <2 x double> %tx, %ty
943*9880d681SAndroid Build Coastguard Worker  ret <2 x double> %r
944*9880d681SAndroid Build Coastguard Worker}
945*9880d681SAndroid Build Coastguard Worker
946*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_interp(<4 x double> %x, <4 x double> %y, <4 x double> %t) {
947*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f64_interp:
948*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
949*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213pd %ymm1, %ymm2, %ymm1
950*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213pd %ymm1, %ymm2, %ymm0
951*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
952*9880d681SAndroid Build Coastguard Worker;
953*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f64_interp:
954*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
955*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddpd %ymm1, %ymm1, %ymm2, %ymm1
956*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddpd %ymm1, %ymm2, %ymm0, %ymm0
957*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
958*9880d681SAndroid Build Coastguard Worker;
959*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f64_interp:
960*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
961*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm2, %zmm3
962*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213pd %ymm1, %ymm1, %ymm3
963*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213pd %ymm3, %ymm2, %ymm0
964*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
965*9880d681SAndroid Build Coastguard Worker  %t1 = fsub <4 x double> <double 1.0, double 1.0, double 1.0, double 1.0>, %t
966*9880d681SAndroid Build Coastguard Worker  %tx = fmul <4 x double> %x, %t
967*9880d681SAndroid Build Coastguard Worker  %ty = fmul <4 x double> %y, %t1
968*9880d681SAndroid Build Coastguard Worker  %r = fadd <4 x double> %tx, %ty
969*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %r
970*9880d681SAndroid Build Coastguard Worker}
971*9880d681SAndroid Build Coastguard Worker
972*9880d681SAndroid Build Coastguard Worker;
973*9880d681SAndroid Build Coastguard Worker; Pattern: (fneg (fma x, y, z)) -> (fma x, -y, -z)
974*9880d681SAndroid Build Coastguard Worker;
975*9880d681SAndroid Build Coastguard Worker
976*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fneg_fmadd(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) #0 {
977*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fneg_fmadd:
978*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
979*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213ps %xmm2, %xmm1, %xmm0
980*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
981*9880d681SAndroid Build Coastguard Worker;
982*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fneg_fmadd:
983*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
984*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubps %xmm2, %xmm1, %xmm0, %xmm0
985*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
986*9880d681SAndroid Build Coastguard Worker;
987*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fneg_fmadd:
988*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
989*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213ps %xmm2, %xmm1, %xmm0
990*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
991*9880d681SAndroid Build Coastguard Worker  %mul = fmul <4 x float> %a0, %a1
992*9880d681SAndroid Build Coastguard Worker  %add = fadd <4 x float> %mul, %a2
993*9880d681SAndroid Build Coastguard Worker  %neg = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %add
994*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %neg
995*9880d681SAndroid Build Coastguard Worker}
996*9880d681SAndroid Build Coastguard Worker
997*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_fneg_fmsub(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) #0 {
998*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f64_fneg_fmsub:
999*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
1000*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmadd213pd %ymm2, %ymm1, %ymm0
1001*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
1002*9880d681SAndroid Build Coastguard Worker;
1003*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f64_fneg_fmsub:
1004*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
1005*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmaddpd %ymm2, %ymm1, %ymm0, %ymm0
1006*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
1007*9880d681SAndroid Build Coastguard Worker;
1008*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f64_fneg_fmsub:
1009*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
1010*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmadd213pd %ymm2, %ymm1, %ymm0
1011*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
1012*9880d681SAndroid Build Coastguard Worker  %mul = fmul <4 x double> %a0, %a1
1013*9880d681SAndroid Build Coastguard Worker  %sub = fsub <4 x double> %mul, %a2
1014*9880d681SAndroid Build Coastguard Worker  %neg = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %sub
1015*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %neg
1016*9880d681SAndroid Build Coastguard Worker}
1017*9880d681SAndroid Build Coastguard Worker
1018*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fneg_fnmadd(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) #0 {
1019*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fneg_fnmadd:
1020*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
1021*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmsub213ps %xmm2, %xmm1, %xmm0
1022*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
1023*9880d681SAndroid Build Coastguard Worker;
1024*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fneg_fnmadd:
1025*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
1026*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmsubps %xmm2, %xmm1, %xmm0, %xmm0
1027*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
1028*9880d681SAndroid Build Coastguard Worker;
1029*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fneg_fnmadd:
1030*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
1031*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmsub213ps %xmm2, %xmm1, %xmm0
1032*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
1033*9880d681SAndroid Build Coastguard Worker  %mul = fmul <4 x float> %a0, %a1
1034*9880d681SAndroid Build Coastguard Worker  %neg0 = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %mul
1035*9880d681SAndroid Build Coastguard Worker  %add = fadd <4 x float> %neg0, %a2
1036*9880d681SAndroid Build Coastguard Worker  %neg1 = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %add
1037*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %neg1
1038*9880d681SAndroid Build Coastguard Worker}
1039*9880d681SAndroid Build Coastguard Worker
1040*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_fneg_fnmsub(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) #0 {
1041*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f64_fneg_fnmsub:
1042*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
1043*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd213pd %ymm2, %ymm1, %ymm0
1044*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
1045*9880d681SAndroid Build Coastguard Worker;
1046*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f64_fneg_fnmsub:
1047*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
1048*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddpd %ymm2, %ymm1, %ymm0, %ymm0
1049*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
1050*9880d681SAndroid Build Coastguard Worker;
1051*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f64_fneg_fnmsub:
1052*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
1053*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd213pd %ymm2, %ymm1, %ymm0
1054*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
1055*9880d681SAndroid Build Coastguard Worker  %mul = fmul <4 x double> %a0, %a1
1056*9880d681SAndroid Build Coastguard Worker  %neg0 = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %mul
1057*9880d681SAndroid Build Coastguard Worker  %sub = fsub <4 x double> %neg0, %a2
1058*9880d681SAndroid Build Coastguard Worker  %neg1 = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %sub
1059*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %neg1
1060*9880d681SAndroid Build Coastguard Worker}
1061*9880d681SAndroid Build Coastguard Worker
1062*9880d681SAndroid Build Coastguard Worker;
1063*9880d681SAndroid Build Coastguard Worker; Pattern: (fma x, c1, (fmul x, c2)) -> (fmul x, c1+c2)
1064*9880d681SAndroid Build Coastguard Worker;
1065*9880d681SAndroid Build Coastguard Worker
1066*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fma_x_c1_fmul_x_c2(<4 x float> %x) #0 {
1067*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fma_x_c1_fmul_x_c2:
1068*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
1069*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vmulps {{.*}}(%rip), %xmm0, %xmm0
1070*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
1071*9880d681SAndroid Build Coastguard Worker;
1072*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fma_x_c1_fmul_x_c2:
1073*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
1074*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vmulps {{.*}}(%rip), %xmm0, %xmm0
1075*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
1076*9880d681SAndroid Build Coastguard Worker;
1077*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fma_x_c1_fmul_x_c2:
1078*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
1079*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmulps {{.*}}(%rip){1to4}, %xmm0, %xmm0
1080*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
1081*9880d681SAndroid Build Coastguard Worker  %m0 = fmul <4 x float> %x, <float 1.0, float 2.0, float 3.0, float 4.0>
1082*9880d681SAndroid Build Coastguard Worker  %m1 = fmul <4 x float> %x, <float 4.0, float 3.0, float 2.0, float 1.0>
1083*9880d681SAndroid Build Coastguard Worker  %a  = fadd <4 x float> %m0, %m1
1084*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %a
1085*9880d681SAndroid Build Coastguard Worker}
1086*9880d681SAndroid Build Coastguard Worker
1087*9880d681SAndroid Build Coastguard Worker;
1088*9880d681SAndroid Build Coastguard Worker; Pattern: (fma (fmul x, c1), c2, y) -> (fma x, c1*c2, y)
1089*9880d681SAndroid Build Coastguard Worker;
1090*9880d681SAndroid Build Coastguard Worker
1091*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fma_fmul_x_c1_c2_y(<4 x float> %x, <4 x float> %y) #0 {
1092*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fma_fmul_x_c1_c2_y:
1093*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
1094*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfmadd132ps {{.*}}(%rip), %xmm1, %xmm0
1095*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
1096*9880d681SAndroid Build Coastguard Worker;
1097*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fma_fmul_x_c1_c2_y:
1098*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
1099*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfmaddps %xmm1, {{.*}}(%rip), %xmm0, %xmm0
1100*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
1101*9880d681SAndroid Build Coastguard Worker;
1102*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fma_fmul_x_c1_c2_y:
1103*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
1104*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfmadd231ps {{.*}}(%rip), %xmm0, %xmm1
1105*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
1106*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
1107*9880d681SAndroid Build Coastguard Worker  %m0 = fmul <4 x float> %x,  <float 1.0, float 2.0, float 3.0, float 4.0>
1108*9880d681SAndroid Build Coastguard Worker  %m1 = fmul <4 x float> %m0, <float 4.0, float 3.0, float 2.0, float 1.0>
1109*9880d681SAndroid Build Coastguard Worker  %a  = fadd <4 x float> %m1, %y
1110*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %a
1111*9880d681SAndroid Build Coastguard Worker}
1112*9880d681SAndroid Build Coastguard Worker
1113*9880d681SAndroid Build Coastguard Worker; Pattern: (fneg (fmul x, y)) -> (fnmsub x, y, 0)
1114*9880d681SAndroid Build Coastguard Worker
1115*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fneg_fmul(double %x, double %y) #0 {
1116*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fneg_fmul:
1117*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
1118*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vxorpd %xmm2, %xmm2, %xmm2
1119*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213sd %xmm2, %xmm1, %xmm0
1120*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
1121*9880d681SAndroid Build Coastguard Worker;
1122*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fneg_fmul:
1123*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
1124*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vxorpd %xmm2, %xmm2, %xmm2
1125*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubsd %xmm2, %xmm1, %xmm0, %xmm0
1126*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
1127*9880d681SAndroid Build Coastguard Worker;
1128*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fneg_fmul:
1129*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
1130*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vxorps %xmm2, %xmm2, %xmm2
1131*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213sd %xmm2, %xmm0, %xmm1
1132*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vmovaps %zmm1, %zmm0
1133*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
1134*9880d681SAndroid Build Coastguard Worker  %m = fmul nsz double %x, %y
1135*9880d681SAndroid Build Coastguard Worker  %n = fsub double -0.0, %m
1136*9880d681SAndroid Build Coastguard Worker  ret double %n
1137*9880d681SAndroid Build Coastguard Worker}
1138*9880d681SAndroid Build Coastguard Worker
1139*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fneg_fmul(<4 x float> %x, <4 x float> %y) #0 {
1140*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fneg_fmul:
1141*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
1142*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vxorps %xmm2, %xmm2, %xmm2
1143*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213ps %xmm2, %xmm1, %xmm0
1144*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
1145*9880d681SAndroid Build Coastguard Worker;
1146*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fneg_fmul:
1147*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
1148*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vxorps %xmm2, %xmm2, %xmm2
1149*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubps %xmm2, %xmm1, %xmm0, %xmm0
1150*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
1151*9880d681SAndroid Build Coastguard Worker;
1152*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fneg_fmul:
1153*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
1154*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vpxord %xmm2, %xmm2, %xmm2
1155*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213ps %xmm2, %xmm1, %xmm0
1156*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
1157*9880d681SAndroid Build Coastguard Worker  %m = fmul nsz <4 x float> %x, %y
1158*9880d681SAndroid Build Coastguard Worker  %n = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %m
1159*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %n
1160*9880d681SAndroid Build Coastguard Worker}
1161*9880d681SAndroid Build Coastguard Worker
1162*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_fneg_fmul(<4 x double> %x, <4 x double> %y) #0 {
1163*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f64_fneg_fmul:
1164*9880d681SAndroid Build Coastguard Worker; FMA:       # BB#0:
1165*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vxorpd %ymm2, %ymm2, %ymm2
1166*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    vfnmsub213pd %ymm2, %ymm1, %ymm0
1167*9880d681SAndroid Build Coastguard Worker; FMA-NEXT:    retq
1168*9880d681SAndroid Build Coastguard Worker;
1169*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f64_fneg_fmul:
1170*9880d681SAndroid Build Coastguard Worker; FMA4:       # BB#0:
1171*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vxorpd %ymm2, %ymm2, %ymm2
1172*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    vfnmsubpd %ymm2, %ymm1, %ymm0, %ymm0
1173*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT:    retq
1174*9880d681SAndroid Build Coastguard Worker;
1175*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f64_fneg_fmul:
1176*9880d681SAndroid Build Coastguard Worker; AVX512:       # BB#0:
1177*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vpxord %ymm2, %ymm2, %ymm2
1178*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    vfnmsub213pd %ymm2, %ymm1, %ymm0
1179*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT:    retq
1180*9880d681SAndroid Build Coastguard Worker  %m = fmul nsz <4 x double> %x, %y
1181*9880d681SAndroid Build Coastguard Worker  %n = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %m
1182*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %n
1183*9880d681SAndroid Build Coastguard Worker}
1184*9880d681SAndroid Build Coastguard Worker
1185*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_fneg_fmul_no_nsz(<4 x double> %x, <4 x double> %y) #0 {
1186*9880d681SAndroid Build Coastguard Worker; ALL-LABEL: test_v4f64_fneg_fmul_no_nsz:
1187*9880d681SAndroid Build Coastguard Worker; ALL:       # BB#0:
1188*9880d681SAndroid Build Coastguard Worker; ALL-NEXT:    vmulpd %ymm1, %ymm0, %ymm0
1189*9880d681SAndroid Build Coastguard Worker; ALL-NEXT:    vxorpd {{.*}}(%rip), %ymm0, %ymm0
1190*9880d681SAndroid Build Coastguard Worker; ALL-NEXT:    retq
1191*9880d681SAndroid Build Coastguard Worker  %m = fmul <4 x double> %x, %y
1192*9880d681SAndroid Build Coastguard Worker  %n = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %m
1193*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %n
1194*9880d681SAndroid Build Coastguard Worker}
1195*9880d681SAndroid Build Coastguard Worker
1196*9880d681SAndroid Build Coastguard Workerattributes #0 = { "unsafe-fp-math"="true" }
1197