1*9880d681SAndroid Build Coastguard Worker; NOTE: Assertions have been autogenerated by update_llc_test_checks.py 2*9880d681SAndroid Build Coastguard Worker; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py 3*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx,+fma -fp-contract=fast | FileCheck %s --check-prefix=ALL --check-prefix=FMA 4*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx,+fma4,+fma -fp-contract=fast | FileCheck %s --check-prefix=ALL --check-prefix=FMA4 5*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx,+fma4 -fp-contract=fast | FileCheck %s --check-prefix=ALL --check-prefix=FMA4 6*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx512dq,+avx512vl -fp-contract=fast | FileCheck %s --check-prefix=ALL --check-prefix=AVX512 7*9880d681SAndroid Build Coastguard Worker 8*9880d681SAndroid Build Coastguard Worker; 9*9880d681SAndroid Build Coastguard Worker; Pattern: (fadd (fmul x, y), z) -> (fmadd x,y,z) 10*9880d681SAndroid Build Coastguard Worker; 11*9880d681SAndroid Build Coastguard Worker 12*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_fmadd(float %a0, float %a1, float %a2) { 13*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_fmadd: 14*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 15*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ss %xmm2, %xmm1, %xmm0 16*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 17*9880d681SAndroid Build Coastguard Worker; 18*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_fmadd: 19*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 20*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddss %xmm2, %xmm1, %xmm0, %xmm0 21*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 22*9880d681SAndroid Build Coastguard Worker; 23*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_fmadd: 24*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 25*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ss %xmm2, %xmm0, %xmm1 26*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 27*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 28*9880d681SAndroid Build Coastguard Worker %x = fmul float %a0, %a1 29*9880d681SAndroid Build Coastguard Worker %res = fadd float %x, %a2 30*9880d681SAndroid Build Coastguard Worker ret float %res 31*9880d681SAndroid Build Coastguard Worker} 32*9880d681SAndroid Build Coastguard Worker 33*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fmadd(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) { 34*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fmadd: 35*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 36*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 37*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 38*9880d681SAndroid Build Coastguard Worker; 39*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fmadd: 40*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 41*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %xmm2, %xmm1, %xmm0, %xmm0 42*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 43*9880d681SAndroid Build Coastguard Worker; 44*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fmadd: 45*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 46*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %xmm2, %xmm1, %xmm0 47*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 48*9880d681SAndroid Build Coastguard Worker %x = fmul <4 x float> %a0, %a1 49*9880d681SAndroid Build Coastguard Worker %res = fadd <4 x float> %x, %a2 50*9880d681SAndroid Build Coastguard Worker ret <4 x float> %res 51*9880d681SAndroid Build Coastguard Worker} 52*9880d681SAndroid Build Coastguard Worker 53*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_8f32_fmadd(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) { 54*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_8f32_fmadd: 55*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 56*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 57*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 58*9880d681SAndroid Build Coastguard Worker; 59*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_8f32_fmadd: 60*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 61*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %ymm2, %ymm1, %ymm0, %ymm0 62*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 63*9880d681SAndroid Build Coastguard Worker; 64*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_8f32_fmadd: 65*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 66*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %ymm2, %ymm1, %ymm0 67*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 68*9880d681SAndroid Build Coastguard Worker %x = fmul <8 x float> %a0, %a1 69*9880d681SAndroid Build Coastguard Worker %res = fadd <8 x float> %x, %a2 70*9880d681SAndroid Build Coastguard Worker ret <8 x float> %res 71*9880d681SAndroid Build Coastguard Worker} 72*9880d681SAndroid Build Coastguard Worker 73*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fmadd(double %a0, double %a1, double %a2) { 74*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fmadd: 75*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 76*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 77*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 78*9880d681SAndroid Build Coastguard Worker; 79*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fmadd: 80*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 81*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddsd %xmm2, %xmm1, %xmm0, %xmm0 82*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 83*9880d681SAndroid Build Coastguard Worker; 84*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fmadd: 85*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 86*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213sd %xmm2, %xmm0, %xmm1 87*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 88*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 89*9880d681SAndroid Build Coastguard Worker %x = fmul double %a0, %a1 90*9880d681SAndroid Build Coastguard Worker %res = fadd double %x, %a2 91*9880d681SAndroid Build Coastguard Worker ret double %res 92*9880d681SAndroid Build Coastguard Worker} 93*9880d681SAndroid Build Coastguard Worker 94*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fmadd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) { 95*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fmadd: 96*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 97*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 98*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 99*9880d681SAndroid Build Coastguard Worker; 100*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fmadd: 101*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 102*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddpd %xmm2, %xmm1, %xmm0, %xmm0 103*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 104*9880d681SAndroid Build Coastguard Worker; 105*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fmadd: 106*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 107*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213pd %xmm2, %xmm1, %xmm0 108*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 109*9880d681SAndroid Build Coastguard Worker %x = fmul <2 x double> %a0, %a1 110*9880d681SAndroid Build Coastguard Worker %res = fadd <2 x double> %x, %a2 111*9880d681SAndroid Build Coastguard Worker ret <2 x double> %res 112*9880d681SAndroid Build Coastguard Worker} 113*9880d681SAndroid Build Coastguard Worker 114*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_4f64_fmadd(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) { 115*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f64_fmadd: 116*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 117*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 118*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 119*9880d681SAndroid Build Coastguard Worker; 120*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f64_fmadd: 121*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 122*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddpd %ymm2, %ymm1, %ymm0, %ymm0 123*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 124*9880d681SAndroid Build Coastguard Worker; 125*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f64_fmadd: 126*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 127*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 128*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 129*9880d681SAndroid Build Coastguard Worker %x = fmul <4 x double> %a0, %a1 130*9880d681SAndroid Build Coastguard Worker %res = fadd <4 x double> %x, %a2 131*9880d681SAndroid Build Coastguard Worker ret <4 x double> %res 132*9880d681SAndroid Build Coastguard Worker} 133*9880d681SAndroid Build Coastguard Worker 134*9880d681SAndroid Build Coastguard Worker; 135*9880d681SAndroid Build Coastguard Worker; Pattern: (fsub (fmul x, y), z) -> (fmsub x, y, z) 136*9880d681SAndroid Build Coastguard Worker; 137*9880d681SAndroid Build Coastguard Worker 138*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_fmsub(float %a0, float %a1, float %a2) { 139*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_fmsub: 140*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 141*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213ss %xmm2, %xmm1, %xmm0 142*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 143*9880d681SAndroid Build Coastguard Worker; 144*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_fmsub: 145*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 146*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubss %xmm2, %xmm1, %xmm0, %xmm0 147*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 148*9880d681SAndroid Build Coastguard Worker; 149*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_fmsub: 150*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 151*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213ss %xmm2, %xmm0, %xmm1 152*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 153*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 154*9880d681SAndroid Build Coastguard Worker %x = fmul float %a0, %a1 155*9880d681SAndroid Build Coastguard Worker %res = fsub float %x, %a2 156*9880d681SAndroid Build Coastguard Worker ret float %res 157*9880d681SAndroid Build Coastguard Worker} 158*9880d681SAndroid Build Coastguard Worker 159*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fmsub(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) { 160*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fmsub: 161*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 162*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 163*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 164*9880d681SAndroid Build Coastguard Worker; 165*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fmsub: 166*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 167*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubps %xmm2, %xmm1, %xmm0, %xmm0 168*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 169*9880d681SAndroid Build Coastguard Worker; 170*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fmsub: 171*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 172*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 173*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 174*9880d681SAndroid Build Coastguard Worker %x = fmul <4 x float> %a0, %a1 175*9880d681SAndroid Build Coastguard Worker %res = fsub <4 x float> %x, %a2 176*9880d681SAndroid Build Coastguard Worker ret <4 x float> %res 177*9880d681SAndroid Build Coastguard Worker} 178*9880d681SAndroid Build Coastguard Worker 179*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_8f32_fmsub(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) { 180*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_8f32_fmsub: 181*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 182*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 183*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 184*9880d681SAndroid Build Coastguard Worker; 185*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_8f32_fmsub: 186*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 187*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubps %ymm2, %ymm1, %ymm0, %ymm0 188*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 189*9880d681SAndroid Build Coastguard Worker; 190*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_8f32_fmsub: 191*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 192*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213ps %ymm2, %ymm1, %ymm0 193*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 194*9880d681SAndroid Build Coastguard Worker %x = fmul <8 x float> %a0, %a1 195*9880d681SAndroid Build Coastguard Worker %res = fsub <8 x float> %x, %a2 196*9880d681SAndroid Build Coastguard Worker ret <8 x float> %res 197*9880d681SAndroid Build Coastguard Worker} 198*9880d681SAndroid Build Coastguard Worker 199*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fmsub(double %a0, double %a1, double %a2) { 200*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fmsub: 201*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 202*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213sd %xmm2, %xmm1, %xmm0 203*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 204*9880d681SAndroid Build Coastguard Worker; 205*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fmsub: 206*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 207*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubsd %xmm2, %xmm1, %xmm0, %xmm0 208*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 209*9880d681SAndroid Build Coastguard Worker; 210*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fmsub: 211*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 212*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213sd %xmm2, %xmm0, %xmm1 213*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 214*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 215*9880d681SAndroid Build Coastguard Worker %x = fmul double %a0, %a1 216*9880d681SAndroid Build Coastguard Worker %res = fsub double %x, %a2 217*9880d681SAndroid Build Coastguard Worker ret double %res 218*9880d681SAndroid Build Coastguard Worker} 219*9880d681SAndroid Build Coastguard Worker 220*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fmsub(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) { 221*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fmsub: 222*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 223*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 224*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 225*9880d681SAndroid Build Coastguard Worker; 226*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fmsub: 227*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 228*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubpd %xmm2, %xmm1, %xmm0, %xmm0 229*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 230*9880d681SAndroid Build Coastguard Worker; 231*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fmsub: 232*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 233*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213pd %xmm2, %xmm1, %xmm0 234*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 235*9880d681SAndroid Build Coastguard Worker %x = fmul <2 x double> %a0, %a1 236*9880d681SAndroid Build Coastguard Worker %res = fsub <2 x double> %x, %a2 237*9880d681SAndroid Build Coastguard Worker ret <2 x double> %res 238*9880d681SAndroid Build Coastguard Worker} 239*9880d681SAndroid Build Coastguard Worker 240*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_4f64_fmsub(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) { 241*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f64_fmsub: 242*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 243*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 244*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 245*9880d681SAndroid Build Coastguard Worker; 246*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f64_fmsub: 247*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 248*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubpd %ymm2, %ymm1, %ymm0, %ymm0 249*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 250*9880d681SAndroid Build Coastguard Worker; 251*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f64_fmsub: 252*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 253*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213pd %ymm2, %ymm1, %ymm0 254*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 255*9880d681SAndroid Build Coastguard Worker %x = fmul <4 x double> %a0, %a1 256*9880d681SAndroid Build Coastguard Worker %res = fsub <4 x double> %x, %a2 257*9880d681SAndroid Build Coastguard Worker ret <4 x double> %res 258*9880d681SAndroid Build Coastguard Worker} 259*9880d681SAndroid Build Coastguard Worker 260*9880d681SAndroid Build Coastguard Worker; 261*9880d681SAndroid Build Coastguard Worker; Pattern: (fsub z, (fmul x, y)) -> (fnmadd x, y, z) 262*9880d681SAndroid Build Coastguard Worker; 263*9880d681SAndroid Build Coastguard Worker 264*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_fnmadd(float %a0, float %a1, float %a2) { 265*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_fnmadd: 266*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 267*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213ss %xmm2, %xmm1, %xmm0 268*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 269*9880d681SAndroid Build Coastguard Worker; 270*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_fnmadd: 271*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 272*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddss %xmm2, %xmm1, %xmm0, %xmm0 273*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 274*9880d681SAndroid Build Coastguard Worker; 275*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_fnmadd: 276*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 277*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213ss %xmm2, %xmm0, %xmm1 278*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 279*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 280*9880d681SAndroid Build Coastguard Worker %x = fmul float %a0, %a1 281*9880d681SAndroid Build Coastguard Worker %res = fsub float %a2, %x 282*9880d681SAndroid Build Coastguard Worker ret float %res 283*9880d681SAndroid Build Coastguard Worker} 284*9880d681SAndroid Build Coastguard Worker 285*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fnmadd(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) { 286*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fnmadd: 287*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 288*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 289*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 290*9880d681SAndroid Build Coastguard Worker; 291*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fnmadd: 292*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 293*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddps %xmm2, %xmm1, %xmm0, %xmm0 294*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 295*9880d681SAndroid Build Coastguard Worker; 296*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fnmadd: 297*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 298*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213ps %xmm2, %xmm1, %xmm0 299*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 300*9880d681SAndroid Build Coastguard Worker %x = fmul <4 x float> %a0, %a1 301*9880d681SAndroid Build Coastguard Worker %res = fsub <4 x float> %a2, %x 302*9880d681SAndroid Build Coastguard Worker ret <4 x float> %res 303*9880d681SAndroid Build Coastguard Worker} 304*9880d681SAndroid Build Coastguard Worker 305*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_8f32_fnmadd(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) { 306*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_8f32_fnmadd: 307*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 308*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 309*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 310*9880d681SAndroid Build Coastguard Worker; 311*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_8f32_fnmadd: 312*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 313*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddps %ymm2, %ymm1, %ymm0, %ymm0 314*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 315*9880d681SAndroid Build Coastguard Worker; 316*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_8f32_fnmadd: 317*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 318*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213ps %ymm2, %ymm1, %ymm0 319*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 320*9880d681SAndroid Build Coastguard Worker %x = fmul <8 x float> %a0, %a1 321*9880d681SAndroid Build Coastguard Worker %res = fsub <8 x float> %a2, %x 322*9880d681SAndroid Build Coastguard Worker ret <8 x float> %res 323*9880d681SAndroid Build Coastguard Worker} 324*9880d681SAndroid Build Coastguard Worker 325*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fnmadd(double %a0, double %a1, double %a2) { 326*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fnmadd: 327*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 328*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213sd %xmm2, %xmm1, %xmm0 329*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 330*9880d681SAndroid Build Coastguard Worker; 331*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fnmadd: 332*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 333*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddsd %xmm2, %xmm1, %xmm0, %xmm0 334*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 335*9880d681SAndroid Build Coastguard Worker; 336*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fnmadd: 337*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 338*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213sd %xmm2, %xmm0, %xmm1 339*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 340*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 341*9880d681SAndroid Build Coastguard Worker %x = fmul double %a0, %a1 342*9880d681SAndroid Build Coastguard Worker %res = fsub double %a2, %x 343*9880d681SAndroid Build Coastguard Worker ret double %res 344*9880d681SAndroid Build Coastguard Worker} 345*9880d681SAndroid Build Coastguard Worker 346*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fnmadd(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) { 347*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fnmadd: 348*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 349*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 350*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 351*9880d681SAndroid Build Coastguard Worker; 352*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fnmadd: 353*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 354*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddpd %xmm2, %xmm1, %xmm0, %xmm0 355*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 356*9880d681SAndroid Build Coastguard Worker; 357*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fnmadd: 358*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 359*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213pd %xmm2, %xmm1, %xmm0 360*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 361*9880d681SAndroid Build Coastguard Worker %x = fmul <2 x double> %a0, %a1 362*9880d681SAndroid Build Coastguard Worker %res = fsub <2 x double> %a2, %x 363*9880d681SAndroid Build Coastguard Worker ret <2 x double> %res 364*9880d681SAndroid Build Coastguard Worker} 365*9880d681SAndroid Build Coastguard Worker 366*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_4f64_fnmadd(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) { 367*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f64_fnmadd: 368*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 369*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 370*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 371*9880d681SAndroid Build Coastguard Worker; 372*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f64_fnmadd: 373*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 374*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddpd %ymm2, %ymm1, %ymm0, %ymm0 375*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 376*9880d681SAndroid Build Coastguard Worker; 377*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f64_fnmadd: 378*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 379*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 380*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 381*9880d681SAndroid Build Coastguard Worker %x = fmul <4 x double> %a0, %a1 382*9880d681SAndroid Build Coastguard Worker %res = fsub <4 x double> %a2, %x 383*9880d681SAndroid Build Coastguard Worker ret <4 x double> %res 384*9880d681SAndroid Build Coastguard Worker} 385*9880d681SAndroid Build Coastguard Worker 386*9880d681SAndroid Build Coastguard Worker; 387*9880d681SAndroid Build Coastguard Worker; Pattern: (fsub (fneg (fmul x, y)), z) -> (fnmsub x, y, z) 388*9880d681SAndroid Build Coastguard Worker; 389*9880d681SAndroid Build Coastguard Worker 390*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_fnmsub(float %a0, float %a1, float %a2) { 391*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_fnmsub: 392*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 393*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213ss %xmm2, %xmm1, %xmm0 394*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 395*9880d681SAndroid Build Coastguard Worker; 396*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_fnmsub: 397*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 398*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubss %xmm2, %xmm1, %xmm0, %xmm0 399*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 400*9880d681SAndroid Build Coastguard Worker; 401*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_fnmsub: 402*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 403*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213ss %xmm2, %xmm0, %xmm1 404*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 405*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 406*9880d681SAndroid Build Coastguard Worker %x = fmul float %a0, %a1 407*9880d681SAndroid Build Coastguard Worker %y = fsub float -0.000000e+00, %x 408*9880d681SAndroid Build Coastguard Worker %res = fsub float %y, %a2 409*9880d681SAndroid Build Coastguard Worker ret float %res 410*9880d681SAndroid Build Coastguard Worker} 411*9880d681SAndroid Build Coastguard Worker 412*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fnmsub(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) { 413*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fnmsub: 414*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 415*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 416*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 417*9880d681SAndroid Build Coastguard Worker; 418*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fnmsub: 419*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 420*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubps %xmm2, %xmm1, %xmm0, %xmm0 421*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 422*9880d681SAndroid Build Coastguard Worker; 423*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fnmsub: 424*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 425*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 426*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 427*9880d681SAndroid Build Coastguard Worker %x = fmul <4 x float> %a0, %a1 428*9880d681SAndroid Build Coastguard Worker %y = fsub <4 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %x 429*9880d681SAndroid Build Coastguard Worker %res = fsub <4 x float> %y, %a2 430*9880d681SAndroid Build Coastguard Worker ret <4 x float> %res 431*9880d681SAndroid Build Coastguard Worker} 432*9880d681SAndroid Build Coastguard Worker 433*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_8f32_fnmsub(<8 x float> %a0, <8 x float> %a1, <8 x float> %a2) { 434*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_8f32_fnmsub: 435*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 436*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 437*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 438*9880d681SAndroid Build Coastguard Worker; 439*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_8f32_fnmsub: 440*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 441*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubps %ymm2, %ymm1, %ymm0, %ymm0 442*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 443*9880d681SAndroid Build Coastguard Worker; 444*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_8f32_fnmsub: 445*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 446*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213ps %ymm2, %ymm1, %ymm0 447*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 448*9880d681SAndroid Build Coastguard Worker %x = fmul <8 x float> %a0, %a1 449*9880d681SAndroid Build Coastguard Worker %y = fsub <8 x float> <float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00, float -0.000000e+00>, %x 450*9880d681SAndroid Build Coastguard Worker %res = fsub <8 x float> %y, %a2 451*9880d681SAndroid Build Coastguard Worker ret <8 x float> %res 452*9880d681SAndroid Build Coastguard Worker} 453*9880d681SAndroid Build Coastguard Worker 454*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fnmsub(double %a0, double %a1, double %a2) { 455*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fnmsub: 456*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 457*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 458*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 459*9880d681SAndroid Build Coastguard Worker; 460*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fnmsub: 461*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 462*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubsd %xmm2, %xmm1, %xmm0, %xmm0 463*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 464*9880d681SAndroid Build Coastguard Worker; 465*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fnmsub: 466*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 467*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213sd %xmm2, %xmm0, %xmm1 468*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 469*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 470*9880d681SAndroid Build Coastguard Worker %x = fmul double %a0, %a1 471*9880d681SAndroid Build Coastguard Worker %y = fsub double -0.000000e+00, %x 472*9880d681SAndroid Build Coastguard Worker %res = fsub double %y, %a2 473*9880d681SAndroid Build Coastguard Worker ret double %res 474*9880d681SAndroid Build Coastguard Worker} 475*9880d681SAndroid Build Coastguard Worker 476*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fnmsub(<2 x double> %a0, <2 x double> %a1, <2 x double> %a2) { 477*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fnmsub: 478*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 479*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 480*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 481*9880d681SAndroid Build Coastguard Worker; 482*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fnmsub: 483*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 484*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubpd %xmm2, %xmm1, %xmm0, %xmm0 485*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 486*9880d681SAndroid Build Coastguard Worker; 487*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fnmsub: 488*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 489*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213pd %xmm2, %xmm1, %xmm0 490*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 491*9880d681SAndroid Build Coastguard Worker %x = fmul <2 x double> %a0, %a1 492*9880d681SAndroid Build Coastguard Worker %y = fsub <2 x double> <double -0.000000e+00, double -0.000000e+00>, %x 493*9880d681SAndroid Build Coastguard Worker %res = fsub <2 x double> %y, %a2 494*9880d681SAndroid Build Coastguard Worker ret <2 x double> %res 495*9880d681SAndroid Build Coastguard Worker} 496*9880d681SAndroid Build Coastguard Worker 497*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_4f64_fnmsub(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) { 498*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f64_fnmsub: 499*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 500*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 501*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 502*9880d681SAndroid Build Coastguard Worker; 503*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f64_fnmsub: 504*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 505*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubpd %ymm2, %ymm1, %ymm0, %ymm0 506*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 507*9880d681SAndroid Build Coastguard Worker; 508*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f64_fnmsub: 509*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 510*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 511*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 512*9880d681SAndroid Build Coastguard Worker %x = fmul <4 x double> %a0, %a1 513*9880d681SAndroid Build Coastguard Worker %y = fsub <4 x double> <double -0.000000e+00, double -0.000000e+00, double -0.000000e+00, double -0.000000e+00>, %x 514*9880d681SAndroid Build Coastguard Worker %res = fsub <4 x double> %y, %a2 515*9880d681SAndroid Build Coastguard Worker ret <4 x double> %res 516*9880d681SAndroid Build Coastguard Worker} 517*9880d681SAndroid Build Coastguard Worker 518*9880d681SAndroid Build Coastguard Worker; 519*9880d681SAndroid Build Coastguard Worker; Load Folding Patterns 520*9880d681SAndroid Build Coastguard Worker; 521*9880d681SAndroid Build Coastguard Worker 522*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_4f32_fmadd_load(<4 x float>* %a0, <4 x float> %a1, <4 x float> %a2) { 523*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_4f32_fmadd_load: 524*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 525*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd132ps (%rdi), %xmm1, %xmm0 526*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 527*9880d681SAndroid Build Coastguard Worker; 528*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_4f32_fmadd_load: 529*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 530*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %xmm1, (%rdi), %xmm0, %xmm0 531*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 532*9880d681SAndroid Build Coastguard Worker; 533*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_4f32_fmadd_load: 534*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 535*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps (%rdi), %xmm2 536*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %xmm1, %xmm0, %xmm2 537*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm2, %zmm0 538*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 539*9880d681SAndroid Build Coastguard Worker %x = load <4 x float>, <4 x float>* %a0 540*9880d681SAndroid Build Coastguard Worker %y = fmul <4 x float> %x, %a1 541*9880d681SAndroid Build Coastguard Worker %res = fadd <4 x float> %y, %a2 542*9880d681SAndroid Build Coastguard Worker ret <4 x float> %res 543*9880d681SAndroid Build Coastguard Worker} 544*9880d681SAndroid Build Coastguard Worker 545*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_2f64_fmsub_load(<2 x double>* %a0, <2 x double> %a1, <2 x double> %a2) { 546*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_2f64_fmsub_load: 547*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 548*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub132pd (%rdi), %xmm1, %xmm0 549*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 550*9880d681SAndroid Build Coastguard Worker; 551*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_2f64_fmsub_load: 552*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 553*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubpd %xmm1, (%rdi), %xmm0, %xmm0 554*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 555*9880d681SAndroid Build Coastguard Worker; 556*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_2f64_fmsub_load: 557*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 558*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovapd (%rdi), %xmm2 559*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213pd %xmm1, %xmm0, %xmm2 560*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm2, %zmm0 561*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 562*9880d681SAndroid Build Coastguard Worker %x = load <2 x double>, <2 x double>* %a0 563*9880d681SAndroid Build Coastguard Worker %y = fmul <2 x double> %x, %a1 564*9880d681SAndroid Build Coastguard Worker %res = fsub <2 x double> %y, %a2 565*9880d681SAndroid Build Coastguard Worker ret <2 x double> %res 566*9880d681SAndroid Build Coastguard Worker} 567*9880d681SAndroid Build Coastguard Worker 568*9880d681SAndroid Build Coastguard Worker; 569*9880d681SAndroid Build Coastguard Worker; Patterns (+ fneg variants): mul(add(1.0,x),y), mul(sub(1.0,x),y), mul(sub(x,1.0),y) 570*9880d681SAndroid Build Coastguard Worker; 571*9880d681SAndroid Build Coastguard Worker 572*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_add_x_one_y(<4 x float> %x, <4 x float> %y) { 573*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_add_x_one_y: 574*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 575*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ps %xmm1, %xmm1, %xmm0 576*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 577*9880d681SAndroid Build Coastguard Worker; 578*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_add_x_one_y: 579*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 580*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %xmm1, %xmm1, %xmm0, %xmm0 581*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 582*9880d681SAndroid Build Coastguard Worker; 583*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_add_x_one_y: 584*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 585*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %xmm1, %xmm1, %xmm0 586*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 587*9880d681SAndroid Build Coastguard Worker %a = fadd <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0> 588*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %a, %y 589*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 590*9880d681SAndroid Build Coastguard Worker} 591*9880d681SAndroid Build Coastguard Worker 592*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_add_x_one(<4 x float> %x, <4 x float> %y) { 593*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_add_x_one: 594*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 595*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ps %xmm1, %xmm1, %xmm0 596*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 597*9880d681SAndroid Build Coastguard Worker; 598*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_add_x_one: 599*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 600*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %xmm1, %xmm1, %xmm0, %xmm0 601*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 602*9880d681SAndroid Build Coastguard Worker; 603*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_add_x_one: 604*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 605*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %xmm1, %xmm1, %xmm0 606*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 607*9880d681SAndroid Build Coastguard Worker %a = fadd <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0> 608*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %y, %a 609*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 610*9880d681SAndroid Build Coastguard Worker} 611*9880d681SAndroid Build Coastguard Worker 612*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_add_x_negone_y(<4 x float> %x, <4 x float> %y) { 613*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_add_x_negone_y: 614*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 615*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213ps %xmm1, %xmm1, %xmm0 616*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 617*9880d681SAndroid Build Coastguard Worker; 618*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_add_x_negone_y: 619*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 620*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubps %xmm1, %xmm1, %xmm0, %xmm0 621*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 622*9880d681SAndroid Build Coastguard Worker; 623*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_add_x_negone_y: 624*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 625*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213ps %xmm1, %xmm1, %xmm0 626*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 627*9880d681SAndroid Build Coastguard Worker %a = fadd <4 x float> %x, <float -1.0, float -1.0, float -1.0, float -1.0> 628*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %a, %y 629*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 630*9880d681SAndroid Build Coastguard Worker} 631*9880d681SAndroid Build Coastguard Worker 632*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_add_x_negone(<4 x float> %x, <4 x float> %y) { 633*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_add_x_negone: 634*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 635*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213ps %xmm1, %xmm1, %xmm0 636*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 637*9880d681SAndroid Build Coastguard Worker; 638*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_add_x_negone: 639*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 640*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubps %xmm1, %xmm1, %xmm0, %xmm0 641*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 642*9880d681SAndroid Build Coastguard Worker; 643*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_add_x_negone: 644*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 645*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213ps %xmm1, %xmm1, %xmm0 646*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 647*9880d681SAndroid Build Coastguard Worker %a = fadd <4 x float> %x, <float -1.0, float -1.0, float -1.0, float -1.0> 648*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %y, %a 649*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 650*9880d681SAndroid Build Coastguard Worker} 651*9880d681SAndroid Build Coastguard Worker 652*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_sub_one_x_y(<4 x float> %x, <4 x float> %y) { 653*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_sub_one_x_y: 654*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 655*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213ps %xmm1, %xmm1, %xmm0 656*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 657*9880d681SAndroid Build Coastguard Worker; 658*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_sub_one_x_y: 659*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 660*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddps %xmm1, %xmm1, %xmm0, %xmm0 661*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 662*9880d681SAndroid Build Coastguard Worker; 663*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_sub_one_x_y: 664*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 665*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213ps %xmm1, %xmm1, %xmm0 666*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 667*9880d681SAndroid Build Coastguard Worker %s = fsub <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, %x 668*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %s, %y 669*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 670*9880d681SAndroid Build Coastguard Worker} 671*9880d681SAndroid Build Coastguard Worker 672*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_sub_one_x(<4 x float> %x, <4 x float> %y) { 673*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_sub_one_x: 674*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 675*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213ps %xmm1, %xmm1, %xmm0 676*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 677*9880d681SAndroid Build Coastguard Worker; 678*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_sub_one_x: 679*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 680*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddps %xmm1, %xmm1, %xmm0, %xmm0 681*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 682*9880d681SAndroid Build Coastguard Worker; 683*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_sub_one_x: 684*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 685*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213ps %xmm1, %xmm1, %xmm0 686*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 687*9880d681SAndroid Build Coastguard Worker %s = fsub <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, %x 688*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %y, %s 689*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 690*9880d681SAndroid Build Coastguard Worker} 691*9880d681SAndroid Build Coastguard Worker 692*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_sub_negone_x_y(<4 x float> %x, <4 x float> %y) { 693*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_sub_negone_x_y: 694*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 695*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213ps %xmm1, %xmm1, %xmm0 696*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 697*9880d681SAndroid Build Coastguard Worker; 698*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_sub_negone_x_y: 699*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 700*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubps %xmm1, %xmm1, %xmm0, %xmm0 701*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 702*9880d681SAndroid Build Coastguard Worker; 703*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_sub_negone_x_y: 704*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 705*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213ps %xmm1, %xmm1, %xmm0 706*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 707*9880d681SAndroid Build Coastguard Worker %s = fsub <4 x float> <float -1.0, float -1.0, float -1.0, float -1.0>, %x 708*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %s, %y 709*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 710*9880d681SAndroid Build Coastguard Worker} 711*9880d681SAndroid Build Coastguard Worker 712*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_sub_negone_x(<4 x float> %x, <4 x float> %y) { 713*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_sub_negone_x: 714*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 715*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213ps %xmm1, %xmm1, %xmm0 716*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 717*9880d681SAndroid Build Coastguard Worker; 718*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_sub_negone_x: 719*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 720*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubps %xmm1, %xmm1, %xmm0, %xmm0 721*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 722*9880d681SAndroid Build Coastguard Worker; 723*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_sub_negone_x: 724*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 725*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213ps %xmm1, %xmm1, %xmm0 726*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 727*9880d681SAndroid Build Coastguard Worker %s = fsub <4 x float> <float -1.0, float -1.0, float -1.0, float -1.0>, %x 728*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %y, %s 729*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 730*9880d681SAndroid Build Coastguard Worker} 731*9880d681SAndroid Build Coastguard Worker 732*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_sub_x_one_y(<4 x float> %x, <4 x float> %y) { 733*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_sub_x_one_y: 734*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 735*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213ps %xmm1, %xmm1, %xmm0 736*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 737*9880d681SAndroid Build Coastguard Worker; 738*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_sub_x_one_y: 739*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 740*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubps %xmm1, %xmm1, %xmm0, %xmm0 741*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 742*9880d681SAndroid Build Coastguard Worker; 743*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_sub_x_one_y: 744*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 745*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213ps %xmm1, %xmm1, %xmm0 746*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 747*9880d681SAndroid Build Coastguard Worker %s = fsub <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0> 748*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %s, %y 749*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 750*9880d681SAndroid Build Coastguard Worker} 751*9880d681SAndroid Build Coastguard Worker 752*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_sub_x_one(<4 x float> %x, <4 x float> %y) { 753*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_sub_x_one: 754*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 755*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213ps %xmm1, %xmm1, %xmm0 756*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 757*9880d681SAndroid Build Coastguard Worker; 758*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_sub_x_one: 759*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 760*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubps %xmm1, %xmm1, %xmm0, %xmm0 761*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 762*9880d681SAndroid Build Coastguard Worker; 763*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_sub_x_one: 764*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 765*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213ps %xmm1, %xmm1, %xmm0 766*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 767*9880d681SAndroid Build Coastguard Worker %s = fsub <4 x float> %x, <float 1.0, float 1.0, float 1.0, float 1.0> 768*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %y, %s 769*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 770*9880d681SAndroid Build Coastguard Worker} 771*9880d681SAndroid Build Coastguard Worker 772*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_sub_x_negone_y(<4 x float> %x, <4 x float> %y) { 773*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_sub_x_negone_y: 774*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 775*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ps %xmm1, %xmm1, %xmm0 776*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 777*9880d681SAndroid Build Coastguard Worker; 778*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_sub_x_negone_y: 779*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 780*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %xmm1, %xmm1, %xmm0, %xmm0 781*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 782*9880d681SAndroid Build Coastguard Worker; 783*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_sub_x_negone_y: 784*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 785*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %xmm1, %xmm1, %xmm0 786*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 787*9880d681SAndroid Build Coastguard Worker %s = fsub <4 x float> %x, <float -1.0, float -1.0, float -1.0, float -1.0> 788*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %s, %y 789*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 790*9880d681SAndroid Build Coastguard Worker} 791*9880d681SAndroid Build Coastguard Worker 792*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_mul_y_sub_x_negone(<4 x float> %x, <4 x float> %y) { 793*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_mul_y_sub_x_negone: 794*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 795*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ps %xmm1, %xmm1, %xmm0 796*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 797*9880d681SAndroid Build Coastguard Worker; 798*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_mul_y_sub_x_negone: 799*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 800*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %xmm1, %xmm1, %xmm0, %xmm0 801*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 802*9880d681SAndroid Build Coastguard Worker; 803*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_mul_y_sub_x_negone: 804*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 805*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %xmm1, %xmm1, %xmm0 806*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 807*9880d681SAndroid Build Coastguard Worker %s = fsub <4 x float> %x, <float -1.0, float -1.0, float -1.0, float -1.0> 808*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x float> %y, %s 809*9880d681SAndroid Build Coastguard Worker ret <4 x float> %m 810*9880d681SAndroid Build Coastguard Worker} 811*9880d681SAndroid Build Coastguard Worker 812*9880d681SAndroid Build Coastguard Worker; 813*9880d681SAndroid Build Coastguard Worker; Interpolation Patterns: add(mul(x,t),mul(sub(1.0,t),y)) 814*9880d681SAndroid Build Coastguard Worker; 815*9880d681SAndroid Build Coastguard Worker 816*9880d681SAndroid Build Coastguard Workerdefine float @test_f32_interp(float %x, float %y, float %t) { 817*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f32_interp: 818*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 819*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213ss %xmm1, %xmm2, %xmm1 820*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ss %xmm1, %xmm2, %xmm0 821*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 822*9880d681SAndroid Build Coastguard Worker; 823*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f32_interp: 824*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 825*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddss %xmm1, %xmm1, %xmm2, %xmm1 826*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddss %xmm1, %xmm2, %xmm0, %xmm0 827*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 828*9880d681SAndroid Build Coastguard Worker; 829*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f32_interp: 830*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 831*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213ss %xmm1, %xmm2, %xmm1 832*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ss %xmm1, %xmm0, %xmm2 833*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm2, %zmm0 834*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 835*9880d681SAndroid Build Coastguard Worker %t1 = fsub float 1.0, %t 836*9880d681SAndroid Build Coastguard Worker %tx = fmul float %x, %t 837*9880d681SAndroid Build Coastguard Worker %ty = fmul float %y, %t1 838*9880d681SAndroid Build Coastguard Worker %r = fadd float %tx, %ty 839*9880d681SAndroid Build Coastguard Worker ret float %r 840*9880d681SAndroid Build Coastguard Worker} 841*9880d681SAndroid Build Coastguard Worker 842*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_interp(<4 x float> %x, <4 x float> %y, <4 x float> %t) { 843*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_interp: 844*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 845*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213ps %xmm1, %xmm2, %xmm1 846*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ps %xmm1, %xmm2, %xmm0 847*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 848*9880d681SAndroid Build Coastguard Worker; 849*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_interp: 850*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 851*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddps %xmm1, %xmm1, %xmm2, %xmm1 852*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %xmm1, %xmm2, %xmm0, %xmm0 853*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 854*9880d681SAndroid Build Coastguard Worker; 855*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_interp: 856*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 857*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm2, %zmm3 858*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213ps %xmm1, %xmm1, %xmm3 859*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %xmm3, %xmm2, %xmm0 860*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 861*9880d681SAndroid Build Coastguard Worker %t1 = fsub <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, %t 862*9880d681SAndroid Build Coastguard Worker %tx = fmul <4 x float> %x, %t 863*9880d681SAndroid Build Coastguard Worker %ty = fmul <4 x float> %y, %t1 864*9880d681SAndroid Build Coastguard Worker %r = fadd <4 x float> %tx, %ty 865*9880d681SAndroid Build Coastguard Worker ret <4 x float> %r 866*9880d681SAndroid Build Coastguard Worker} 867*9880d681SAndroid Build Coastguard Worker 868*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @test_v8f32_interp(<8 x float> %x, <8 x float> %y, <8 x float> %t) { 869*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v8f32_interp: 870*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 871*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213ps %ymm1, %ymm2, %ymm1 872*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213ps %ymm1, %ymm2, %ymm0 873*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 874*9880d681SAndroid Build Coastguard Worker; 875*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v8f32_interp: 876*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 877*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddps %ymm1, %ymm1, %ymm2, %ymm1 878*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %ymm1, %ymm2, %ymm0, %ymm0 879*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 880*9880d681SAndroid Build Coastguard Worker; 881*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v8f32_interp: 882*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 883*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm2, %zmm3 884*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213ps %ymm1, %ymm1, %ymm3 885*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213ps %ymm3, %ymm2, %ymm0 886*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 887*9880d681SAndroid Build Coastguard Worker %t1 = fsub <8 x float> <float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0>, %t 888*9880d681SAndroid Build Coastguard Worker %tx = fmul <8 x float> %x, %t 889*9880d681SAndroid Build Coastguard Worker %ty = fmul <8 x float> %y, %t1 890*9880d681SAndroid Build Coastguard Worker %r = fadd <8 x float> %tx, %ty 891*9880d681SAndroid Build Coastguard Worker ret <8 x float> %r 892*9880d681SAndroid Build Coastguard Worker} 893*9880d681SAndroid Build Coastguard Worker 894*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_interp(double %x, double %y, double %t) { 895*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_interp: 896*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 897*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213sd %xmm1, %xmm2, %xmm1 898*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213sd %xmm1, %xmm2, %xmm0 899*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 900*9880d681SAndroid Build Coastguard Worker; 901*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_interp: 902*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 903*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddsd %xmm1, %xmm1, %xmm2, %xmm1 904*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddsd %xmm1, %xmm2, %xmm0, %xmm0 905*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 906*9880d681SAndroid Build Coastguard Worker; 907*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_interp: 908*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 909*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213sd %xmm1, %xmm2, %xmm1 910*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213sd %xmm1, %xmm0, %xmm2 911*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm2, %zmm0 912*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 913*9880d681SAndroid Build Coastguard Worker %t1 = fsub double 1.0, %t 914*9880d681SAndroid Build Coastguard Worker %tx = fmul double %x, %t 915*9880d681SAndroid Build Coastguard Worker %ty = fmul double %y, %t1 916*9880d681SAndroid Build Coastguard Worker %r = fadd double %tx, %ty 917*9880d681SAndroid Build Coastguard Worker ret double %r 918*9880d681SAndroid Build Coastguard Worker} 919*9880d681SAndroid Build Coastguard Worker 920*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @test_v2f64_interp(<2 x double> %x, <2 x double> %y, <2 x double> %t) { 921*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v2f64_interp: 922*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 923*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213pd %xmm1, %xmm2, %xmm1 924*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213pd %xmm1, %xmm2, %xmm0 925*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 926*9880d681SAndroid Build Coastguard Worker; 927*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v2f64_interp: 928*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 929*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddpd %xmm1, %xmm1, %xmm2, %xmm1 930*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddpd %xmm1, %xmm2, %xmm0, %xmm0 931*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 932*9880d681SAndroid Build Coastguard Worker; 933*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v2f64_interp: 934*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 935*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm2, %zmm3 936*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213pd %xmm1, %xmm1, %xmm3 937*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213pd %xmm3, %xmm2, %xmm0 938*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 939*9880d681SAndroid Build Coastguard Worker %t1 = fsub <2 x double> <double 1.0, double 1.0>, %t 940*9880d681SAndroid Build Coastguard Worker %tx = fmul <2 x double> %x, %t 941*9880d681SAndroid Build Coastguard Worker %ty = fmul <2 x double> %y, %t1 942*9880d681SAndroid Build Coastguard Worker %r = fadd <2 x double> %tx, %ty 943*9880d681SAndroid Build Coastguard Worker ret <2 x double> %r 944*9880d681SAndroid Build Coastguard Worker} 945*9880d681SAndroid Build Coastguard Worker 946*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_interp(<4 x double> %x, <4 x double> %y, <4 x double> %t) { 947*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f64_interp: 948*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 949*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213pd %ymm1, %ymm2, %ymm1 950*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213pd %ymm1, %ymm2, %ymm0 951*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 952*9880d681SAndroid Build Coastguard Worker; 953*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f64_interp: 954*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 955*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddpd %ymm1, %ymm1, %ymm2, %ymm1 956*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddpd %ymm1, %ymm2, %ymm0, %ymm0 957*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 958*9880d681SAndroid Build Coastguard Worker; 959*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f64_interp: 960*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 961*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm2, %zmm3 962*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213pd %ymm1, %ymm1, %ymm3 963*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213pd %ymm3, %ymm2, %ymm0 964*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 965*9880d681SAndroid Build Coastguard Worker %t1 = fsub <4 x double> <double 1.0, double 1.0, double 1.0, double 1.0>, %t 966*9880d681SAndroid Build Coastguard Worker %tx = fmul <4 x double> %x, %t 967*9880d681SAndroid Build Coastguard Worker %ty = fmul <4 x double> %y, %t1 968*9880d681SAndroid Build Coastguard Worker %r = fadd <4 x double> %tx, %ty 969*9880d681SAndroid Build Coastguard Worker ret <4 x double> %r 970*9880d681SAndroid Build Coastguard Worker} 971*9880d681SAndroid Build Coastguard Worker 972*9880d681SAndroid Build Coastguard Worker; 973*9880d681SAndroid Build Coastguard Worker; Pattern: (fneg (fma x, y, z)) -> (fma x, -y, -z) 974*9880d681SAndroid Build Coastguard Worker; 975*9880d681SAndroid Build Coastguard Worker 976*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fneg_fmadd(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) #0 { 977*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fneg_fmadd: 978*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 979*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 980*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 981*9880d681SAndroid Build Coastguard Worker; 982*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fneg_fmadd: 983*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 984*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubps %xmm2, %xmm1, %xmm0, %xmm0 985*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 986*9880d681SAndroid Build Coastguard Worker; 987*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fneg_fmadd: 988*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 989*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 990*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 991*9880d681SAndroid Build Coastguard Worker %mul = fmul <4 x float> %a0, %a1 992*9880d681SAndroid Build Coastguard Worker %add = fadd <4 x float> %mul, %a2 993*9880d681SAndroid Build Coastguard Worker %neg = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %add 994*9880d681SAndroid Build Coastguard Worker ret <4 x float> %neg 995*9880d681SAndroid Build Coastguard Worker} 996*9880d681SAndroid Build Coastguard Worker 997*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_fneg_fmsub(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) #0 { 998*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f64_fneg_fmsub: 999*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 1000*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 1001*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 1002*9880d681SAndroid Build Coastguard Worker; 1003*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f64_fneg_fmsub: 1004*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 1005*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmaddpd %ymm2, %ymm1, %ymm0, %ymm0 1006*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 1007*9880d681SAndroid Build Coastguard Worker; 1008*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f64_fneg_fmsub: 1009*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 1010*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmadd213pd %ymm2, %ymm1, %ymm0 1011*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 1012*9880d681SAndroid Build Coastguard Worker %mul = fmul <4 x double> %a0, %a1 1013*9880d681SAndroid Build Coastguard Worker %sub = fsub <4 x double> %mul, %a2 1014*9880d681SAndroid Build Coastguard Worker %neg = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %sub 1015*9880d681SAndroid Build Coastguard Worker ret <4 x double> %neg 1016*9880d681SAndroid Build Coastguard Worker} 1017*9880d681SAndroid Build Coastguard Worker 1018*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fneg_fnmadd(<4 x float> %a0, <4 x float> %a1, <4 x float> %a2) #0 { 1019*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fneg_fnmadd: 1020*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 1021*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 1022*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 1023*9880d681SAndroid Build Coastguard Worker; 1024*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fneg_fnmadd: 1025*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 1026*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmsubps %xmm2, %xmm1, %xmm0, %xmm0 1027*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 1028*9880d681SAndroid Build Coastguard Worker; 1029*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fneg_fnmadd: 1030*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 1031*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmsub213ps %xmm2, %xmm1, %xmm0 1032*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 1033*9880d681SAndroid Build Coastguard Worker %mul = fmul <4 x float> %a0, %a1 1034*9880d681SAndroid Build Coastguard Worker %neg0 = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %mul 1035*9880d681SAndroid Build Coastguard Worker %add = fadd <4 x float> %neg0, %a2 1036*9880d681SAndroid Build Coastguard Worker %neg1 = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %add 1037*9880d681SAndroid Build Coastguard Worker ret <4 x float> %neg1 1038*9880d681SAndroid Build Coastguard Worker} 1039*9880d681SAndroid Build Coastguard Worker 1040*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_fneg_fnmsub(<4 x double> %a0, <4 x double> %a1, <4 x double> %a2) #0 { 1041*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f64_fneg_fnmsub: 1042*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 1043*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 1044*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 1045*9880d681SAndroid Build Coastguard Worker; 1046*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f64_fneg_fnmsub: 1047*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 1048*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddpd %ymm2, %ymm1, %ymm0, %ymm0 1049*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 1050*9880d681SAndroid Build Coastguard Worker; 1051*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f64_fneg_fnmsub: 1052*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 1053*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd213pd %ymm2, %ymm1, %ymm0 1054*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 1055*9880d681SAndroid Build Coastguard Worker %mul = fmul <4 x double> %a0, %a1 1056*9880d681SAndroid Build Coastguard Worker %neg0 = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %mul 1057*9880d681SAndroid Build Coastguard Worker %sub = fsub <4 x double> %neg0, %a2 1058*9880d681SAndroid Build Coastguard Worker %neg1 = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %sub 1059*9880d681SAndroid Build Coastguard Worker ret <4 x double> %neg1 1060*9880d681SAndroid Build Coastguard Worker} 1061*9880d681SAndroid Build Coastguard Worker 1062*9880d681SAndroid Build Coastguard Worker; 1063*9880d681SAndroid Build Coastguard Worker; Pattern: (fma x, c1, (fmul x, c2)) -> (fmul x, c1+c2) 1064*9880d681SAndroid Build Coastguard Worker; 1065*9880d681SAndroid Build Coastguard Worker 1066*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fma_x_c1_fmul_x_c2(<4 x float> %x) #0 { 1067*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fma_x_c1_fmul_x_c2: 1068*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 1069*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 1070*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 1071*9880d681SAndroid Build Coastguard Worker; 1072*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fma_x_c1_fmul_x_c2: 1073*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 1074*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vmulps {{.*}}(%rip), %xmm0, %xmm0 1075*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 1076*9880d681SAndroid Build Coastguard Worker; 1077*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fma_x_c1_fmul_x_c2: 1078*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 1079*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmulps {{.*}}(%rip){1to4}, %xmm0, %xmm0 1080*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 1081*9880d681SAndroid Build Coastguard Worker %m0 = fmul <4 x float> %x, <float 1.0, float 2.0, float 3.0, float 4.0> 1082*9880d681SAndroid Build Coastguard Worker %m1 = fmul <4 x float> %x, <float 4.0, float 3.0, float 2.0, float 1.0> 1083*9880d681SAndroid Build Coastguard Worker %a = fadd <4 x float> %m0, %m1 1084*9880d681SAndroid Build Coastguard Worker ret <4 x float> %a 1085*9880d681SAndroid Build Coastguard Worker} 1086*9880d681SAndroid Build Coastguard Worker 1087*9880d681SAndroid Build Coastguard Worker; 1088*9880d681SAndroid Build Coastguard Worker; Pattern: (fma (fmul x, c1), c2, y) -> (fma x, c1*c2, y) 1089*9880d681SAndroid Build Coastguard Worker; 1090*9880d681SAndroid Build Coastguard Worker 1091*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fma_fmul_x_c1_c2_y(<4 x float> %x, <4 x float> %y) #0 { 1092*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fma_fmul_x_c1_c2_y: 1093*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 1094*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfmadd132ps {{.*}}(%rip), %xmm1, %xmm0 1095*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 1096*9880d681SAndroid Build Coastguard Worker; 1097*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fma_fmul_x_c1_c2_y: 1098*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 1099*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfmaddps %xmm1, {{.*}}(%rip), %xmm0, %xmm0 1100*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 1101*9880d681SAndroid Build Coastguard Worker; 1102*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fma_fmul_x_c1_c2_y: 1103*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 1104*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfmadd231ps {{.*}}(%rip), %xmm0, %xmm1 1105*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 1106*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 1107*9880d681SAndroid Build Coastguard Worker %m0 = fmul <4 x float> %x, <float 1.0, float 2.0, float 3.0, float 4.0> 1108*9880d681SAndroid Build Coastguard Worker %m1 = fmul <4 x float> %m0, <float 4.0, float 3.0, float 2.0, float 1.0> 1109*9880d681SAndroid Build Coastguard Worker %a = fadd <4 x float> %m1, %y 1110*9880d681SAndroid Build Coastguard Worker ret <4 x float> %a 1111*9880d681SAndroid Build Coastguard Worker} 1112*9880d681SAndroid Build Coastguard Worker 1113*9880d681SAndroid Build Coastguard Worker; Pattern: (fneg (fmul x, y)) -> (fnmsub x, y, 0) 1114*9880d681SAndroid Build Coastguard Worker 1115*9880d681SAndroid Build Coastguard Workerdefine double @test_f64_fneg_fmul(double %x, double %y) #0 { 1116*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_f64_fneg_fmul: 1117*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 1118*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vxorpd %xmm2, %xmm2, %xmm2 1119*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0 1120*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 1121*9880d681SAndroid Build Coastguard Worker; 1122*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_f64_fneg_fmul: 1123*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 1124*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vxorpd %xmm2, %xmm2, %xmm2 1125*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubsd %xmm2, %xmm1, %xmm0, %xmm0 1126*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 1127*9880d681SAndroid Build Coastguard Worker; 1128*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_f64_fneg_fmul: 1129*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 1130*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vxorps %xmm2, %xmm2, %xmm2 1131*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213sd %xmm2, %xmm0, %xmm1 1132*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vmovaps %zmm1, %zmm0 1133*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 1134*9880d681SAndroid Build Coastguard Worker %m = fmul nsz double %x, %y 1135*9880d681SAndroid Build Coastguard Worker %n = fsub double -0.0, %m 1136*9880d681SAndroid Build Coastguard Worker ret double %n 1137*9880d681SAndroid Build Coastguard Worker} 1138*9880d681SAndroid Build Coastguard Worker 1139*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @test_v4f32_fneg_fmul(<4 x float> %x, <4 x float> %y) #0 { 1140*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f32_fneg_fmul: 1141*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 1142*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vxorps %xmm2, %xmm2, %xmm2 1143*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 1144*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 1145*9880d681SAndroid Build Coastguard Worker; 1146*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f32_fneg_fmul: 1147*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 1148*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vxorps %xmm2, %xmm2, %xmm2 1149*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubps %xmm2, %xmm1, %xmm0, %xmm0 1150*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 1151*9880d681SAndroid Build Coastguard Worker; 1152*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f32_fneg_fmul: 1153*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 1154*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vpxord %xmm2, %xmm2, %xmm2 1155*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213ps %xmm2, %xmm1, %xmm0 1156*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 1157*9880d681SAndroid Build Coastguard Worker %m = fmul nsz <4 x float> %x, %y 1158*9880d681SAndroid Build Coastguard Worker %n = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %m 1159*9880d681SAndroid Build Coastguard Worker ret <4 x float> %n 1160*9880d681SAndroid Build Coastguard Worker} 1161*9880d681SAndroid Build Coastguard Worker 1162*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_fneg_fmul(<4 x double> %x, <4 x double> %y) #0 { 1163*9880d681SAndroid Build Coastguard Worker; FMA-LABEL: test_v4f64_fneg_fmul: 1164*9880d681SAndroid Build Coastguard Worker; FMA: # BB#0: 1165*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vxorpd %ymm2, %ymm2, %ymm2 1166*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 1167*9880d681SAndroid Build Coastguard Worker; FMA-NEXT: retq 1168*9880d681SAndroid Build Coastguard Worker; 1169*9880d681SAndroid Build Coastguard Worker; FMA4-LABEL: test_v4f64_fneg_fmul: 1170*9880d681SAndroid Build Coastguard Worker; FMA4: # BB#0: 1171*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vxorpd %ymm2, %ymm2, %ymm2 1172*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: vfnmsubpd %ymm2, %ymm1, %ymm0, %ymm0 1173*9880d681SAndroid Build Coastguard Worker; FMA4-NEXT: retq 1174*9880d681SAndroid Build Coastguard Worker; 1175*9880d681SAndroid Build Coastguard Worker; AVX512-LABEL: test_v4f64_fneg_fmul: 1176*9880d681SAndroid Build Coastguard Worker; AVX512: # BB#0: 1177*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vpxord %ymm2, %ymm2, %ymm2 1178*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: vfnmsub213pd %ymm2, %ymm1, %ymm0 1179*9880d681SAndroid Build Coastguard Worker; AVX512-NEXT: retq 1180*9880d681SAndroid Build Coastguard Worker %m = fmul nsz <4 x double> %x, %y 1181*9880d681SAndroid Build Coastguard Worker %n = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %m 1182*9880d681SAndroid Build Coastguard Worker ret <4 x double> %n 1183*9880d681SAndroid Build Coastguard Worker} 1184*9880d681SAndroid Build Coastguard Worker 1185*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @test_v4f64_fneg_fmul_no_nsz(<4 x double> %x, <4 x double> %y) #0 { 1186*9880d681SAndroid Build Coastguard Worker; ALL-LABEL: test_v4f64_fneg_fmul_no_nsz: 1187*9880d681SAndroid Build Coastguard Worker; ALL: # BB#0: 1188*9880d681SAndroid Build Coastguard Worker; ALL-NEXT: vmulpd %ymm1, %ymm0, %ymm0 1189*9880d681SAndroid Build Coastguard Worker; ALL-NEXT: vxorpd {{.*}}(%rip), %ymm0, %ymm0 1190*9880d681SAndroid Build Coastguard Worker; ALL-NEXT: retq 1191*9880d681SAndroid Build Coastguard Worker %m = fmul <4 x double> %x, %y 1192*9880d681SAndroid Build Coastguard Worker %n = fsub <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %m 1193*9880d681SAndroid Build Coastguard Worker ret <4 x double> %n 1194*9880d681SAndroid Build Coastguard Worker} 1195*9880d681SAndroid Build Coastguard Worker 1196*9880d681SAndroid Build Coastguard Workerattributes #0 = { "unsafe-fp-math"="true" } 1197