; Vector subtraction tests.
;
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s

; Subtract two v16i8 vectors; a single VSB is expected.
define <16 x i8> @f1(<16 x i8> %dummy, <16 x i8> %val1, <16 x i8> %val2) {
; CHECK-LABEL: f1:
; CHECK: vsb %v24, %v26, %v28
; CHECK: br %r14
  %diff = sub <16 x i8> %val1, %val2
  ret <16 x i8> %diff
}

; Subtract two v8i16 vectors; a single VSH is expected.
define <8 x i16> @f2(<8 x i16> %dummy, <8 x i16> %val1, <8 x i16> %val2) {
; CHECK-LABEL: f2:
; CHECK: vsh %v24, %v26, %v28
; CHECK: br %r14
  %diff = sub <8 x i16> %val1, %val2
  ret <8 x i16> %diff
}

; Test a v4i32 subtraction.
define <4 x i32> @f3(<4 x i32> %dummy, <4 x i32> %val1, <4 x i32> %val2) {
; CHECK-LABEL: f3:
; CHECK: vsf %v24, %v26, %v28
; CHECK: br %r14
  %ret = sub <4 x i32> %val1, %val2
  ret <4 x i32> %ret
}

; Test a v2i64 subtraction.
define <2 x i64> @f4(<2 x i64> %dummy, <2 x i64> %val1, <2 x i64> %val2) {
; CHECK-LABEL: f4:
; CHECK: vsg %v24, %v26, %v28
; CHECK: br %r14
  %ret = sub <2 x i64> %val1, %val2
  ret <2 x i64> %ret
}

; Test a v4f32 subtraction, as an example of an operation that needs to be
; scalarized and reassembled.  At present there's an unnecessary move that
; could be avoided with smarter ordering.  It also isn't important whether
; the VREPFs use the result of the VLRs or use %v24 and %v26 directly.
define <4 x float> @f5(<4 x float> %val1, <4 x float> %val2) {
; CHECK-LABEL: f5:
; Both incoming vectors (%v24 and %v26) are first copied with VLR.
; CHECK-DAG: vlr %v[[A1:[0-5]]], %v24
; CHECK-DAG: vlr %v[[A2:[0-5]]], %v26
; VREPF with indices 1, 2 and 3 is applied to each of the two copies.
; CHECK-DAG: vrepf %v[[B1:[0-5]]], %v[[A1]], 1
; CHECK-DAG: vrepf %v[[B2:[0-5]]], %v[[A2]], 1
; CHECK-DAG: vrepf %v[[C1:[0-5]]], %v[[A1]], 2
; CHECK-DAG: vrepf %v[[C2:[0-5]]], %v[[A2]], 2
; CHECK-DAG: vrepf %v[[D1:[0-5]]], %v[[A1]], 3
; CHECK-DAG: vrepf %v[[D2:[0-5]]], %v[[A2]], 3
; One LDR copy followed by four scalar SEBR subtractions.
; CHECK-DAG: ldr %f[[A1copy:[0-5]]], %f[[A1]]
; CHECK-DAG: sebr %f[[A1copy]], %f[[A2]]
; CHECK-DAG: sebr %f[[B1]], %f[[B2]]
; CHECK-DAG: sebr %f[[C1]], %f[[C2]]
; CHECK-DAG: sebr %f[[D1]], %f[[D2]]
; The four results are merged pairwise and then combined into %v24.
; CHECK-DAG: vmrhf [[HIGH:%v[0-9]+]], %v[[A1copy]], %v[[B1]]
; CHECK-DAG: vmrhf [[LOW:%v[0-9]+]], %v[[C1]], %v[[D1]]
; CHECK: vmrhg %v24, [[HIGH]], [[LOW]]
; CHECK: br %r14
  %diff = fsub <4 x float> %val1, %val2
  ret <4 x float> %diff
}

; Test a v2f64 subtraction.
define <2 x double> @f6(<2 x double> %dummy, <2 x double> %val1,
                        <2 x double> %val2) {
; CHECK-LABEL: f6:
; CHECK: vfsdb %v24, %v26, %v28
; CHECK: br %r14
  %diff = fsub <2 x double> %val1, %val2
  ret <2 x double> %diff
}

; Scalar f64 subtraction whose operands are element 0 of two vector
; arguments; the expected WFSDB reads the vector registers directly.
define double @f7(<2 x double> %val1, <2 x double> %val2) {
; CHECK-LABEL: f7:
; CHECK: wfsdb %f0, %v24, %v26
; CHECK: br %r14
  %lhs = extractelement <2 x double> %val1, i32 0
  %rhs = extractelement <2 x double> %val2, i32 0
  %diff = fsub double %lhs, %rhs
  ret double %diff
}

; Test a v2i8 subtraction, which gets promoted to v16i8.
define <2 x i8> @f8(<2 x i8> %dummy, <2 x i8> %val1, <2 x i8> %val2) {
; CHECK-LABEL: f8:
; CHECK: vsb %v24, %v26, %v28
; CHECK: br %r14
  %diff = sub <2 x i8> %val1, %val2
  ret <2 x i8> %diff
}

; v4i8 subtraction; promoted to v16i8, so VSB is expected again.
define <4 x i8> @f9(<4 x i8> %dummy, <4 x i8> %val1, <4 x i8> %val2) {
; CHECK-LABEL: f9:
; CHECK: vsb %v24, %v26, %v28
; CHECK: br %r14
  %diff = sub <4 x i8> %val1, %val2
  ret <4 x i8> %diff
}

; v8i8 subtraction; promoted to v16i8, so VSB is expected again.
define <8 x i8> @f10(<8 x i8> %dummy, <8 x i8> %val1, <8 x i8> %val2) {
; CHECK-LABEL: f10:
; CHECK: vsb %v24, %v26, %v28
; CHECK: br %r14
  %diff = sub <8 x i8> %val1, %val2
  ret <8 x i8> %diff
}

; Test a v2i16 subtraction, which gets promoted to v8i16.
define <2 x i16> @f11(<2 x i16> %dummy, <2 x i16> %val1, <2 x i16> %val2) {
; CHECK-LABEL: f11:
; CHECK: vsh %v24, %v26, %v28
; CHECK: br %r14
  %diff = sub <2 x i16> %val1, %val2
  ret <2 x i16> %diff
}

; v4i16 subtraction; promoted to v8i16, so VSH is expected again.
define <4 x i16> @f12(<4 x i16> %dummy, <4 x i16> %val1, <4 x i16> %val2) {
; CHECK-LABEL: f12:
; CHECK: vsh %v24, %v26, %v28
; CHECK: br %r14
  %diff = sub <4 x i16> %val1, %val2
  ret <4 x i16> %diff
}

; v2i32 subtraction; promoted to v4i32, so VSF is expected.
define <2 x i32> @f13(<2 x i32> %dummy, <2 x i32> %val1, <2 x i32> %val2) {
; CHECK-LABEL: f13:
; CHECK: vsf %v24, %v26, %v28
; CHECK: br %r14
  %diff = sub <2 x i32> %val1, %val2
  ret <2 x i32> %diff
}

; Test a v2f32 subtraction, which gets promoted to v4f32.
define <2 x float> @f14(<2 x float> %val1, <2 x float> %val2) {
; No particular output expected, but must compile.  The label directive
; below only anchors this function, so that checks written for earlier
; functions cannot be satisfied by instructions in its output.
; CHECK-LABEL: f14:
  %ret = fsub <2 x float> %val1, %val2
  ret <2 x float> %ret
}