xref: /aosp_15_r20/external/llvm/test/CodeGen/SystemZ/vec-sub-01.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; Test vector subtraction.
2*9880d681SAndroid Build Coastguard Worker;
3*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s
4*9880d681SAndroid Build Coastguard Worker
5*9880d681SAndroid Build Coastguard Worker; Test a v16i8 subtraction.
; The directives below expect a single vsb that writes %v24 and reads %v26
; and %v28, followed by the return (br %r14).  %dummy is never referenced in
; the body; presumably it only occupies the first vector argument slot so
; that the real operands do not arrive in the result register -- TODO confirm
; against the SystemZ vector calling convention.
6*9880d681SAndroid Build Coastguard Workerdefine <16 x i8> @f1(<16 x i8> %dummy, <16 x i8> %val1, <16 x i8> %val2) {
7*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f1:
8*9880d681SAndroid Build Coastguard Worker; CHECK: vsb %v24, %v26, %v28
9*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
10*9880d681SAndroid Build Coastguard Worker  %ret = sub <16 x i8> %val1, %val2
11*9880d681SAndroid Build Coastguard Worker  ret <16 x i8> %ret
12*9880d681SAndroid Build Coastguard Worker}
13*9880d681SAndroid Build Coastguard Worker
14*9880d681SAndroid Build Coastguard Worker; Test a v8i16 subtraction.
; Expected output is one vsh with destination %v24 and sources %v26, %v28,
; then the return.  The leading %dummy argument is unused by the IR body.
15*9880d681SAndroid Build Coastguard Workerdefine <8 x i16> @f2(<8 x i16> %dummy, <8 x i16> %val1, <8 x i16> %val2) {
16*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f2:
17*9880d681SAndroid Build Coastguard Worker; CHECK: vsh %v24, %v26, %v28
18*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
19*9880d681SAndroid Build Coastguard Worker  %ret = sub <8 x i16> %val1, %val2
20*9880d681SAndroid Build Coastguard Worker  ret <8 x i16> %ret
21*9880d681SAndroid Build Coastguard Worker}
22*9880d681SAndroid Build Coastguard Worker
23*9880d681SAndroid Build Coastguard Worker; Test a v4i32 subtraction.
; Expected output is one vsf with destination %v24 and sources %v26, %v28,
; then the return.  The leading %dummy argument is unused by the IR body.
24*9880d681SAndroid Build Coastguard Workerdefine <4 x i32> @f3(<4 x i32> %dummy, <4 x i32> %val1, <4 x i32> %val2) {
25*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f3:
26*9880d681SAndroid Build Coastguard Worker; CHECK: vsf %v24, %v26, %v28
27*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
28*9880d681SAndroid Build Coastguard Worker  %ret = sub <4 x i32> %val1, %val2
29*9880d681SAndroid Build Coastguard Worker  ret <4 x i32> %ret
30*9880d681SAndroid Build Coastguard Worker}
31*9880d681SAndroid Build Coastguard Worker
32*9880d681SAndroid Build Coastguard Worker; Test a v2i64 subtraction.
; Expected output is one vsg with destination %v24 and sources %v26, %v28,
; then the return.  The leading %dummy argument is unused by the IR body.
33*9880d681SAndroid Build Coastguard Workerdefine <2 x i64> @f4(<2 x i64> %dummy, <2 x i64> %val1, <2 x i64> %val2) {
34*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f4:
35*9880d681SAndroid Build Coastguard Worker; CHECK: vsg %v24, %v26, %v28
36*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
37*9880d681SAndroid Build Coastguard Worker  %ret = sub <2 x i64> %val1, %val2
38*9880d681SAndroid Build Coastguard Worker  ret <2 x i64> %ret
39*9880d681SAndroid Build Coastguard Worker}
40*9880d681SAndroid Build Coastguard Worker
41*9880d681SAndroid Build Coastguard Worker; Test a v4f32 subtraction, as an example of an operation that needs to be
42*9880d681SAndroid Build Coastguard Worker; scalarized and reassembled.  At present there's an unnecessary move that
43*9880d681SAndroid Build Coastguard Worker; could be avoided with smarter ordering.  It also isn't important whether
44*9880d681SAndroid Build Coastguard Worker; the VREPFs use the result of the VLRs or use %v24 and %v26 directly.
; NOTE(review): this sentence previously named VSLDBs, but the directives
; below match vrepf, so the mnemonic was updated to agree -- please confirm.
;
; Shape of the expected output, as encoded by the directives:
;   * both inputs (%v24, %v26) are copied with vlr into A1/A2;
;   * vrepf with indices 1, 2 and 3 produces B, C and D from each copy;
;   * element 0 is handled via an ldr copy of A1 (A1copy);
;   * four sebr instructions subtract the matching pairs;
;   * two vmrhf merges and a final vmrhg into %v24 rebuild the vector.
; Everything up to the vmrhf merges is matched in any order (DAG matching);
; only the final vmrhg and the return are matched in sequence.
; The captured register numbers are restricted to a single digit 0-5 and are
; reused with both the %v and %f prefixes, i.e. the test relies on %vN and
; %fN naming the same register for those numbers -- presumably the scalar
; view of the vector register; confirm against the SystemZ register docs.
; Unlike the integer tests, this function has no %dummy argument, so the
; first input arrives in %v24, which is also the result register.
45*9880d681SAndroid Build Coastguard Workerdefine <4 x float> @f5(<4 x float> %val1, <4 x float> %val2) {
46*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f5:
47*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vlr %v[[A1:[0-5]]], %v24
48*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vlr %v[[A2:[0-5]]], %v26
49*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vrepf %v[[B1:[0-5]]], %v[[A1]], 1
50*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vrepf %v[[B2:[0-5]]], %v[[A2]], 1
51*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vrepf %v[[C1:[0-5]]], %v[[A1]], 2
52*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vrepf %v[[C2:[0-5]]], %v[[A2]], 2
53*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vrepf %v[[D1:[0-5]]], %v[[A1]], 3
54*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vrepf %v[[D2:[0-5]]], %v[[A2]], 3
55*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: ldr %f[[A1copy:[0-5]]], %f[[A1]]
56*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: sebr %f[[A1copy]], %f[[A2]]
57*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: sebr %f[[B1]], %f[[B2]]
58*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: sebr %f[[C1]], %f[[C2]]
59*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: sebr %f[[D1]], %f[[D2]]
60*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vmrhf [[HIGH:%v[0-9]+]], %v[[A1copy]], %v[[B1]]
61*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: vmrhf [[LOW:%v[0-9]+]], %v[[C1]], %v[[D1]]
62*9880d681SAndroid Build Coastguard Worker; CHECK: vmrhg %v24, [[HIGH]], [[LOW]]
63*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
64*9880d681SAndroid Build Coastguard Worker  %ret = fsub <4 x float> %val1, %val2
65*9880d681SAndroid Build Coastguard Worker  ret <4 x float> %ret
66*9880d681SAndroid Build Coastguard Worker}
67*9880d681SAndroid Build Coastguard Worker
68*9880d681SAndroid Build Coastguard Worker; Test a v2f64 subtraction.
; In contrast to the v4f32 case (f5), the directives here expect a single
; vector instruction: vfsdb with destination %v24 and sources %v26, %v28.
; The leading %dummy argument is unused by the IR body.
69*9880d681SAndroid Build Coastguard Workerdefine <2 x double> @f6(<2 x double> %dummy, <2 x double> %val1,
70*9880d681SAndroid Build Coastguard Worker                        <2 x double> %val2) {
71*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f6:
72*9880d681SAndroid Build Coastguard Worker; CHECK: vfsdb %v24, %v26, %v28
73*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
74*9880d681SAndroid Build Coastguard Worker  %ret = fsub <2 x double> %val1, %val2
75*9880d681SAndroid Build Coastguard Worker  ret <2 x double> %ret
76*9880d681SAndroid Build Coastguard Worker}
77*9880d681SAndroid Build Coastguard Worker
78*9880d681SAndroid Build Coastguard Worker; Test an f64 subtraction that uses vector registers.
; The body extracts element 0 of each <2 x double> argument and subtracts
; the two scalars.  The directives expect this to become a single wfsdb that
; reads the incoming vector registers %v24 and %v26 directly and writes the
; scalar result to %f0, with no separate extraction instruction matched.
; There is no %dummy argument here: the function returns a scalar double.
79*9880d681SAndroid Build Coastguard Workerdefine double @f7(<2 x double> %val1, <2 x double> %val2) {
80*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f7:
81*9880d681SAndroid Build Coastguard Worker; CHECK: wfsdb %f0, %v24, %v26
82*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
83*9880d681SAndroid Build Coastguard Worker  %scalar1 = extractelement <2 x double> %val1, i32 0
84*9880d681SAndroid Build Coastguard Worker  %scalar2 = extractelement <2 x double> %val2, i32 0
85*9880d681SAndroid Build Coastguard Worker  %ret = fsub double %scalar1, %scalar2
86*9880d681SAndroid Build Coastguard Worker  ret double %ret
87*9880d681SAndroid Build Coastguard Worker}
88*9880d681SAndroid Build Coastguard Worker
89*9880d681SAndroid Build Coastguard Worker; Test a v2i8 subtraction, which gets promoted to v16i8.
; The expected instruction is the same vsb %v24, %v26, %v28 that the
; full-width v16i8 test (f1) expects.  %dummy is unused by the IR body.
90*9880d681SAndroid Build Coastguard Workerdefine <2 x i8> @f8(<2 x i8> %dummy, <2 x i8> %val1, <2 x i8> %val2) {
91*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f8:
92*9880d681SAndroid Build Coastguard Worker; CHECK: vsb %v24, %v26, %v28
93*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
94*9880d681SAndroid Build Coastguard Worker  %ret = sub <2 x i8> %val1, %val2
95*9880d681SAndroid Build Coastguard Worker  ret <2 x i8> %ret
96*9880d681SAndroid Build Coastguard Worker}
97*9880d681SAndroid Build Coastguard Worker
98*9880d681SAndroid Build Coastguard Worker; Test a v4i8 subtraction, which gets promoted to v16i8.
; The expected instruction is the same vsb %v24, %v26, %v28 that the
; full-width v16i8 test (f1) expects.  %dummy is unused by the IR body.
99*9880d681SAndroid Build Coastguard Workerdefine <4 x i8> @f9(<4 x i8> %dummy, <4 x i8> %val1, <4 x i8> %val2) {
100*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f9:
101*9880d681SAndroid Build Coastguard Worker; CHECK: vsb %v24, %v26, %v28
102*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
103*9880d681SAndroid Build Coastguard Worker  %ret = sub <4 x i8> %val1, %val2
104*9880d681SAndroid Build Coastguard Worker  ret <4 x i8> %ret
105*9880d681SAndroid Build Coastguard Worker}
106*9880d681SAndroid Build Coastguard Worker
107*9880d681SAndroid Build Coastguard Worker; Test a v8i8 subtraction, which gets promoted to v16i8.
; The expected instruction is the same vsb %v24, %v26, %v28 that the
; full-width v16i8 test (f1) expects.  %dummy is unused by the IR body.
108*9880d681SAndroid Build Coastguard Workerdefine <8 x i8> @f10(<8 x i8> %dummy, <8 x i8> %val1, <8 x i8> %val2) {
109*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f10:
110*9880d681SAndroid Build Coastguard Worker; CHECK: vsb %v24, %v26, %v28
111*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
112*9880d681SAndroid Build Coastguard Worker  %ret = sub <8 x i8> %val1, %val2
113*9880d681SAndroid Build Coastguard Worker  ret <8 x i8> %ret
114*9880d681SAndroid Build Coastguard Worker}
115*9880d681SAndroid Build Coastguard Worker
116*9880d681SAndroid Build Coastguard Worker; Test a v2i16 subtraction, which gets promoted to v8i16.
; The expected instruction is the same vsh %v24, %v26, %v28 that the
; full-width v8i16 test (f2) expects.  %dummy is unused by the IR body.
117*9880d681SAndroid Build Coastguard Workerdefine <2 x i16> @f11(<2 x i16> %dummy, <2 x i16> %val1, <2 x i16> %val2) {
118*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f11:
119*9880d681SAndroid Build Coastguard Worker; CHECK: vsh %v24, %v26, %v28
120*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
121*9880d681SAndroid Build Coastguard Worker  %ret = sub <2 x i16> %val1, %val2
122*9880d681SAndroid Build Coastguard Worker  ret <2 x i16> %ret
123*9880d681SAndroid Build Coastguard Worker}
124*9880d681SAndroid Build Coastguard Worker
125*9880d681SAndroid Build Coastguard Worker; Test a v4i16 subtraction, which gets promoted to v8i16.
; The expected instruction is the same vsh %v24, %v26, %v28 that the
; full-width v8i16 test (f2) expects.  %dummy is unused by the IR body.
126*9880d681SAndroid Build Coastguard Workerdefine <4 x i16> @f12(<4 x i16> %dummy, <4 x i16> %val1, <4 x i16> %val2) {
127*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f12:
128*9880d681SAndroid Build Coastguard Worker; CHECK: vsh %v24, %v26, %v28
129*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
130*9880d681SAndroid Build Coastguard Worker  %ret = sub <4 x i16> %val1, %val2
131*9880d681SAndroid Build Coastguard Worker  ret <4 x i16> %ret
132*9880d681SAndroid Build Coastguard Worker}
133*9880d681SAndroid Build Coastguard Worker
134*9880d681SAndroid Build Coastguard Worker; Test a v2i32 subtraction, which gets promoted to v4i32.
; The expected instruction is the same vsf %v24, %v26, %v28 that the
; full-width v4i32 test (f3) expects.  %dummy is unused by the IR body.
135*9880d681SAndroid Build Coastguard Workerdefine <2 x i32> @f13(<2 x i32> %dummy, <2 x i32> %val1, <2 x i32> %val2) {
136*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: f13:
137*9880d681SAndroid Build Coastguard Worker; CHECK: vsf %v24, %v26, %v28
138*9880d681SAndroid Build Coastguard Worker; CHECK: br %r14
139*9880d681SAndroid Build Coastguard Worker  %ret = sub <2 x i32> %val1, %val2
140*9880d681SAndroid Build Coastguard Worker  ret <2 x i32> %ret
141*9880d681SAndroid Build Coastguard Worker}
142*9880d681SAndroid Build Coastguard Worker
143*9880d681SAndroid Build Coastguard Worker; Test a v2f32 subtraction, which gets promoted to v4f32.
; This function deliberately carries no FileCheck directives, not even a
; label, so nothing about its generated code is matched.  Its only role is to
; make llc process a <2 x float> fsub; presumably a crash or error in llc is
; what would make the test fail here -- confirm against the lit pipeline setup.
144*9880d681SAndroid Build Coastguard Workerdefine <2 x float> @f14(<2 x float> %val1, <2 x float> %val2) {
145*9880d681SAndroid Build Coastguard Worker; No particular output expected, but must compile.
146*9880d681SAndroid Build Coastguard Worker  %ret = fsub <2 x float> %val1, %val2
147*9880d681SAndroid Build Coastguard Worker  ret <2 x float> %ret
148*9880d681SAndroid Build Coastguard Worker}
149