xref: /aosp_15_r20/art/test/646-checker-simd-hadd/src/HaddShort.java (revision 795d594fd825385562da6b089ea9b2033f3abf5a)
1*795d594fSAndroid Build Coastguard Worker /*
2*795d594fSAndroid Build Coastguard Worker  * Copyright (C) 2017 The Android Open Source Project
3*795d594fSAndroid Build Coastguard Worker  *
4*795d594fSAndroid Build Coastguard Worker  * Licensed under the Apache License, Version 2.0 (the "License");
5*795d594fSAndroid Build Coastguard Worker  * you may not use this file except in compliance with the License.
6*795d594fSAndroid Build Coastguard Worker  * You may obtain a copy of the License at
7*795d594fSAndroid Build Coastguard Worker  *
8*795d594fSAndroid Build Coastguard Worker  *      http://www.apache.org/licenses/LICENSE-2.0
9*795d594fSAndroid Build Coastguard Worker  *
10*795d594fSAndroid Build Coastguard Worker  * Unless required by applicable law or agreed to in writing, software
11*795d594fSAndroid Build Coastguard Worker  * distributed under the License is distributed on an "AS IS" BASIS,
12*795d594fSAndroid Build Coastguard Worker  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*795d594fSAndroid Build Coastguard Worker  * See the License for the specific language governing permissions and
14*795d594fSAndroid Build Coastguard Worker  * limitations under the License.
15*795d594fSAndroid Build Coastguard Worker  */
16*795d594fSAndroid Build Coastguard Worker 
17*795d594fSAndroid Build Coastguard Worker /**
18*795d594fSAndroid Build Coastguard Worker  * Tests for halving-add idiomatic vectorization.
19*795d594fSAndroid Build Coastguard Worker  */
20*795d594fSAndroid Build Coastguard Worker public class HaddShort {
21*795d594fSAndroid Build Coastguard Worker 
22*795d594fSAndroid Build Coastguard Worker   private static final int N = 64 * 1024;  // 65536
  // Length used for the static arrays below: N plus 31 extra elements.
  // NOTE(review): the extra 31 presumably keeps the length off a multiple of the vector
  // width so a scalar remainder is also exercised -- confirm; the driver is not in view.
23*795d594fSAndroid Build Coastguard Worker   private static final int M = N + 31;
24*795d594fSAndroid Build Coastguard Worker 
25*795d594fSAndroid Build Coastguard Worker   static short[] sB1 = new short[M];  // M-element short array.
26*795d594fSAndroid Build Coastguard Worker   static short[] sB2 = new short[M];  // M-element short array.
  // NOTE(review): presumably sB1/sB2 are the inputs and sBo the output handed to the
  // halving-add methods below -- the code that fills and passes them is not in view.
27*795d594fSAndroid Build Coastguard Worker   static short[] sBo = new short[M];
28*795d594fSAndroid Build Coastguard Worker 
$inline$mone()29*795d594fSAndroid Build Coastguard Worker   private static int $inline$mone() {
    // Returns the constant -1 ("minus one").
    // NOTE(review): the "$inline$" name prefix presumably marks this helper as one that
    // must be inlined into its caller; the caller is not visible in this part of the file.
30*795d594fSAndroid Build Coastguard Worker     return -1;
31*795d594fSAndroid Build Coastguard Worker   }
32*795d594fSAndroid Build Coastguard Worker 
33*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.halving_add_signed(short[], short[], short[]) loop_optimization (before)
34*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
35*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
36*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
37*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
38*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
39*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
40*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
41*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
42*795d594fSAndroid Build Coastguard Worker   //
43*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.halving_add_signed(short[], short[], short[]) loop_optimization (after)
44*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
45*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
46*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
47*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
48*795d594fSAndroid Build Coastguard Worker   //
49*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.halving_add_signed(short[], short[], short[]) loop_optimization (after)
50*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
51*795d594fSAndroid Build Coastguard Worker   //
52*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
53*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
54*795d594fSAndroid Build Coastguard Worker   //
55*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
56*795d594fSAndroid Build Coastguard Worker   //
57*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
58*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
59*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
60*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
61*795d594fSAndroid Build Coastguard Worker   //
62*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
halving_add_signed(short[] b1, short[] b2, short[] bo)63*795d594fSAndroid Build Coastguard Worker   private static void halving_add_signed(short[] b1, short[] b2, short[] bo) {
    // Signed halving add without rounding: bo[i] receives (b1[i] + b2[i]) >> 1, narrowed
    // back to short. The checker directives above expect the loop to be turned into a
    // VecHalvingAdd with packed_type:Int16 rounded:false on ARM, and on ARM64 unless the
    // SVE / predicated-SIMD condition of the CHECK-IF holds (then no VecHalvingAdd).
    //
    // Do not reshape the expression: the "before" directives match this exact
    // Add -> Shr -> TypeConversion chain.
    //
    // Visit only the indices that exist in all three arrays.
64*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
65*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
      // The operands are added as ints, then shifted right arithmetically by one.
66*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) ((b1[i] + b2[i]) >> 1);
67*795d594fSAndroid Build Coastguard Worker     }
68*795d594fSAndroid Build Coastguard Worker   }
69*795d594fSAndroid Build Coastguard Worker 
70*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.halving_add_signed_alt(short[], short[], short[]) loop_optimization (before)
71*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
72*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I10:i\d+>>  IntConstant 10                      loop:none
73*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<M10:i\d+>>  IntConstant -10                     loop:none
74*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
75*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
76*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
77*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<I10>>]              loop:<<Loop>>      outer_loop:none
78*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Get2>>,<<M10>>]              loop:<<Loop>>      outer_loop:none
79*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add3:i\d+>> Add [<<Add1>>,<<Add2>>]             loop:<<Loop>>      outer_loop:none
80*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add3>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
81*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
82*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
83*795d594fSAndroid Build Coastguard Worker   //
84*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.halving_add_signed_alt(short[], short[], short[]) loop_optimization (after)
85*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
86*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
87*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
88*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
89*795d594fSAndroid Build Coastguard Worker   //
90*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.halving_add_signed_alt(short[], short[], short[]) loop_optimization (after)
91*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
92*795d594fSAndroid Build Coastguard Worker   //
93*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
94*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
95*795d594fSAndroid Build Coastguard Worker   //
96*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
97*795d594fSAndroid Build Coastguard Worker   //
98*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
99*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
100*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
101*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
102*795d594fSAndroid Build Coastguard Worker   //
103*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
halving_add_signed_alt(short[] b1, short[] b2, short[] bo)104*795d594fSAndroid Build Coastguard Worker   private static void halving_add_signed_alt(short[] b1, short[] b2, short[] bo) {
    // Variant of the signed, non-rounding halving add in which each operand carries a
    // constant offset (+10 and -10) whose sum is zero. The checker directives above still
    // expect VecHalvingAdd with packed_type:Int16 rounded:false on ARM, and on ARM64
    // unless the SVE / predicated-SIMD condition of the CHECK-IF holds.
    //
    // Do not simplify the constants away: the "before" directives match the three Adds
    // with IntConstant 10 and IntConstant -10.
    //
    // Visit only the indices that exist in all three arrays.
105*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
106*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
107*795d594fSAndroid Build Coastguard Worker       // Cancelling constant computations do not confuse recognition.
108*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) (((b1[i] + 10) + (b2[i] - 10)) >> 1);
109*795d594fSAndroid Build Coastguard Worker     }
110*795d594fSAndroid Build Coastguard Worker   }
111*795d594fSAndroid Build Coastguard Worker 
112*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.halving_add_unsigned(short[], short[], short[]) instruction_simplifier (before)
113*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
114*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
115*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
116*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
117*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
118*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<UMAX>>]             loop:<<Loop>>      outer_loop:none
119*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<And2:i\d+>> And [<<UMAX>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
120*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add:i\d+>>  Add [<<And1>>,<<And2>>]             loop:<<Loop>>      outer_loop:none
121*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
122*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
123*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>      outer_loop:none
124*795d594fSAndroid Build Coastguard Worker   //
125*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.halving_add_unsigned(short[], short[], short[]) loop_optimization (before)
126*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
127*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
128*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
129*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
130*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
131*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
132*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
133*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
134*795d594fSAndroid Build Coastguard Worker   //
135*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.halving_add_unsigned(short[], short[], short[]) loop_optimization (after)
136*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
137*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
138*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
139*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
140*795d594fSAndroid Build Coastguard Worker   //
141*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.halving_add_unsigned(short[], short[], short[]) loop_optimization (after)
142*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
143*795d594fSAndroid Build Coastguard Worker   //
144*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
145*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
146*795d594fSAndroid Build Coastguard Worker   //
147*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
148*795d594fSAndroid Build Coastguard Worker   //
149*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
150*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
151*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
152*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
153*795d594fSAndroid Build Coastguard Worker   //
154*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
halving_add_unsigned(short[] b1, short[] b2, short[] bo)155*795d594fSAndroid Build Coastguard Worker   private static void halving_add_unsigned(short[] b1, short[] b2, short[] bo) {
    // Unsigned halving add without rounding: each short is masked with 0xffff so it is
    // treated as a value in 0..65535, the two values are added, and the sum is shifted
    // right by one before being narrowed back to short.
    //
    // The checker directives above expect the two And-with-65535 operations to be present
    // before instruction_simplifier and absent before loop_optimization (where the loads
    // are matched with type "c" instead), and expect VecHalvingAdd with
    // packed_type:Uint16 rounded:false on ARM, and on ARM64 unless the SVE /
    // predicated-SIMD condition of the CHECK-IF holds.
    //
    // Visit only the indices that exist in all three arrays.
156*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
157*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
      // Keep only the low 16 bits of each (sign-extended) element.
158*795d594fSAndroid Build Coastguard Worker       int v1 = b1[i] & 0xffff;
159*795d594fSAndroid Build Coastguard Worker       int v2 = b2[i] & 0xffff;
160*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) ((v1 + v2) >> 1);
161*795d594fSAndroid Build Coastguard Worker     }
162*795d594fSAndroid Build Coastguard Worker   }
163*795d594fSAndroid Build Coastguard Worker 
164*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.rounding_halving_add_signed(short[], short[], short[]) loop_optimization (before)
165*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
166*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
167*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
168*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
169*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
170*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
171*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
172*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
173*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
174*795d594fSAndroid Build Coastguard Worker   //
175*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.rounding_halving_add_signed(short[], short[], short[]) loop_optimization (after)
176*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
177*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
178*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
179*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
180*795d594fSAndroid Build Coastguard Worker   //
181*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.rounding_halving_add_signed(short[], short[], short[]) loop_optimization (after)
182*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
183*795d594fSAndroid Build Coastguard Worker   //
184*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
185*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
186*795d594fSAndroid Build Coastguard Worker   //
187*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
188*795d594fSAndroid Build Coastguard Worker   //
189*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
190*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
191*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
192*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
193*795d594fSAndroid Build Coastguard Worker   //
194*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
rounding_halving_add_signed(short[] b1, short[] b2, short[] bo)195*795d594fSAndroid Build Coastguard Worker   private static void rounding_halving_add_signed(short[] b1, short[] b2, short[] bo) {
    // Signed rounding halving add: bo[i] receives (b1[i] + b2[i] + 1) >> 1, narrowed back
    // to short. The checker directives above expect VecHalvingAdd with packed_type:Int16
    // rounded:true on ARM, and on ARM64 unless the SVE / predicated-SIMD condition of the
    // CHECK-IF holds.
    //
    // Do not reshape the expression: the "before" directives match
    // Add[Get1,Get2] -> Add[...,1] -> Shr -> TypeConversion in exactly this order.
    //
    // Visit only the indices that exist in all three arrays.
196*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
197*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
      // The +1 before the shift is what makes this the rounding form.
198*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) ((b1[i] + b2[i] + 1) >> 1);
199*795d594fSAndroid Build Coastguard Worker     }
200*795d594fSAndroid Build Coastguard Worker   }
201*795d594fSAndroid Build Coastguard Worker 
202*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.rounding_halving_add_signed_alt(short[], short[], short[]) loop_optimization (before)
203*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
204*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
205*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
206*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
207*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
208*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
209*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
210*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
211*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
212*795d594fSAndroid Build Coastguard Worker   //
213*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.rounding_halving_add_signed_alt(short[], short[], short[]) loop_optimization (after)
214*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
215*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
216*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
217*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
218*795d594fSAndroid Build Coastguard Worker   //
219*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.rounding_halving_add_signed_alt(short[], short[], short[]) loop_optimization (after)
220*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
221*795d594fSAndroid Build Coastguard Worker   //
222*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
223*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
224*795d594fSAndroid Build Coastguard Worker   //
225*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
226*795d594fSAndroid Build Coastguard Worker   //
227*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
228*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
229*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
230*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
231*795d594fSAndroid Build Coastguard Worker   //
232*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
rounding_halving_add_signed_alt(short[] b1, short[] b2, short[] bo)233*795d594fSAndroid Build Coastguard Worker   private static void rounding_halving_add_signed_alt(short[] b1, short[] b2, short[] bo) {
    // Signed rounding halving add with the +1 attached to the first operand instead of
    // to the sum. The checker directives above still expect VecHalvingAdd with
    // packed_type:Int16 rounded:true on ARM, and on ARM64 unless the SVE /
    // predicated-SIMD condition of the CHECK-IF holds.
    //
    // Do not reorder the operands: the "before" directives match
    // Add[Get1,1] -> Add[...,Get2] -> Shr -> TypeConversion.
    //
    // Visit only the indices that exist in all three arrays.
234*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
235*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
236*795d594fSAndroid Build Coastguard Worker       // Slightly different order in idiom does not confuse recognition.
237*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) (((1 + b1[i]) + b2[i]) >> 1);
238*795d594fSAndroid Build Coastguard Worker     }
239*795d594fSAndroid Build Coastguard Worker   }
240*795d594fSAndroid Build Coastguard Worker 
241*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.rounding_halving_add_signed_alt2(short[], short[], short[]) loop_optimization (before)
242*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
243*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I10:i\d+>>  IntConstant 10                      loop:none
244*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<M9:i\d+>>   IntConstant -9                      loop:none
245*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
246*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
247*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
248*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<I10>>]              loop:<<Loop>>      outer_loop:none
249*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Get2>>,<<M9>>]               loop:<<Loop>>      outer_loop:none
250*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add3:i\d+>> Add [<<Add1>>,<<Add2>>]             loop:<<Loop>>      outer_loop:none
251*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add3>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
252*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
253*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
254*795d594fSAndroid Build Coastguard Worker   //
255*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.rounding_halving_add_signed_alt2(short[], short[], short[]) loop_optimization (after)
256*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
257*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
258*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
259*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
260*795d594fSAndroid Build Coastguard Worker   //
261*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.rounding_halving_add_signed_alt2(short[], short[], short[]) loop_optimization (after)
262*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
263*795d594fSAndroid Build Coastguard Worker   //
264*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
265*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
266*795d594fSAndroid Build Coastguard Worker   //
267*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
268*795d594fSAndroid Build Coastguard Worker   //
269*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
270*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
271*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
272*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
273*795d594fSAndroid Build Coastguard Worker   //
274*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
rounding_halving_add_signed_alt2(short[] b1, short[] b2, short[] bo)275*795d594fSAndroid Build Coastguard Worker   private static void rounding_halving_add_signed_alt2(short[] b1, short[] b2, short[] bo) {
    // Signed rounding halving add in which the rounding +1 is hidden in per-operand
    // offsets: +10 on the first operand and -9 on the second, which sum to +1. The
    // checker directives above still expect VecHalvingAdd with packed_type:Int16
    // rounded:true on ARM, and on ARM64 unless the SVE / predicated-SIMD condition of
    // the CHECK-IF holds.
    //
    // Do not fold the constants: the "before" directives match the Adds with
    // IntConstant 10 and IntConstant -9.
    //
    // Visit only the indices that exist in all three arrays.
276*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
277*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
278*795d594fSAndroid Build Coastguard Worker       // Computations that cancel to adding 1 also do not confuse recognition.
279*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) (((b1[i] + 10) + (b2[i] - 9)) >> 1);
280*795d594fSAndroid Build Coastguard Worker     }
281*795d594fSAndroid Build Coastguard Worker   }
282*795d594fSAndroid Build Coastguard Worker 
283*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.rounding_halving_add_signed_alt3(short[], short[], short[]) loop_optimization (before)
284*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
285*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<M1:i\d+>>   IntConstant -1                      loop:none
286*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I9:i\d+>>   IntConstant 9                       loop:none
287*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<M9:i\d+>>   IntConstant -9                      loop:none
288*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
289*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
290*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
291*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<I9>>]               loop:<<Loop>>      outer_loop:none
292*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Get2>>,<<M9>>]               loop:<<Loop>>      outer_loop:none
293*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add3:i\d+>> Add [<<Add1>>,<<Add2>>]             loop:<<Loop>>      outer_loop:none
294*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Sub:i\d+>>  Sub [<<Add3>>,<<M1>>]               loop:<<Loop>>      outer_loop:none
295*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Sub>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
296*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
297*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
298*795d594fSAndroid Build Coastguard Worker   //
299*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.rounding_halving_add_signed_alt3(short[], short[], short[]) loop_optimization (after)
300*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
301*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
302*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
303*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
304*795d594fSAndroid Build Coastguard Worker   //
305*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.rounding_halving_add_signed_alt3(short[], short[], short[]) loop_optimization (after)
306*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
307*795d594fSAndroid Build Coastguard Worker   //
308*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
309*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
310*795d594fSAndroid Build Coastguard Worker   //
311*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
312*795d594fSAndroid Build Coastguard Worker   //
313*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
314*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
315*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
316*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
317*795d594fSAndroid Build Coastguard Worker   //
318*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
rounding_halving_add_signed_alt3(short[] b1, short[] b2, short[] bo)319*795d594fSAndroid Build Coastguard Worker   private static void rounding_halving_add_signed_alt3(short[] b1, short[] b2, short[] bo) {
    // Signed rounding halving add where the rounding term comes from a subtraction.
    // For each index i, stores ((b1[i] + 9) + (b2[i] - 9) - $inline$mone()) >> 1,
    // narrowed to short, in bo[i].
    // The +9 and -9 offsets cancel. The CHECK lines for this method expect the call
    // to $inline$mone() to appear as IntConstant -1 feeding a Sub, so subtracting it
    // supplies the +1 rounding term and the result equals (b1[i] + b2[i] + 1) >> 1.
    //
    // b1, b2: input arrays (read only).
    // bo:     output array (written).
    // Only the first min(bo.length, b1.length, b2.length) elements are processed.
    //
    // The expression is deliberately not simplified: the CHECK lines match this
    // exact Add/Add/Add/Sub/Shr structure.
320*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
321*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
322*795d594fSAndroid Build Coastguard Worker       // Computations that cancel to adding 1 also do not confuse recognition.
323*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) (((b1[i] + 9) + (b2[i] - 9) - $inline$mone()) >> 1);
324*795d594fSAndroid Build Coastguard Worker     }
325*795d594fSAndroid Build Coastguard Worker   }
326*795d594fSAndroid Build Coastguard Worker 
327*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.rounding_halving_add_unsigned(short[], short[], short[]) instruction_simplifier (before)
328*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
329*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
330*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
331*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
332*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
333*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<UMAX>>]             loop:<<Loop>>      outer_loop:none
334*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<And2:i\d+>> And [<<UMAX>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
335*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<And1>>,<<And2>>]             loop:<<Loop>>      outer_loop:none
336*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
337*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
338*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
339*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>      outer_loop:none
340*795d594fSAndroid Build Coastguard Worker   //
341*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.rounding_halving_add_unsigned(short[], short[], short[]) loop_optimization (before)
342*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
343*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
344*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
345*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
346*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
347*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
348*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
349*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
350*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
351*795d594fSAndroid Build Coastguard Worker   //
352*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.rounding_halving_add_unsigned(short[], short[], short[]) loop_optimization (after)
353*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
354*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
355*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
356*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
357*795d594fSAndroid Build Coastguard Worker   //
358*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.rounding_halving_add_unsigned(short[], short[], short[]) loop_optimization (after)
359*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
360*795d594fSAndroid Build Coastguard Worker   //
361*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
362*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
363*795d594fSAndroid Build Coastguard Worker   //
364*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
365*795d594fSAndroid Build Coastguard Worker   //
366*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
367*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
368*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
369*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
370*795d594fSAndroid Build Coastguard Worker   //
371*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
rounding_halving_add_unsigned(short[] b1, short[] b2, short[] bo)372*795d594fSAndroid Build Coastguard Worker   private static void rounding_halving_add_unsigned(short[] b1, short[] b2, short[] bo) {
    // Unsigned rounding halving add.
    // For each index i, reinterprets b1[i] and b2[i] as unsigned 16-bit values,
    // then stores (v1 + v2 + 1) >> 1, narrowed to short, in bo[i].
    //
    // b1, b2: input arrays (read only).
    // bo:     output array (written).
    // Only the first min(bo.length, b1.length, b2.length) elements are processed.
    //
    // The CHECK lines for this method expect the vectorized form to be a
    // VecHalvingAdd with packed_type:Uint16 rounded:true (except in the SVE case).
373*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
374*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
      // Masking with 0xffff drops the sign extension, yielding a value in 0..65535.
375*795d594fSAndroid Build Coastguard Worker       int v1 = b1[i] & 0xffff;
376*795d594fSAndroid Build Coastguard Worker       int v2 = b2[i] & 0xffff;
      // The sum is computed in int, so it cannot overflow before the shift.
377*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) ((v1 + v2 + 1) >> 1);
378*795d594fSAndroid Build Coastguard Worker     }
379*795d594fSAndroid Build Coastguard Worker   }
380*795d594fSAndroid Build Coastguard Worker 
381*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.rounding_halving_add_unsigned_alt(short[], short[], short[]) instruction_simplifier (before)
382*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
383*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
384*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
385*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
386*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:s\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
387*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<UMAX>>]             loop:<<Loop>>      outer_loop:none
388*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<And2:i\d+>> And [<<UMAX>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
389*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<And2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
390*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<And1>>]             loop:<<Loop>>      outer_loop:none
391*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
392*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
393*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>      outer_loop:none
394*795d594fSAndroid Build Coastguard Worker   //
395*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.rounding_halving_add_unsigned_alt(short[], short[], short[]) loop_optimization (before)
396*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
397*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
398*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
399*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
400*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
401*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add2:i\d+>> Add [<<Get1>>,<<Add1>>]             loop:<<Loop>>      outer_loop:none
402*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add2>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
403*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
404*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
405*795d594fSAndroid Build Coastguard Worker   //
406*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.rounding_halving_add_unsigned_alt(short[], short[], short[]) loop_optimization (after)
407*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
408*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
409*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
410*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
411*795d594fSAndroid Build Coastguard Worker   //
412*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.rounding_halving_add_unsigned_alt(short[], short[], short[]) loop_optimization (after)
413*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
414*795d594fSAndroid Build Coastguard Worker   //
415*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
416*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
417*795d594fSAndroid Build Coastguard Worker   //
418*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
419*795d594fSAndroid Build Coastguard Worker   //
420*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
421*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
422*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
423*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
424*795d594fSAndroid Build Coastguard Worker   //
425*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
rounding_halving_add_unsigned_alt(short[] b1, short[] b2, short[] bo)426*795d594fSAndroid Build Coastguard Worker   private static void rounding_halving_add_unsigned_alt(short[] b1, short[] b2, short[] bo) {
    // Unsigned rounding halving add with the +1 grouped onto the second operand.
    // For each index i, reinterprets b1[i] and b2[i] as unsigned 16-bit values,
    // then stores (v1 + (v2 + 1)) >> 1, narrowed to short, in bo[i].
    //
    // b1, b2: input arrays (read only).
    // bo:     output array (written).
    // Only the first min(bo.length, b1.length, b2.length) elements are processed.
    //
    // The operand grouping is intentional: the CHECK lines for this method match
    // Add [Get2, 1] feeding Add [Get1, ...] before loop optimization.
427*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
428*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
429*795d594fSAndroid Build Coastguard Worker       // Slightly different order in idiom does not confuse recognition.
      // Masking with 0xffff drops the sign extension, yielding a value in 0..65535.
430*795d594fSAndroid Build Coastguard Worker       int v1 = b1[i] & 0xffff;
431*795d594fSAndroid Build Coastguard Worker       int v2 = b2[i] & 0xffff;
      // '+' binds tighter than '>>', so the shift applies to the whole sum
      // v1 + (v2 + 1), not just to (v2 + 1).
432*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) (v1 + (v2 + 1) >> 1);
433*795d594fSAndroid Build Coastguard Worker     }
434*795d594fSAndroid Build Coastguard Worker   }
435*795d594fSAndroid Build Coastguard Worker 
436*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.halving_add_signed_constant(short[], short[]) loop_optimization (before)
437*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
438*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<SMAX:i\d+>> IntConstant 32767                   loop:none
439*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
440*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get:s\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
441*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get>>,<<SMAX>>]              loop:<<Loop>>      outer_loop:none
442*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
443*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
444*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
445*795d594fSAndroid Build Coastguard Worker   //
446*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.halving_add_signed_constant(short[], short[]) loop_optimization (after)
447*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<SMAX:i\d+>> IntConstant 32767                     loop:none
448*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<SMAX>>]         loop:none
449*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
450*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
451*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
452*795d594fSAndroid Build Coastguard Worker   //
453*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.halving_add_signed_constant(short[], short[]) loop_optimization (after)
454*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
455*795d594fSAndroid Build Coastguard Worker   //
456*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
457*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
458*795d594fSAndroid Build Coastguard Worker   //
459*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
460*795d594fSAndroid Build Coastguard Worker   //
461*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<SMAX:i\d+>> IntConstant 32767                     loop:none
462*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<SMAX>>]         loop:none
463*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
464*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
465*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
466*795d594fSAndroid Build Coastguard Worker   //
467*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
halving_add_signed_constant(short[] b1, short[] bo)468*795d594fSAndroid Build Coastguard Worker   private static void halving_add_signed_constant(short[] b1, short[] bo) {
    // Signed (non-rounding) halving add of each element with the constant 0x7fff (32767).
    // For each index i, stores (b1[i] + 0x7fff) >> 1, narrowed to short, in bo[i].
    // b1[i] is promoted to int before the addition, and >> is an arithmetic shift.
    //
    // b1: input array (read only).
    // bo: output array (written).
    // Only the first min(bo.length, b1.length) elements are processed.
    //
    // The CHECK lines for this method expect the constant to be broadcast with
    // VecReplicateScalar and combined via VecHalvingAdd packed_type:Int16
    // rounded:false (except in the SVE case).
469*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, b1.length);
470*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
471*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) ((b1[i] + 0x7fff) >> 1);
472*795d594fSAndroid Build Coastguard Worker     }
473*795d594fSAndroid Build Coastguard Worker   }
474*795d594fSAndroid Build Coastguard Worker 
475*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.halving_add_unsigned_constant(short[], short[]) instruction_simplifier (before)
476*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
477*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
478*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
479*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get:s\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
480*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<And:i\d+>>  And [<<Get>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
481*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add:i\d+>>  Add [<<And>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
482*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
483*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
484*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>      outer_loop:none
485*795d594fSAndroid Build Coastguard Worker   //
486*795d594fSAndroid Build Coastguard Worker   /// CHECK-START: void HaddShort.halving_add_unsigned_constant(short[], short[]) loop_optimization (before)
487*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
488*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
489*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
490*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get:c\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
491*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
492*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Shr:i\d+>>  Shr [<<Add>>,<<I1>>]                loop:<<Loop>>      outer_loop:none
493*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Cnv:s\d+>>  TypeConversion [<<Shr>>]            loop:<<Loop>>      outer_loop:none
494*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
495*795d594fSAndroid Build Coastguard Worker   //
496*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM: void HaddShort.halving_add_unsigned_constant(short[], short[]) loop_optimization (after)
497*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
498*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
499*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
500*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
501*795d594fSAndroid Build Coastguard Worker   /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
502*795d594fSAndroid Build Coastguard Worker   //
503*795d594fSAndroid Build Coastguard Worker   /// CHECK-START-ARM64: void HaddShort.halving_add_unsigned_constant(short[], short[]) loop_optimization (after)
504*795d594fSAndroid Build Coastguard Worker   /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
505*795d594fSAndroid Build Coastguard Worker   //
506*795d594fSAndroid Build Coastguard Worker   //      HalvingAdd idiom is not supported for SVE.
507*795d594fSAndroid Build Coastguard Worker   ///     CHECK-NOT: VecHalvingAdd
508*795d594fSAndroid Build Coastguard Worker   //
509*795d594fSAndroid Build Coastguard Worker   /// CHECK-ELSE:
510*795d594fSAndroid Build Coastguard Worker   //
511*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
512*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
513*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
514*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
515*795d594fSAndroid Build Coastguard Worker   ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
516*795d594fSAndroid Build Coastguard Worker   //
517*795d594fSAndroid Build Coastguard Worker   /// CHECK-FI:
halving_add_unsigned_constant(short[] b1, short[] bo)518*795d594fSAndroid Build Coastguard Worker   private static void halving_add_unsigned_constant(short[] b1, short[] bo) {
    // Unsigned (non-rounding) halving add of each element with the constant 0xffff (65535).
    // For each index i, reinterprets b1[i] as an unsigned 16-bit value via & 0xffff,
    // then stores (value + 0xffff) >> 1, narrowed to short, in bo[i].
    // The sum is computed in int, so it cannot overflow before the shift.
    //
    // b1: input array (read only).
    // bo: output array (written).
    // Only the first min(bo.length, b1.length) elements are processed.
    //
    // The CHECK lines for this method expect the constant to be broadcast with
    // VecReplicateScalar and combined via VecHalvingAdd packed_type:Uint16
    // rounded:false (except in the SVE case).
519*795d594fSAndroid Build Coastguard Worker     int min_length = Math.min(bo.length, b1.length);
520*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < min_length; i++) {
521*795d594fSAndroid Build Coastguard Worker       bo[i] = (short) (((b1[i] & 0xffff) + 0xffff) >> 1);
522*795d594fSAndroid Build Coastguard Worker     }
523*795d594fSAndroid Build Coastguard Worker   }
524*795d594fSAndroid Build Coastguard Worker 
main()525*795d594fSAndroid Build Coastguard Worker   public static void main() {
526*795d594fSAndroid Build Coastguard Worker     // Some interesting values.
527*795d594fSAndroid Build Coastguard Worker     short[] interesting = {
528*795d594fSAndroid Build Coastguard Worker       (short) 0x0000,
529*795d594fSAndroid Build Coastguard Worker       (short) 0x0001,
530*795d594fSAndroid Build Coastguard Worker       (short) 0x0002,
531*795d594fSAndroid Build Coastguard Worker       (short) 0x1234,
532*795d594fSAndroid Build Coastguard Worker       (short) 0x8000,
533*795d594fSAndroid Build Coastguard Worker       (short) 0x8001,
534*795d594fSAndroid Build Coastguard Worker       (short) 0x7fff,
535*795d594fSAndroid Build Coastguard Worker       (short) 0xffff
536*795d594fSAndroid Build Coastguard Worker     };
537*795d594fSAndroid Build Coastguard Worker     // Initialize cross-values to test all cases, and also
538*795d594fSAndroid Build Coastguard Worker     // set up some extra values to exercise the cleanup loop.
539*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
540*795d594fSAndroid Build Coastguard Worker       sB1[i] = (short) i;
541*795d594fSAndroid Build Coastguard Worker       sB2[i] = interesting[i & 7];
542*795d594fSAndroid Build Coastguard Worker     }
543*795d594fSAndroid Build Coastguard Worker 
544*795d594fSAndroid Build Coastguard Worker     // Test halving add idioms.
545*795d594fSAndroid Build Coastguard Worker     halving_add_signed(sB1, sB2, sBo);
546*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
547*795d594fSAndroid Build Coastguard Worker       short e = (short) ((sB1[i] + sB2[i]) >> 1);
548*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
549*795d594fSAndroid Build Coastguard Worker     }
550*795d594fSAndroid Build Coastguard Worker     halving_add_signed_alt(sB1, sB2, sBo);
551*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
552*795d594fSAndroid Build Coastguard Worker       short e = (short) ((sB1[i] + sB2[i]) >> 1);
553*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
554*795d594fSAndroid Build Coastguard Worker     }
555*795d594fSAndroid Build Coastguard Worker     halving_add_unsigned(sB1, sB2, sBo);
556*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
557*795d594fSAndroid Build Coastguard Worker       short e = (short) (((sB1[i] & 0xffff) + (sB2[i] & 0xffff)) >> 1);
558*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
559*795d594fSAndroid Build Coastguard Worker     }
560*795d594fSAndroid Build Coastguard Worker     rounding_halving_add_signed(sB1, sB2, sBo);
561*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
562*795d594fSAndroid Build Coastguard Worker       short e = (short) ((sB1[i] + sB2[i] + 1) >> 1);
563*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
564*795d594fSAndroid Build Coastguard Worker     }
565*795d594fSAndroid Build Coastguard Worker     rounding_halving_add_signed_alt(sB1, sB2, sBo);
566*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
567*795d594fSAndroid Build Coastguard Worker       short e = (short) ((sB1[i] + sB2[i] + 1) >> 1);
568*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
569*795d594fSAndroid Build Coastguard Worker     }
570*795d594fSAndroid Build Coastguard Worker     rounding_halving_add_signed_alt2(sB1, sB2, sBo);
571*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
572*795d594fSAndroid Build Coastguard Worker       short e = (short) ((sB1[i] + sB2[i] + 1) >> 1);
573*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
574*795d594fSAndroid Build Coastguard Worker     }
575*795d594fSAndroid Build Coastguard Worker     rounding_halving_add_signed_alt3(sB1, sB2, sBo);
576*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
577*795d594fSAndroid Build Coastguard Worker       short e = (short) ((sB1[i] + sB2[i] + 1) >> 1);
578*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
579*795d594fSAndroid Build Coastguard Worker     }
580*795d594fSAndroid Build Coastguard Worker     rounding_halving_add_unsigned(sB1, sB2, sBo);
581*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
582*795d594fSAndroid Build Coastguard Worker       short e = (short) (((sB1[i] & 0xffff) + (sB2[i] & 0xffff) + 1) >> 1);
583*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
584*795d594fSAndroid Build Coastguard Worker     }
585*795d594fSAndroid Build Coastguard Worker     rounding_halving_add_unsigned_alt(sB1, sB2, sBo);
586*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
587*795d594fSAndroid Build Coastguard Worker       short e = (short) (((sB1[i] & 0xffff) + (sB2[i] & 0xffff) + 1) >> 1);
588*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
589*795d594fSAndroid Build Coastguard Worker     }
590*795d594fSAndroid Build Coastguard Worker     halving_add_signed_constant(sB1, sBo);
591*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
592*795d594fSAndroid Build Coastguard Worker       short e = (short) ((sB1[i] + 0x7fff) >> 1);
593*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
594*795d594fSAndroid Build Coastguard Worker     }
595*795d594fSAndroid Build Coastguard Worker     halving_add_unsigned_constant(sB1, sBo);
596*795d594fSAndroid Build Coastguard Worker     for (int i = 0; i < M; i++) {
597*795d594fSAndroid Build Coastguard Worker       short e = (short) (((sB1[i] & 0xffff) + 0xffff) >> 1);
598*795d594fSAndroid Build Coastguard Worker       expectEquals(e, sBo[i]);
599*795d594fSAndroid Build Coastguard Worker     }
600*795d594fSAndroid Build Coastguard Worker 
601*795d594fSAndroid Build Coastguard Worker     System.out.println("HaddShort passed");
602*795d594fSAndroid Build Coastguard Worker   }
603*795d594fSAndroid Build Coastguard Worker 
expectEquals(int expected, int result)604*795d594fSAndroid Build Coastguard Worker   private static void expectEquals(int expected, int result) {
605*795d594fSAndroid Build Coastguard Worker     if (expected != result) {
606*795d594fSAndroid Build Coastguard Worker       throw new Error("Expected: " + expected + ", found: " + result);
607*795d594fSAndroid Build Coastguard Worker     }
608*795d594fSAndroid Build Coastguard Worker   }
609*795d594fSAndroid Build Coastguard Worker }
610