/*
 * Copyright (C) 2017 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/**
 * Tests for SAD (sum of absolute differences).
 *
 * <p>Every kernel below walks two byte arrays up to the shorter length and accumulates
 * {@code |b1[i] - b2[i]|} into an accumulator of a particular width (byte, short, int or long).
 * Each width comes in up to three source shapes: {@code Math.abs}, a ternary, and an explicit
 * negate-if-negative.
 *
 * <p>The {@code /// CHECK} comment lines are checker annotations that describe the expected
 * compiler graph before and after {@code loop_optimization}. They refer to the exact shape of the
 * Java code underneath them, so neither the annotations nor the kernel bodies should be
 * "cleaned up" independently of each other.
 */
public class SimdSadByte {

  // TODO: lower precision still coming, b/64091002

  /**
   * SAD into a {@code byte} accumulator using {@code Math.abs}.
   *
   * <p>The compound assignment narrows the int sum back to {@code byte} on every iteration, so
   * the result wraps modulo 256 (e.g. a single difference of 255 yields -1).
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the wrapped sum over the first {@code min(b1.length, b2.length)} elements
   */
  private static byte sadByte2Byte(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    byte sad = 0;
    for (int i = 0; i < min_length; i++) {
      sad += Math.abs(b1[i] - b2[i]);
    }
    return sad;
  }

  /**
   * SAD into a {@code byte} accumulator, absolute difference written as a ternary.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the sum, wrapped to {@code byte}, over the first {@code min(b1.length, b2.length)}
   *     elements
   */
  private static byte sadByte2ByteAlt(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    byte sad = 0;
    for (int i = 0; i < min_length; i++) {
      byte s = b1[i];
      byte p = b2[i];
      sad += s >= p ? s - p : p - s;
    }
    return sad;
  }

  /**
   * SAD into a {@code byte} accumulator, absolute difference written as negate-if-negative.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the sum, wrapped to {@code byte}, over the first {@code min(b1.length, b2.length)}
   *     elements
   */
  private static byte sadByte2ByteAlt2(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    byte sad = 0;
    for (int i = 0; i < min_length; i++) {
      byte s = b1[i];
      byte p = b2[i];
      int x = s - p;
      if (x < 0) x = -x;
      sad += x;
    }
    return sad;
  }

  /**
   * SAD into a {@code short} accumulator using {@code Math.abs}.
   *
   * <p>The compound assignment narrows the int sum back to {@code short} on every iteration, so
   * the result wraps modulo 65536.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the wrapped sum over the first {@code min(b1.length, b2.length)} elements
   */
  private static short sadByte2Short(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    short sad = 0;
    for (int i = 0; i < min_length; i++) {
      sad += Math.abs(b1[i] - b2[i]);
    }
    return sad;
  }

  /**
   * SAD into a {@code short} accumulator, absolute difference written as a ternary.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the sum, wrapped to {@code short}, over the first {@code min(b1.length, b2.length)}
   *     elements
   */
  private static short sadByte2ShortAlt(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    short sad = 0;
    for (int i = 0; i < min_length; i++) {
      byte s = b1[i];
      byte p = b2[i];
      sad += s >= p ? s - p : p - s;
    }
    return sad;
  }

  /**
   * SAD into a {@code short} accumulator, absolute difference written as negate-if-negative.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the sum, wrapped to {@code short}, over the first {@code min(b1.length, b2.length)}
   *     elements
   */
  private static short sadByte2ShortAlt2(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    short sad = 0;
    for (int i = 0; i < min_length; i++) {
      byte s = b1[i];
      byte p = b2[i];
      int x = s - p;
      if (x < 0) x = -x;
      sad += x;
    }
    return sad;
  }

  /**
   * SAD into an {@code int} accumulator using {@code Math.abs}.
   *
   * <p>The annotations below expect a scalar Sub/Abs/Add loop before loop optimization and, on
   * ARM64 without forced predicated (SVE) SIMD, a {@code VecSADAccumulate} loop stepping by 16
   * afterwards.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the sum over the first {@code min(b1.length, b2.length)} elements
   */
  /// CHECK-START: int SimdSadByte.sadByte2Int(byte[], byte[]) loop_optimization (before)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-DAG: <<Cons1:i\d+>>  IntConstant 1                  loop:none
  /// CHECK-DAG: <<Phi2:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get1:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Sub:i\d+>>    Sub [<<Get1>>,<<Get2>>]        loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Intrin:i\d+>> Abs [<<Sub>>]                  loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi2>>,<<Intrin>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons1>>]       loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: int SimdSadByte.sadByte2Int(byte[], byte[]) loop_optimization (after)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      SAD idiom is not supported for SVE.
  /// CHECK-NOT: VecSADAccumulate
  //
  /// CHECK-ELSE:
  //
  /// CHECK-DAG: <<Cons16:i\d+>> IntConstant 16                 loop:none
  /// CHECK-DAG: <<Set:d\d+>>    VecSetScalars [<<Cons0>>]      loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi2:d\d+>>   Phi [<<Set>>,{{d\d+}}]         loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load1:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load2:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<SAD:d\d+>>    VecSADAccumulate [<<Phi2>>,<<Load1>>,<<Load2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons16>>]      loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  private static int sadByte2Int(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    int sad = 0;
    for (int i = 0; i < min_length; i++) {
      sad += Math.abs(b1[i] - b2[i]);
    }
    return sad;
  }

  /**
   * SAD into an {@code int} accumulator, absolute difference written as a ternary.
   *
   * <p>Note that the annotations below expect the operands in the opposite order from
   * {@code sadByte2Int}: {@code Sub [Get2, Get1]} before and
   * {@code VecSADAccumulate [.., Load2, Load1]} after loop optimization.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the sum over the first {@code min(b1.length, b2.length)} elements
   */
  /// CHECK-START: int SimdSadByte.sadByte2IntAlt(byte[], byte[]) loop_optimization (before)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-DAG: <<Cons1:i\d+>>  IntConstant 1                  loop:none
  /// CHECK-DAG: <<Phi2:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get1:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Sub:i\d+>>    Sub [<<Get2>>,<<Get1>>]        loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Intrin:i\d+>> Abs [<<Sub>>]                  loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi2>>,<<Intrin>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons1>>]       loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: int SimdSadByte.sadByte2IntAlt(byte[], byte[]) loop_optimization (after)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      SAD idiom is not supported for SVE.
  /// CHECK-NOT: VecSADAccumulate
  //
  /// CHECK-ELSE:
  //
  /// CHECK-DAG: <<Cons16:i\d+>> IntConstant 16                 loop:none
  /// CHECK-DAG: <<Set:d\d+>>    VecSetScalars [<<Cons0>>]      loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi2:d\d+>>   Phi [<<Set>>,{{d\d+}}]         loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load1:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load2:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<SAD:d\d+>>    VecSADAccumulate [<<Phi2>>,<<Load2>>,<<Load1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons16>>]      loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  private static int sadByte2IntAlt(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    int sad = 0;
    for (int i = 0; i < min_length; i++) {
      byte s = b1[i];
      byte p = b2[i];
      sad += s >= p ? s - p : p - s;
    }
    return sad;
  }

  /**
   * SAD into an {@code int} accumulator, absolute difference written as negate-if-negative.
   *
   * <p>The annotations below expect the same graphs as for {@code sadByte2Int}.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the sum over the first {@code min(b1.length, b2.length)} elements
   */
  /// CHECK-START: int SimdSadByte.sadByte2IntAlt2(byte[], byte[]) loop_optimization (before)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-DAG: <<Cons1:i\d+>>  IntConstant 1                  loop:none
  /// CHECK-DAG: <<Phi2:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get1:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Sub:i\d+>>    Sub [<<Get1>>,<<Get2>>]        loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Intrin:i\d+>> Abs [<<Sub>>]                  loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi2>>,<<Intrin>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons1>>]       loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: int SimdSadByte.sadByte2IntAlt2(byte[], byte[]) loop_optimization (after)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      SAD idiom is not supported for SVE.
  /// CHECK-NOT: VecSADAccumulate
  //
  /// CHECK-ELSE:
  //
  /// CHECK-DAG: <<Cons16:i\d+>> IntConstant 16                 loop:none
  /// CHECK-DAG: <<Set:d\d+>>    VecSetScalars [<<Cons0>>]      loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi2:d\d+>>   Phi [<<Set>>,{{d\d+}}]         loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load1:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load2:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<SAD:d\d+>>    VecSADAccumulate [<<Phi2>>,<<Load1>>,<<Load2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons16>>]      loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  private static int sadByte2IntAlt2(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    int sad = 0;
    for (int i = 0; i < min_length; i++) {
      byte s = b1[i];
      byte p = b2[i];
      int x = s - p;
      if (x < 0) x = -x;
      sad += x;
    }
    return sad;
  }

  /**
   * SAD into a {@code long} accumulator; both operands are widened to {@code long} before the
   * subtraction, which is why the annotations below expect two TypeConversion nodes.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return the sum over the first {@code min(b1.length, b2.length)} elements
   */
  /// CHECK-START: long SimdSadByte.sadByte2Long(byte[], byte[]) loop_optimization (before)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-DAG: <<Cons1:i\d+>>  IntConstant 1                  loop:none
  /// CHECK-DAG: <<ConsL:j\d+>>  LongConstant 0                 loop:none

  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi2:j\d+>>   Phi [<<ConsL>>,{{j\d+}}]       loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get1:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv1:j\d+>>   TypeConversion [<<Get1>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv2:j\d+>>   TypeConversion [<<Get2>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Sub:j\d+>>    Sub [<<Cnv1>>,<<Cnv2>>]        loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Intrin:j\d+>> Abs [<<Sub>>]                  loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi2>>,<<Intrin>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons1>>]       loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: long SimdSadByte.sadByte2Long(byte[], byte[]) loop_optimization (after)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-DAG: <<ConsL:j\d+>>  LongConstant 0                 loop:none
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      SAD idiom is not supported for SVE.
  /// CHECK-NOT: VecSADAccumulate
  //
  /// CHECK-ELSE:
  //
  /// CHECK-DAG: <<Cons16:i\d+>> IntConstant 16                 loop:none
  /// CHECK-DAG: <<Set:d\d+>>    VecSetScalars [<<ConsL>>]      loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi2:d\d+>>   Phi [<<Set>>,{{d\d+}}]         loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load1:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load2:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<SAD:d\d+>>    VecSADAccumulate [<<Phi2>>,<<Load1>>,<<Load2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons16>>]      loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  private static long sadByte2Long(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    long sad = 0;
    for (int i = 0; i < min_length; i++) {
      long x = b1[i];
      long y = b2[i];
      sad += Math.abs(x - y);
    }
    return sad;
  }

  /**
   * Same as {@code sadByte2Long}, except that the accumulator starts at 1 rather than 0, so the
   * annotations below expect {@code LongConstant 1} as the initial value.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @return 1 plus the sum over the first {@code min(b1.length, b2.length)} elements
   */
  /// CHECK-START: long SimdSadByte.sadByte2LongAt1(byte[], byte[]) loop_optimization (before)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-DAG: <<Cons1:i\d+>>  IntConstant 1                  loop:none
  /// CHECK-DAG: <<ConsL:j\d+>>  LongConstant 1                 loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi2:j\d+>>   Phi [<<ConsL>>,{{j\d+}}]       loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get1:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:b\d+>>   ArrayGet [{{l\d+}},<<Phi1>>]   loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv1:j\d+>>   TypeConversion [<<Get1>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv2:j\d+>>   TypeConversion [<<Get2>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Sub:j\d+>>    Sub [<<Cnv1>>,<<Cnv2>>]        loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Intrin:j\d+>> Abs [<<Sub>>]                  loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi2>>,<<Intrin>>]      loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons1>>]       loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: long SimdSadByte.sadByte2LongAt1(byte[], byte[]) loop_optimization (after)
  /// CHECK-DAG: <<Cons0:i\d+>>  IntConstant 0                  loop:none
  /// CHECK-DAG: <<ConsL:j\d+>>  LongConstant 1                 loop:none
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      SAD idiom is not supported for SVE.
  /// CHECK-NOT: VecSADAccumulate
  //
  /// CHECK-ELSE:
  //
  /// CHECK-DAG: <<Cons16:i\d+>> IntConstant 16                 loop:none
  /// CHECK-DAG: <<Set:d\d+>>    VecSetScalars [<<ConsL>>]      loop:none
  /// CHECK-DAG: <<Phi1:i\d+>>   Phi [<<Cons0>>,{{i\d+}}]       loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Phi2:d\d+>>   Phi [<<Set>>,{{d\d+}}]         loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load1:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Load2:d\d+>>  VecLoad [{{l\d+}},<<Phi1>>]    loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<SAD:d\d+>>    VecSADAccumulate [<<Phi2>>,<<Load1>>,<<Load2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:                 Add [<<Phi1>>,<<Cons16>>]      loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  private static long sadByte2LongAt1(byte[] b1, byte[] b2) {
    int min_length = Math.min(b1.length, b2.length);
    long sad = 1;  // starts at 1
    for (int i = 0; i < min_length; i++) {
      long x = b1[i];
      long y = b2[i];
      sad += Math.abs(x - y);
    }
    return sad;
  }

  /**
   * Runs every kernel against fixed inputs and throws {@link Error} on the first mismatch.
   * Prints {@code "SimdSadByte passed"} when all expectations hold.
   *
   * <p>Deliberately takes no arguments; this is not a JVM entry point.
   */
  public static void main() {
    // Cross-test the two most extreme values individually.
    byte[] b1 = { 0, -128, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
    byte[] b2 = { 0,  127, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
    // |-128 - 127| == 255, which wraps to -1 in a byte accumulator.
    expectEquals(-1, sadByte2Byte(b1, b2));
    expectEquals(-1, sadByte2Byte(b2, b1));
    expectEquals(-1, sadByte2ByteAlt(b1, b2));
    expectEquals(-1, sadByte2ByteAlt(b2, b1));
    expectEquals(-1, sadByte2ByteAlt2(b1, b2));
    expectEquals(-1, sadByte2ByteAlt2(b2, b1));
    expectEquals(255, sadByte2Short(b1, b2));
    expectEquals(255, sadByte2Short(b2, b1));
    expectEquals(255, sadByte2ShortAlt(b1, b2));
    expectEquals(255, sadByte2ShortAlt(b2, b1));
    expectEquals(255, sadByte2ShortAlt2(b1, b2));
    expectEquals(255, sadByte2ShortAlt2(b2, b1));
    expectEquals(255, sadByte2Int(b1, b2));
    expectEquals(255, sadByte2Int(b2, b1));
    expectEquals(255, sadByte2IntAlt(b1, b2));
    expectEquals(255, sadByte2IntAlt(b2, b1));
    expectEquals(255, sadByte2IntAlt2(b1, b2));
    expectEquals(255, sadByte2IntAlt2(b2, b1));
    expectEquals(255L, sadByte2Long(b1, b2));
    expectEquals(255L, sadByte2Long(b2, b1));
    expectEquals(256L, sadByte2LongAt1(b1, b2));
    expectEquals(256L, sadByte2LongAt1(b2, b1));

    // Use cross-values to test all cases.
    // One for scalar cleanup.
    int n = 256;
    int m = n * n + 1;
    int k = 0;
    b1 = new byte[m];
    b2 = new byte[m];
    for (int i = 0; i < n; i++) {
      for (int j = 0; j < n; j++) {
        b1[k] = (byte) i;
        b2[k] = (byte) j;
        k++;
      }
    }
    // The extra trailing element contributes |10 - 2| == 8 to every sum.
    b1[k] = 10;
    b2[k] = 2;
    expectEquals(8, sadByte2Byte(b1, b2));
    expectEquals(8, sadByte2ByteAlt(b1, b2));
    expectEquals(8, sadByte2ByteAlt2(b1, b2));
    expectEquals(21768, sadByte2Short(b1, b2));
    expectEquals(21768, sadByte2ShortAlt(b1, b2));
    expectEquals(21768, sadByte2ShortAlt2(b1, b2));
    expectEquals(5592328, sadByte2Int(b1, b2));
    expectEquals(5592328, sadByte2IntAlt(b1, b2));
    expectEquals(5592328, sadByte2IntAlt2(b1, b2));
    expectEquals(5592328L, sadByte2Long(b1, b2));
    expectEquals(5592329L, sadByte2LongAt1(b1, b2));

    System.out.println("SimdSadByte passed");
  }

  /**
   * Fails the test when two {@code int} values differ.
   *
   * @param expected the value the test expects
   * @param result the value actually computed
   * @throws Error if {@code expected != result}
   */
  private static void expectEquals(int expected, int result) {
    if (expected != result) {
      throw new Error("Expected: " + expected + ", found: " + result);
    }
  }

  /**
   * Fails the test when two {@code long} values differ.
   *
   * @param expected the value the test expects
   * @param result the value actually computed
   * @throws Error if {@code expected != result}
   */
  private static void expectEquals(long expected, long result) {
    if (expected != result) {
      throw new Error("Expected: " + expected + ", found: " + result);
    }
  }
}