; RUN: llc < %s -march=x86 -mattr=+sse4.2 | FileCheck %s
; RUN: llc < %s -march=x86 -mattr=+sse4.2 -x86-experimental-vector-widening-legalization | FileCheck %s --check-prefix=CHECK-WIDE

; Codegen test for an <8 x i8> "add 1, then arithmetic shift right by 2" on
; 32-bit x86 with SSE4.2.
;
; @update(dst_i, src_i, n) runs a counted loop (signed compare of %i against
; %n). Each iteration loads an <8 x i8> through a pointer derived from %src_i,
; adds 1 to every lane, arithmetic-shifts every lane right by 2 and stores the
; result through a pointer derived from %dst_i.
;
; The first llc invocation uses the default vector legalization and is checked
; with the default prefix; the second enables
; -x86-experimental-vector-widening-legalization and is checked with the
; CHECK-WIDE prefix.
;
; NOTE(review): every local lives in an alloca and is reloaded on each use
; (this looks like unoptimized front-end output). The expected instruction
; sequences below were presumably recorded against exactly this IR, so do not
; simplify the function body without regenerating them.

define void @update(i64* %dst_i, i64* %src_i, i32 %n) nounwind {
; CHECK-LABEL: update:
; CHECK-WIDE-LABEL: update:
entry:
  ; Stack slots for the three arguments, the loop counter and the two
  ; per-iteration vector pointers.
  %dst_i.addr = alloca i64*
  %src_i.addr = alloca i64*
  %n.addr = alloca i32
  %i = alloca i32, align 4
  %dst = alloca <8 x i8>*, align 4
  %src = alloca <8 x i8>*, align 4
  store i64* %dst_i, i64** %dst_i.addr
  store i64* %src_i, i64** %src_i.addr
  store i32 %n, i32* %n.addr
  ; i = 0
  store i32 0, i32* %i
  br label %forcond

forcond:                                          ; preds = %forinc, %entry
  ; Continue while i < n (signed).
  %tmp = load i32, i32* %i
  %tmp1 = load i32, i32* %n.addr
  %cmp = icmp slt i32 %tmp, %tmp1
  br i1 %cmp, label %forbody, label %afterfor

forbody:                                          ; preds = %forcond
  ; dst = (<8 x i8>*) &dst_i[i]
  %tmp2 = load i32, i32* %i
  %tmp3 = load i64*, i64** %dst_i.addr
  %arrayidx = getelementptr i64, i64* %tmp3, i32 %tmp2
  %conv = bitcast i64* %arrayidx to <8 x i8>*
  store <8 x i8>* %conv, <8 x i8>** %dst
  ; src = (<8 x i8>*) &src_i[i]
  %tmp4 = load i32, i32* %i
  %tmp5 = load i64*, i64** %src_i.addr
  %arrayidx6 = getelementptr i64, i64* %tmp5, i32 %tmp4
  %conv7 = bitcast i64* %arrayidx6 to <8 x i8>*
  store <8 x i8>* %conv7, <8 x i8>** %src
  ; Note that both pointers are indexed by %i a second time here, on top of
  ; the indexing already applied when %dst and %src were computed above.
  %tmp8 = load i32, i32* %i
  %tmp9 = load <8 x i8>*, <8 x i8>** %dst
  %arrayidx10 = getelementptr <8 x i8>, <8 x i8>* %tmp9, i32 %tmp8
  %tmp11 = load i32, i32* %i
  %tmp12 = load <8 x i8>*, <8 x i8>** %src
  %arrayidx13 = getelementptr <8 x i8>, <8 x i8>* %tmp12, i32 %tmp11
  ; The operation under test: dst[i] = (src[i] + 1) >> 2, lane-wise on i8.
  %tmp14 = load <8 x i8>, <8 x i8>* %arrayidx13
  %add = add <8 x i8> %tmp14, < i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1 >
  %shr = ashr <8 x i8> %add, < i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2, i8 2 >
  store <8 x i8> %shr, <8 x i8>* %arrayidx10
  br label %forinc
; Default legalization: the expected sequence works on 16-bit lanes
; (pmovzxbw, then word-sized add and shifts) and packs back to bytes with
; pshufb before the 64-bit store.
; CHECK: %forbody
; CHECK: pmovzxbw
; CHECK-NEXT: paddw
; CHECK-NEXT: psllw $8
; CHECK-NEXT: psraw $8
; CHECK-NEXT: psraw $2
; CHECK-NEXT: pshufb
; CHECK-NEXT: movq
;
; Widening legalization: the expected sequence stays on byte lanes (paddb);
; the psrlw/pand/pxor/psubb run is presumably the emulation of a per-byte
; arithmetic shift.
; FIXME: We shouldn't require both a movd and an insert.
; CHECK-WIDE: %forbody
; CHECK-WIDE: movd
; CHECK-WIDE-NEXT: pinsrd
; CHECK-WIDE-NEXT: paddb
; CHECK-WIDE-NEXT: psrlw $2
; CHECK-WIDE-NEXT: pand
; CHECK-WIDE-NEXT: pxor
; CHECK-WIDE-NEXT: psubb
; CHECK-WIDE-NEXT: pextrd
; CHECK-WIDE-NEXT: movd

forinc:                                           ; preds = %forbody
  ; i = i + 1
  %tmp15 = load i32, i32* %i
  %inc = add i32 %tmp15, 1
  store i32 %inc, i32* %i
  br label %forcond

afterfor:                                         ; preds = %forcond
  ret void
}