; RUN: llc < %s -march=x86 -mattr=+sse4.2 | FileCheck %s
; CHECK: padd
; CHECK: pand

; widen v8i8 to v16i8 (checks even power of 2 widening with add & and)
;
; The CHECK lines above require the llc output to contain "padd" and, after
; it, "pand".

; update(dst_i, src_i, n): unoptimized loop for i in [0, n).  Each iteration
; loads one <8 x i8> through %src_i, adds 1 to every lane, masks every lane
; with 4, and stores the result through %dst_i.
define void @update(i64* %dst_i, i64* %src_i, i32 %n) nounwind {
entry:
  ; Stack slots for the incoming arguments, the loop counter %i, and the
  ; per-iteration vector pointers %dst / %src.
  %dst_i.addr = alloca i64*
  %src_i.addr = alloca i64*
  %n.addr = alloca i32
  %i = alloca i32, align 4
  %dst = alloca <8 x i8>*, align 4
  %src = alloca <8 x i8>*, align 4
  ; Spill the arguments and start the counter at 0.
  store i64* %dst_i, i64** %dst_i.addr
  store i64* %src_i, i64** %src_i.addr
  store i32 %n, i32* %n.addr
  store i32 0, i32* %i
  br label %forcond

forcond:                                          ; preds = %forinc, %entry
  ; Continue while i < n (signed compare).
  %tmp = load i32, i32* %i
  %tmp1 = load i32, i32* %n.addr
  %cmp = icmp slt i32 %tmp, %tmp1
  br i1 %cmp, label %forbody, label %afterfor

forbody:                                          ; preds = %forcond
  ; dst = (<8 x i8>*) &dst_i[i]
  %tmp2 = load i32, i32* %i
  %tmp3 = load i64*, i64** %dst_i.addr
  %arrayidx = getelementptr i64, i64* %tmp3, i32 %tmp2
  %conv = bitcast i64* %arrayidx to <8 x i8>*
  store <8 x i8>* %conv, <8 x i8>** %dst
  ; src = (<8 x i8>*) &src_i[i]
  %tmp4 = load i32, i32* %i
  %tmp5 = load i64*, i64** %src_i.addr
  %arrayidx6 = getelementptr i64, i64* %tmp5, i32 %tmp4
  %conv7 = bitcast i64* %arrayidx6 to <8 x i8>*
  store <8 x i8>* %conv7, <8 x i8>** %src
  ; Address of dst[i]; note the pointer was already offset by i above, so the
  ; index is applied a second time here.
  %tmp8 = load i32, i32* %i
  %tmp9 = load <8 x i8>*, <8 x i8>** %dst
  %arrayidx10 = getelementptr <8 x i8>, <8 x i8>* %tmp9, i32 %tmp8
  ; Load src[i] (same double indexing as for dst).
  %tmp11 = load i32, i32* %i
  %tmp12 = load <8 x i8>*, <8 x i8>** %src
  %arrayidx13 = getelementptr <8 x i8>, <8 x i8>* %tmp12, i32 %tmp11
  %tmp14 = load <8 x i8>, <8 x i8>* %arrayidx13
  ; The <8 x i8> arithmetic under test: dst[i] = (src[i] + 1) & 4, lane-wise.
  %add = add <8 x i8> %tmp14, < i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1 >
  %and = and <8 x i8> %add, < i8 4, i8 4, i8 4, i8 4, i8 4, i8 4, i8 4, i8 4 >
  store <8 x i8> %and, <8 x i8>* %arrayidx10
  br label %forinc

forinc:                                           ; preds = %forbody
  ; i = i + 1
  %tmp15 = load i32, i32* %i
  %inc = add i32 %tmp15, 1
  store i32 %inc, i32* %i
  br label %forcond

afterfor:                                         ; preds = %forcond
  ret void
}