; RUN: llc -mtriple=arm-eabi %s -o - | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-LE
; RUN: llc -mtriple=armv7-eabi %s -o - | FileCheck %s --check-prefix=CHECK-V7-LE
; RUN: llc -mtriple=armeb-eabi %s -o - | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-BE
; RUN: llc -mtriple=armebv7-eabi %s -o - | FileCheck %s --check-prefix=CHECK-V7-BE
; Check generated signed and unsigned multiply accumulate long.

; Unsigned case: zext(%a) * zext(%b) added to a 64-bit accumulator %c.
; Expected to select the unsigned multiply-accumulate-long instruction.
define i64 @MACLongTest1(i32 %a, i32 %b, i64 %c) {
;CHECK-LABEL: MACLongTest1:
;CHECK: umlal
  %conv = zext i32 %a to i64
  %conv1 = zext i32 %b to i64
  %mul = mul i64 %conv1, %conv
  %add = add i64 %mul, %c
  ret i64 %add
}

; Signed case: sext(%a) * sext(%b) added to a 64-bit accumulator %c.
; Expected to select the signed multiply-accumulate-long instruction.
define i64 @MACLongTest2(i32 %a, i32 %b, i64 %c) {
;CHECK-LABEL: MACLongTest2:
;CHECK: smlal
  %conv = sext i32 %a to i64
  %conv1 = sext i32 %b to i64
  %mul = mul nsw i64 %conv1, %conv
  %add = add nsw i64 %mul, %c
  ret i64 %add
}

; Unsigned case where the accumulator %c is only 32 bits wide and is
; zero-extended before the 64-bit add.
define i64 @MACLongTest3(i32 %a, i32 %b, i32 %c) {
;CHECK-LABEL: MACLongTest3:
;CHECK: umlal
  %conv = zext i32 %b to i64
  %conv1 = zext i32 %a to i64
  %mul = mul i64 %conv, %conv1
  %conv2 = zext i32 %c to i64
  %add = add i64 %mul, %conv2
  ret i64 %add
}

; Signed case where the accumulator %c is only 32 bits wide and is
; sign-extended before the 64-bit add.
define i64 @MACLongTest4(i32 %a, i32 %b, i32 %c) {
;CHECK-LABEL: MACLongTest4:
;CHECK: smlal
  %conv = sext i32 %b to i64
  %conv1 = sext i32 %a to i64
  %mul = mul nsw i64 %conv, %conv1
  %conv2 = sext i32 %c to i64
  %add = add nsw i64 %mul, %conv2
  ret i64 %add
}

; Two things to check here: the @earlyclobber constraint (on <= v5) and the "$Rd = $R" ones.
;    + Without @earlyclobber the v7 code is natural. With it, the first two
;      registers must be distinct from the third.
;    + Without "$Rd = $R", this can be satisfied without a mov before the umlal
;      by trying to use 6 different registers in the MachineInstr. The natural
;      evolution of this attempt currently leaves only two movs in the final
;      function, both after the umlal. With it, *some* move has to happen
;      before the umlal.
define i64 @MACLongTest5(i64 %c, i32 %a, i32 %b) {
; The v7 expectations below match an instruction, not a symbol, so they are
; ordinary checks anchored by the function label that precedes them.
; CHECK-V7-LE-LABEL: MACLongTest5:
; CHECK-V7-LE: umlal r0, r1, r0, r0
; CHECK-V7-BE-LABEL: MACLongTest5:
; CHECK-V7-BE: umlal r1, r0, r1, r1

; CHECK-LABEL: MACLongTest5:
; CHECK-LE: mov [[RDLO:r[0-9]+]], r0
; CHECK-LE: umlal [[RDLO]], r1, r0, r0
; CHECK-LE: mov r0, [[RDLO]]
; CHECK-BE: mov [[RDLO:r[0-9]+]], r1
; CHECK-BE: umlal [[RDLO]], r0, r1, r1
; CHECK-BE: mov r1, [[RDLO]]

; The low word of %c is squared (%conv * %conv), which is why the expected
; umlal names the same register for both multiplicands. %conv1 is not
; referenced by any later instruction.
  %conv.trunc = trunc i64 %c to i32
  %conv = zext i32 %conv.trunc to i64
  %conv1 = zext i32 %b to i64
  %mul = mul i64 %conv, %conv
  %add = add i64 %mul, %c
  ret i64 %add
}

; Sum of two signed widening products: the first product is expected as a
; plain smull and the second folded into it with smlal.
define i64 @MACLongTest6(i32 %a, i32 %b, i32 %c, i32 %d) {
;CHECK-LABEL: MACLongTest6:
;CHECK: smull   r12, lr, r1, r0
;CHECK: smlal   r12, lr, r3, r2
  %conv = sext i32 %a to i64
  %conv1 = sext i32 %b to i64
  %mul = mul nsw i64 %conv1, %conv
  %conv2 = sext i32 %c to i64
  %conv3 = sext i32 %d to i64
  %mul4 = mul nsw i64 %conv3, %conv2
  %add = add nsw i64 %mul4, %mul
  ret i64 %add
}

; Negative test: the two 32-bit halves of the signed product are swapped
; (shl 32 | lshr 32) before the accumulate, so smlal must not be selected.
define i64 @MACLongTest7(i64 %acc, i32 %lhs, i32 %rhs) {
;CHECK-LABEL: MACLongTest7:
;CHECK-NOT: smlal
  %conv = sext i32 %lhs to i64
  %conv1 = sext i32 %rhs to i64
  %mul = mul nsw i64 %conv1, %conv
  %shl = shl i64 %mul, 32
  %shr = lshr i64 %mul, 32
  %or = or i64 %shl, %shr
  %add = add i64 %or, %acc
  ret i64 %add
}

; Negative test: the low half of the unsigned product is placed in both
; halves of the addend (and 0xffffffff | shl 32), so no multiply-accumulate
; long may be selected. The operands are zero-extended, so the unsigned
; mnemonic is rejected in addition to the signed one.
define i64 @MACLongTest8(i64 %acc, i32 %lhs, i32 %rhs) {
;CHECK-LABEL: MACLongTest8:
;CHECK-NOT: smlal
;CHECK-NOT: umlal
  %conv = zext i32 %lhs to i64
  %conv1 = zext i32 %rhs to i64
  %mul = mul nuw i64 %conv1, %conv
  %and = and i64 %mul, 4294967295
  %shl = shl i64 %mul, 32
  %or = or i64 %and, %shl
  %add = add i64 %or, %acc
  ret i64 %add
}

; Unsigned product plus two zero-extended 32-bit addends, accumulated one
; after the other. The v7 runs expect umaal inside this function; the
; pre-v7 runs expect it to be absent.
define i64 @MACLongTest9(i32 %lhs, i32 %rhs, i32 %lo, i32 %hi) {
;CHECK-LABEL: MACLongTest9:
;CHECK-V7-LE-LABEL: MACLongTest9:
;CHECK-V7-BE-LABEL: MACLongTest9:
;CHECK-V7-LE:umaal
;CHECK-V7-BE:umaal
;CHECK-NOT:umaal
  %conv = zext i32 %lhs to i64
  %conv1 = zext i32 %rhs to i64
  %mul = mul nuw i64 %conv1, %conv
  %conv2 = zext i32 %lo to i64
  %add = add i64 %mul, %conv2
  %conv3 = zext i32 %hi to i64
  %add2 = add i64 %add, %conv3
  ret i64 %add2
}

; Same operands as MACLongTest9, but the two 32-bit addends are summed first
; and the product is added last.
define i64 @MACLongTest10(i32 %lhs, i32 %rhs, i32 %lo, i32 %hi) {
;CHECK-LABEL: MACLongTest10:
;CHECK-V7-LE-LABEL: MACLongTest10:
;CHECK-V7-BE-LABEL: MACLongTest10:
;CHECK-V7-LE:umaal
;CHECK-V7-BE:umaal
;CHECK-NOT:umaal
  %conv = zext i32 %lhs to i64
  %conv1 = zext i32 %rhs to i64
  %mul = mul nuw i64 %conv1, %conv
  %conv2 = zext i32 %lo to i64
  %conv3 = zext i32 %hi to i64
  %add = add i64 %conv2, %conv3
  %add2 = add i64 %add, %mul
  ret i64 %add2
}