1*9880d681SAndroid Build Coastguard Worker; NOTE: Assertions have been autogenerated by utils/update_test_checks.py 2*9880d681SAndroid Build Coastguard Worker; RUN: opt < %s -instsimplify -S | FileCheck %s 3*9880d681SAndroid Build Coastguard Worker 4*9880d681SAndroid Build Coastguard Worker; If any bits of the shift amount are known to make it exceed or equal 5*9880d681SAndroid Build Coastguard Worker; the number of bits in the type, the shift causes undefined behavior. 6*9880d681SAndroid Build Coastguard Worker 7*9880d681SAndroid Build Coastguard Workerdefine i32 @shl_amount_is_known_bogus(i32 %a, i32 %b) { 8*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @shl_amount_is_known_bogus( 9*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret i32 undef 10*9880d681SAndroid Build Coastguard Worker; 11*9880d681SAndroid Build Coastguard Worker %or = or i32 %b, 32 12*9880d681SAndroid Build Coastguard Worker %shl = shl i32 %a, %or 13*9880d681SAndroid Build Coastguard Worker ret i32 %shl 14*9880d681SAndroid Build Coastguard Worker} 15*9880d681SAndroid Build Coastguard Worker 16*9880d681SAndroid Build Coastguard Worker; Check some weird types and the other shift ops. 17*9880d681SAndroid Build Coastguard Worker 18*9880d681SAndroid Build Coastguard Workerdefine i31 @lshr_amount_is_known_bogus(i31 %a, i31 %b) { 19*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @lshr_amount_is_known_bogus( 20*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret i31 undef 21*9880d681SAndroid Build Coastguard Worker; 22*9880d681SAndroid Build Coastguard Worker %or = or i31 %b, 31 23*9880d681SAndroid Build Coastguard Worker %shr = lshr i31 %a, %or 24*9880d681SAndroid Build Coastguard Worker ret i31 %shr 25*9880d681SAndroid Build Coastguard Worker} 26*9880d681SAndroid Build Coastguard Worker 27*9880d681SAndroid Build Coastguard Workerdefine i33 @ashr_amount_is_known_bogus(i33 %a, i33 %b) { 28*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @ashr_amount_is_known_bogus( 29*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret i33 undef 30*9880d681SAndroid Build Coastguard Worker; 31*9880d681SAndroid Build Coastguard Worker %or = or i33 %b, 33 32*9880d681SAndroid Build Coastguard Worker %shr = ashr i33 %a, %or 33*9880d681SAndroid Build Coastguard Worker ret i33 %shr 34*9880d681SAndroid Build Coastguard Worker} 35*9880d681SAndroid Build Coastguard Worker 36*9880d681SAndroid Build Coastguard Worker 37*9880d681SAndroid Build Coastguard Worker; If all valid bits of the shift amount are known 0, there's no shift. 38*9880d681SAndroid Build Coastguard Worker; It doesn't matter if high bits are set because that would be undefined. 39*9880d681SAndroid Build Coastguard Worker; Therefore, the only possible valid result of these shifts is %a. 40*9880d681SAndroid Build Coastguard Worker 41*9880d681SAndroid Build Coastguard Workerdefine i16 @ashr_amount_is_zero(i16 %a, i16 %b) { 42*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @ashr_amount_is_zero( 43*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret i16 %a 44*9880d681SAndroid Build Coastguard Worker; 45*9880d681SAndroid Build Coastguard Worker %and = and i16 %b, 65520 ; 0xfff0 46*9880d681SAndroid Build Coastguard Worker %shr = ashr i16 %a, %and 47*9880d681SAndroid Build Coastguard Worker ret i16 %shr 48*9880d681SAndroid Build Coastguard Worker} 49*9880d681SAndroid Build Coastguard Worker 50*9880d681SAndroid Build Coastguard Workerdefine i300 @lshr_amount_is_zero(i300 %a, i300 %b) { 51*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @lshr_amount_is_zero( 52*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret i300 %a 53*9880d681SAndroid Build Coastguard Worker; 54*9880d681SAndroid Build Coastguard Worker %and = and i300 %b, 2048 55*9880d681SAndroid Build Coastguard Worker %shr = lshr i300 %a, %and 56*9880d681SAndroid Build Coastguard Worker ret i300 %shr 57*9880d681SAndroid Build Coastguard Worker} 58*9880d681SAndroid Build Coastguard Worker 59*9880d681SAndroid Build Coastguard Workerdefine i9 @shl_amount_is_zero(i9 %a, i9 %b) { 60*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @shl_amount_is_zero( 61*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret i9 %a 62*9880d681SAndroid Build Coastguard Worker; 63*9880d681SAndroid Build Coastguard Worker %and = and i9 %b, 496 ; 0x1f0 64*9880d681SAndroid Build Coastguard Worker %shl = shl i9 %a, %and 65*9880d681SAndroid Build Coastguard Worker ret i9 %shl 66*9880d681SAndroid Build Coastguard Worker} 67*9880d681SAndroid Build Coastguard Worker 68*9880d681SAndroid Build Coastguard Worker 69*9880d681SAndroid Build Coastguard Worker; Verify that we've calculated the log2 boundary of valid bits correctly for a weird type. 70*9880d681SAndroid Build Coastguard Worker 71*9880d681SAndroid Build Coastguard Workerdefine i9 @shl_amount_is_not_known_zero(i9 %a, i9 %b) { 72*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @shl_amount_is_not_known_zero( 73*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: [[AND:%.*]] = and i9 %b, -8 74*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: [[SHL:%.*]] = shl i9 %a, [[AND]] 75*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret i9 [[SHL]] 76*9880d681SAndroid Build Coastguard Worker; 77*9880d681SAndroid Build Coastguard Worker %and = and i9 %b, 504 ; 0x1f8 78*9880d681SAndroid Build Coastguard Worker %shl = shl i9 %a, %and 79*9880d681SAndroid Build Coastguard Worker ret i9 %shl 80*9880d681SAndroid Build Coastguard Worker} 81*9880d681SAndroid Build Coastguard Worker 82*9880d681SAndroid Build Coastguard Worker 83*9880d681SAndroid Build Coastguard Worker; For vectors, we need all scalar elements to meet the requirements to optimize. 84*9880d681SAndroid Build Coastguard Worker 85*9880d681SAndroid Build Coastguard Workerdefine <2 x i32> @ashr_vector_bogus(<2 x i32> %a, <2 x i32> %b) { 86*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @ashr_vector_bogus( 87*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret <2 x i32> undef 88*9880d681SAndroid Build Coastguard Worker; 89*9880d681SAndroid Build Coastguard Worker %or = or <2 x i32> %b, <i32 32, i32 32> 90*9880d681SAndroid Build Coastguard Worker %shr = ashr <2 x i32> %a, %or 91*9880d681SAndroid Build Coastguard Worker ret <2 x i32> %shr 92*9880d681SAndroid Build Coastguard Worker} 93*9880d681SAndroid Build Coastguard Worker 94*9880d681SAndroid Build Coastguard Worker; FIXME: This is undef, but computeKnownBits doesn't handle the union. 95*9880d681SAndroid Build Coastguard Workerdefine <2 x i32> @shl_vector_bogus(<2 x i32> %a, <2 x i32> %b) { 96*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @shl_vector_bogus( 97*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: [[OR:%.*]] = or <2 x i32> %b, <i32 32, i32 64> 98*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: [[SHL:%.*]] = shl <2 x i32> %a, [[OR]] 99*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret <2 x i32> [[SHL]] 100*9880d681SAndroid Build Coastguard Worker; 101*9880d681SAndroid Build Coastguard Worker %or = or <2 x i32> %b, <i32 32, i32 64> 102*9880d681SAndroid Build Coastguard Worker %shl = shl <2 x i32> %a, %or 103*9880d681SAndroid Build Coastguard Worker ret <2 x i32> %shl 104*9880d681SAndroid Build Coastguard Worker} 105*9880d681SAndroid Build Coastguard Worker 106*9880d681SAndroid Build Coastguard Workerdefine <2 x i32> @lshr_vector_zero(<2 x i32> %a, <2 x i32> %b) { 107*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @lshr_vector_zero( 108*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret <2 x i32> %a 109*9880d681SAndroid Build Coastguard Worker; 110*9880d681SAndroid Build Coastguard Worker %and = and <2 x i32> %b, <i32 64, i32 256> 111*9880d681SAndroid Build Coastguard Worker %shr = lshr <2 x i32> %a, %and 112*9880d681SAndroid Build Coastguard Worker ret <2 x i32> %shr 113*9880d681SAndroid Build Coastguard Worker} 114*9880d681SAndroid Build Coastguard Worker 115*9880d681SAndroid Build Coastguard Worker; Make sure that weird vector types work too. 116*9880d681SAndroid Build Coastguard Workerdefine <2 x i15> @shl_vector_zero(<2 x i15> %a, <2 x i15> %b) { 117*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @shl_vector_zero( 118*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret <2 x i15> %a 119*9880d681SAndroid Build Coastguard Worker; 120*9880d681SAndroid Build Coastguard Worker %and = and <2 x i15> %b, <i15 1024, i15 1024> 121*9880d681SAndroid Build Coastguard Worker %shl = shl <2 x i15> %a, %and 122*9880d681SAndroid Build Coastguard Worker ret <2 x i15> %shl 123*9880d681SAndroid Build Coastguard Worker} 124*9880d681SAndroid Build Coastguard Worker 125*9880d681SAndroid Build Coastguard Workerdefine <2 x i32> @shl_vector_for_real(<2 x i32> %a, <2 x i32> %b) { 126*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @shl_vector_for_real( 127*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: [[AND:%.*]] = and <2 x i32> %b, <i32 3, i32 3> 128*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: [[SHL:%.*]] = shl <2 x i32> %a, [[AND]] 129*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret <2 x i32> [[SHL]] 130*9880d681SAndroid Build Coastguard Worker; 131*9880d681SAndroid Build Coastguard Worker %and = and <2 x i32> %b, <i32 3, i32 3> ; a necessary mask op 132*9880d681SAndroid Build Coastguard Worker %shl = shl <2 x i32> %a, %and 133*9880d681SAndroid Build Coastguard Worker ret <2 x i32> %shl 134*9880d681SAndroid Build Coastguard Worker} 135*9880d681SAndroid Build Coastguard Worker 136*9880d681SAndroid Build Coastguard Worker 137*9880d681SAndroid Build Coastguard Worker; We calculate the valid bits of the shift using log2, and log2 of 1 (the type width) is 0. 138*9880d681SAndroid Build Coastguard Worker; That should be ok. Either the shift amount is 0 or invalid (1), so we can always return %a. 139*9880d681SAndroid Build Coastguard Worker 140*9880d681SAndroid Build Coastguard Workerdefine i1 @shl_i1(i1 %a, i1 %b) { 141*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: @shl_i1( 142*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: ret i1 %a 143*9880d681SAndroid Build Coastguard Worker; 144*9880d681SAndroid Build Coastguard Worker %shl = shl i1 %a, %b 145*9880d681SAndroid Build Coastguard Worker ret i1 %shl 146*9880d681SAndroid Build Coastguard Worker} 147*9880d681SAndroid Build Coastguard Worker 148