; RUN: llc -march=amdgcn -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s

; Byte-swap (llvm.bswap) code generation test for amdgcn.
; Both llc invocations above (-mcpu=SI and -mcpu=tonga) are checked with the
; same pair of prefixes, so every pattern below applies to both targets.

declare i32 @llvm.bswap.i32(i32) nounwind readnone
declare <2 x i32> @llvm.bswap.v2i32(<2 x i32>) nounwind readnone
declare <4 x i32> @llvm.bswap.v4i32(<4 x i32>) nounwind readnone
declare <8 x i32> @llvm.bswap.v8i32(<8 x i32>) nounwind readnone
declare i64 @llvm.bswap.i64(i64) nounwind readnone
declare <2 x i64> @llvm.bswap.v2i64(<2 x i64>) nounwind readnone
declare <4 x i64> @llvm.bswap.v4i64(<4 x i64>) nounwind readnone

; Scalar i32 case. The checks expect two v_alignbit_b32 of the loaded value
; with itself (amounts 8 and 24), combined by a v_bfi_b32 whose mask operand
; is the constant 0xff00ff, and the combined value being stored.
; FUNC-LABEL: @test_bswap_i32
; SI: buffer_load_dword [[VAL:v[0-9]+]]
; SI-DAG: v_alignbit_b32 [[TMP0:v[0-9]+]], [[VAL]], [[VAL]], 8
; SI-DAG: v_alignbit_b32 [[TMP1:v[0-9]+]], [[VAL]], [[VAL]], 24
; SI-DAG: s_mov_b32 [[K:s[0-9]+]], 0xff00ff
; SI: v_bfi_b32 [[RESULT:v[0-9]+]], [[K]], [[TMP1]], [[TMP0]]
; SI: buffer_store_dword [[RESULT]]
; SI: s_endpgm
define void @test_bswap_i32(i32 addrspace(1)* %out, i32 addrspace(1)* %in) nounwind {
  %val = load i32, i32 addrspace(1)* %in, align 4
  %bswap = call i32 @llvm.bswap.i32(i32 %val) nounwind readnone
  store i32 %bswap, i32 addrspace(1)* %out, align 4
  ret void
}

; <2 x i32> case. Two alignbit/alignbit/bfi groups are expected; the -DAG
; directives leave the relative order of those instructions unconstrained.
; FUNC-LABEL: @test_bswap_v2i32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI: s_endpgm
define void @test_bswap_v2i32(<2 x i32> addrspace(1)* %out, <2 x i32> addrspace(1)* %in) nounwind {
  %val = load <2 x i32>, <2 x i32> addrspace(1)* %in, align 8
  %bswap = call <2 x i32> @llvm.bswap.v2i32(<2 x i32> %val) nounwind readnone
  store <2 x i32> %bswap, <2 x i32> addrspace(1)* %out, align 8
  ret void
}

; <4 x i32> case. Four alignbit/alignbit/bfi groups are expected, in any order.
; FUNC-LABEL: @test_bswap_v4i32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI: s_endpgm
define void @test_bswap_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in) nounwind {
  %val = load <4 x i32>, <4 x i32> addrspace(1)* %in, align 16
  %bswap = call <4 x i32> @llvm.bswap.v4i32(<4 x i32> %val) nounwind readnone
  store <4 x i32> %bswap, <4 x i32> addrspace(1)* %out, align 16
  ret void
}

; <8 x i32> case. Eight alignbit/alignbit/bfi groups are expected, in any order.
; FUNC-LABEL: @test_bswap_v8i32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_alignbit_b32
; SI-DAG: v_bfi_b32
; SI: s_endpgm
define void @test_bswap_v8i32(<8 x i32> addrspace(1)* %out, <8 x i32> addrspace(1)* %in) nounwind {
  %val = load <8 x i32>, <8 x i32> addrspace(1)* %in, align 32
  %bswap = call <8 x i32> @llvm.bswap.v8i32(<8 x i32> %val) nounwind readnone
  store <8 x i32> %bswap, <8 x i32> addrspace(1)* %out, align 32
  ret void
}

; The 64-bit variants below carry no check directives. They are only run
; through llc (with -verify-machineinstrs, per the invocations at the top),
; so the instruction sequence produced for them is not pinned by this file.
define void @test_bswap_i64(i64 addrspace(1)* %out, i64 addrspace(1)* %in) nounwind {
  %val = load i64, i64 addrspace(1)* %in, align 8
  %bswap = call i64 @llvm.bswap.i64(i64 %val) nounwind readnone
  store i64 %bswap, i64 addrspace(1)* %out, align 8
  ret void
}

define void @test_bswap_v2i64(<2 x i64> addrspace(1)* %out, <2 x i64> addrspace(1)* %in) nounwind {
  %val = load <2 x i64>, <2 x i64> addrspace(1)* %in, align 16
  %bswap = call <2 x i64> @llvm.bswap.v2i64(<2 x i64> %val) nounwind readnone
  store <2 x i64> %bswap, <2 x i64> addrspace(1)* %out, align 16
  ret void
}

define void @test_bswap_v4i64(<4 x i64> addrspace(1)* %out, <4 x i64> addrspace(1)* %in) nounwind {
  %val = load <4 x i64>, <4 x i64> addrspace(1)* %in, align 32
  %bswap = call <4 x i64> @llvm.bswap.v4i64(<4 x i64> %val) nounwind readnone
  store <4 x i64> %bswap, <4 x i64> addrspace(1)* %out, align 32
  ret void
}