; xref: /aosp_15_r20/external/llvm/test/CodeGen/AMDGPU/schedule-vs-if-nested-loop.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
;RUN: llc < %s -march=r600 -mcpu=cayman -stress-sched -verify-misched
;REQUIRES: asserts

; @main - vertex-shader entry point (amdgpu_vs calling convention) used as the
; input for this scheduling test.
;
; Parameters:
;   %reg0 - <4 x float> inreg; not referenced anywhere in the body.
;   %reg1 - <4 x float> inreg; its four lanes are extracted as %0..%3.
;
; Shape of the function:
;   main_body  branches to LOOP when lane 0 of %reg1 is `ult` 0.0, otherwise
;              straight to ENDIF.
;   LOOP / ENDIF16 / ENDIF19 form one loop with two early exits to ENDIF.
;   ENDIF      is the only block that returns. It computes four
;              multiply-accumulate chains from values loaded out of address
;              space 9 and issues two @llvm.R600.store.swizzle calls.
;
; The instruction stream is intentionally kept verbatim (including the
; redundant bitcast round-trips and repeated loads): the test's RUN line hands
; exactly this IR to the scheduler, so "cleaning it up" would change what is
; being tested.
define amdgpu_vs void @main(<4 x float> inreg %reg0, <4 x float> inreg %reg1) {
main_body:
  ; Split %reg1 into scalar lanes.
  %0 = extractelement <4 x float> %reg1, i32 0
  %1 = extractelement <4 x float> %reg1, i32 1
  %2 = extractelement <4 x float> %reg1, i32 2
  %3 = extractelement <4 x float> %reg1, i32 3
  ; Condition idiom used three times in this function: compare, select
  ; 1.0/0.0, negate, convert to i32 (giving -1 or 0), round-trip through
  ; float via bitcast, then test the integer against zero.
  ; `ult` is an unordered predicate, so it is also true when %0 is NaN.
  %4 = fcmp ult float %0, 0.000000e+00
  %5 = select i1 %4, float 1.000000e+00, float 0.000000e+00
  %6 = fsub float -0.000000e+00, %5
  %7 = fptosi float %6 to i32
  %8 = bitcast i32 %7 to float
  %9 = bitcast float %8 to i32
  %10 = icmp ne i32 %9, 0
  br i1 %10, label %LOOP, label %ENDIF

ENDIF:                                            ; preds = %ENDIF16, %LOOP, %main_body
  ; Merge the four loop-carried values. When the loop was skipped they take
  ; the same initial constants the LOOP phis start from (0.0, 1.0, 0.0, 0.0).
  %temp.0 = phi float [ 0.000000e+00, %main_body ], [ %temp.1, %LOOP ], [ %temp.1, %ENDIF16 ]
  %temp1.0 = phi float [ 1.000000e+00, %main_body ], [ %temp1.1, %LOOP ], [ %temp1.1, %ENDIF16 ]
  %temp2.0 = phi float [ 0.000000e+00, %main_body ], [ %temp2.1, %LOOP ], [ %temp2.1, %ENDIF16 ]
  %temp3.0 = phi float [ 0.000000e+00, %main_body ], [ %temp3.1, %LOOP ], [ %temp3.1, %ENDIF16 ]
  ; Four accumulation chains, one per output lane j:
  ;   out[j] = v3[j]*%3 + (v2[j]*%2 + (v1[j]*%1 + v0[j]*%0))
  ; where vK is element K of a [1024 x <4 x float>] array at the null address
  ; of address space 9. Each use reloads the whole vector and takes one lane.
  ; NOTE(review): address space 9 is presumably an R600 constant buffer -
  ; confirm against the target's address-space numbering.
  ;
  ; Element 0 (v0), scaled by lane 0 of %reg1.
  %11 = load <4 x float>, <4 x float> addrspace(9)* null
  %12 = extractelement <4 x float> %11, i32 0
  %13 = fmul float %12, %0
  %14 = load <4 x float>, <4 x float> addrspace(9)* null
  %15 = extractelement <4 x float> %14, i32 1
  %16 = fmul float %15, %0
  %17 = load <4 x float>, <4 x float> addrspace(9)* null
  %18 = extractelement <4 x float> %17, i32 2
  %19 = fmul float %18, %0
  %20 = load <4 x float>, <4 x float> addrspace(9)* null
  %21 = extractelement <4 x float> %20, i32 3
  %22 = fmul float %21, %0
  ; Element 1 (v1), scaled by lane 1 and added to the v0 terms.
  %23 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 1)
  %24 = extractelement <4 x float> %23, i32 0
  %25 = fmul float %24, %1
  %26 = fadd float %25, %13
  %27 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 1)
  %28 = extractelement <4 x float> %27, i32 1
  %29 = fmul float %28, %1
  %30 = fadd float %29, %16
  %31 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 1)
  %32 = extractelement <4 x float> %31, i32 2
  %33 = fmul float %32, %1
  %34 = fadd float %33, %19
  %35 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 1)
  %36 = extractelement <4 x float> %35, i32 3
  %37 = fmul float %36, %1
  %38 = fadd float %37, %22
  ; Element 2 (v2), scaled by lane 2 and accumulated.
  %39 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 2)
  %40 = extractelement <4 x float> %39, i32 0
  %41 = fmul float %40, %2
  %42 = fadd float %41, %26
  %43 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 2)
  %44 = extractelement <4 x float> %43, i32 1
  %45 = fmul float %44, %2
  %46 = fadd float %45, %30
  %47 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 2)
  %48 = extractelement <4 x float> %47, i32 2
  %49 = fmul float %48, %2
  %50 = fadd float %49, %34
  %51 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 2)
  %52 = extractelement <4 x float> %51, i32 3
  %53 = fmul float %52, %2
  %54 = fadd float %53, %38
  ; Element 3 (v3), scaled by lane 3; %58/%62/%66/%70 are the final sums.
  %55 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 3)
  %56 = extractelement <4 x float> %55, i32 0
  %57 = fmul float %56, %3
  %58 = fadd float %57, %42
  %59 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 3)
  %60 = extractelement <4 x float> %59, i32 1
  %61 = fmul float %60, %3
  %62 = fadd float %61, %46
  %63 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 3)
  %64 = extractelement <4 x float> %63, i32 2
  %65 = fmul float %64, %3
  %66 = fadd float %65, %50
  %67 = load <4 x float>, <4 x float> addrspace(9)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(9)* null, i64 0, i32 3)
  %68 = extractelement <4 x float> %67, i32 3
  %69 = fmul float %68, %3
  %70 = fadd float %69, %54
  ; Pack the four sums into one vector and hand it to the store intrinsic.
  ; NOTE(review): the meaning of the i32 operands (60, 1) is defined by the
  ; intrinsic, not by anything visible in this file.
  %71 = insertelement <4 x float> undef, float %58, i32 0
  %72 = insertelement <4 x float> %71, float %62, i32 1
  %73 = insertelement <4 x float> %72, float %66, i32 2
  %74 = insertelement <4 x float> %73, float %70, i32 3
  call void @llvm.R600.store.swizzle(<4 x float> %74, i32 60, i32 1)
  ; Second store: the merged loop-carried values, with operands (0, 2).
  %75 = insertelement <4 x float> undef, float %temp.0, i32 0
  %76 = insertelement <4 x float> %75, float %temp1.0, i32 1
  %77 = insertelement <4 x float> %76, float %temp2.0, i32 2
  %78 = insertelement <4 x float> %77, float %temp3.0, i32 3
  call void @llvm.R600.store.swizzle(<4 x float> %78, i32 0, i32 2)
  ret void

LOOP:                                             ; preds = %main_body, %ENDIF19
  ; Loop header. %temp.1..%temp3.1 are the carried accumulators; %temp4.0 is
  ; the loop counter, starting at -2.0 and stepped by 1.0 in ENDIF19.
  %temp.1 = phi float [ %93, %ENDIF19 ], [ 0.000000e+00, %main_body ]
  %temp1.1 = phi float [ %94, %ENDIF19 ], [ 1.000000e+00, %main_body ]
  %temp2.1 = phi float [ %95, %ENDIF19 ], [ 0.000000e+00, %main_body ]
  %temp3.1 = phi float [ %96, %ENDIF19 ], [ 0.000000e+00, %main_body ]
  %temp4.0 = phi float [ %97, %ENDIF19 ], [ -2.000000e+00, %main_body ]
  ; First exit: leave for ENDIF once the counter is `uge` lane 0 of %reg1
  ; (unordered predicate, so a NaN operand also exits).
  %79 = fcmp uge float %temp4.0, %0
  %80 = select i1 %79, float 1.000000e+00, float 0.000000e+00
  %81 = fsub float -0.000000e+00, %80
  %82 = fptosi float %81 to i32
  %83 = bitcast i32 %82 to float
  %84 = bitcast float %83 to i32
  %85 = icmp ne i32 %84, 0
  br i1 %85, label %ENDIF, label %ENDIF16

ENDIF16:                                          ; preds = %LOOP
  ; Second exit: leave for ENDIF when lane 2 of %reg1 is `une` the counter;
  ; only when they compare equal does the loop continue into ENDIF19.
  %86 = fcmp une float %2, %temp4.0
  %87 = select i1 %86, float 1.000000e+00, float 0.000000e+00
  %88 = fsub float -0.000000e+00, %87
  %89 = fptosi float %88 to i32
  %90 = bitcast i32 %89 to float
  %91 = bitcast float %90 to i32
  %92 = icmp ne i32 %91, 0
  br i1 %92, label %ENDIF, label %ENDIF19

ENDIF19:                                          ; preds = %ENDIF16
  ; Loop latch: bump %temp.1 and the counter by 1.0; the other three carried
  ; values are "updated" by adding 0.0 and then fed back to the LOOP phis.
  %93 = fadd float %temp.1, 1.000000e+00
  %94 = fadd float %temp1.1, 0.000000e+00
  %95 = fadd float %temp2.1, 0.000000e+00
  %96 = fadd float %temp3.1, 0.000000e+00
  %97 = fadd float %temp4.0, 1.000000e+00
  br label %LOOP
}

; External declaration of the store intrinsic that @main calls twice with a
; <4 x float> payload followed by two i32 immediates.
; NOTE(review): the meaning of the two i32 operands is defined by the R600
; backend and is not visible in this file - confirm there before changing them.
declare void @llvm.R600.store.swizzle(<4 x float>, i32, i32)