xref: /aosp_15_r20/external/clang/test/CodeGenCUDA/printf.cu (revision 67e74705e28f6214e480b399dd47ea732279e315)
1*67e74705SXin Li // REQUIRES: x86-registered-target
2*67e74705SXin Li // REQUIRES: nvptx-registered-target
3*67e74705SXin Li 
4*67e74705SXin Li // RUN: %clang_cc1 -triple nvptx64-nvidia-cuda -fcuda-is-device -emit-llvm \
5*67e74705SXin Li // RUN:   -o - %s | FileCheck %s
6*67e74705SXin Li 
7*67e74705SXin Li #include "Inputs/cuda.h"
8*67e74705SXin Li 
// Device-side vprintf, declared with C linkage so that its symbol is the
// unmangled @vprintf that the directives in this file match. It takes two
// pointers; the directives below expect every printf call in this file to be
// emitted as `call i32 @vprintf(i8* <format>, i8* <argument buffer or null>)`.
9*67e74705SXin Li extern "C" __device__ int vprintf(const char*, const char*);
10*67e74705SXin Li 
11*67e74705SXin Li // Check a simple call to printf end-to-end.
12*67e74705SXin Li // CHECK: [[SIMPLE_PRINTF_TY:%[a-zA-Z0-9_]+]] = type { i32, i64, double }
// Exercises a printf call with a format string and three variadic arguments
// (an int, a long long and a double) and returns printf's result.
//
// The directives in the body expect, in this order in the emitted IR:
//   1. an alloca of the { i32, i64, double } struct type captured just above;
//   2. a load of the local `fmt`;
//   3. one getelementptr + store per argument into fields 0, 1 and 2;
//   4. a bitcast of the buffer to i8*;
//   5. a call to vprintf with the loaded format and the cast buffer;
//   6. a return of that call's i32 result.
CheckSimple()13*67e74705SXin Li __device__ int CheckSimple() {
14*67e74705SXin Li   // CHECK: [[BUF:%[a-zA-Z0-9_]+]] = alloca [[SIMPLE_PRINTF_TY]]
15*67e74705SXin Li   // CHECK: [[FMT:%[0-9]+]] = load{{.*}}%fmt
  // The format string lives in a local named `fmt` because the directive
  // above matches a load from a value whose name contains %fmt; do not rename.
16*67e74705SXin Li   const char* fmt = "%d %lld %f";
17*67e74705SXin Li   // CHECK: [[PTR0:%[0-9]+]] = getelementptr inbounds [[SIMPLE_PRINTF_TY]], [[SIMPLE_PRINTF_TY]]* [[BUF]], i32 0, i32 0
18*67e74705SXin Li   // CHECK: store i32 1, i32* [[PTR0]], align 4
19*67e74705SXin Li   // CHECK: [[PTR1:%[0-9]+]] = getelementptr inbounds [[SIMPLE_PRINTF_TY]], [[SIMPLE_PRINTF_TY]]* [[BUF]], i32 0, i32 1
20*67e74705SXin Li   // CHECK: store i64 2, i64* [[PTR1]], align 8
21*67e74705SXin Li   // CHECK: [[PTR2:%[0-9]+]] = getelementptr inbounds [[SIMPLE_PRINTF_TY]], [[SIMPLE_PRINTF_TY]]* [[BUF]], i32 0, i32 2
22*67e74705SXin Li   // CHECK: store double 3.0{{[^,]*}}, double* [[PTR2]], align 8
23*67e74705SXin Li   // CHECK: [[BUF_CAST:%[0-9]+]] = bitcast [[SIMPLE_PRINTF_TY]]* [[BUF]] to i8*
24*67e74705SXin Li   // CHECK: [[RET:%[0-9]+]] = call i32 @vprintf(i8* [[FMT]], i8* [[BUF_CAST]])
25*67e74705SXin Li   // CHECK: ret i32 [[RET]]
  // The literals 1, 2ll and 3.0 are what the store directives above match as
  // `i32 1`, `i64 2` and `double 3.0...`; changing a literal's value or type
  // suffix would break those matches.
26*67e74705SXin Li   return printf(fmt, 1, 2ll, 3.0);
27*67e74705SXin Li }
28*67e74705SXin Li 
// Exercises a printf call that has a format string but no variadic arguments.
// The directive in the body expects the emitted vprintf call to receive a null
// i8* as its second operand, and ({{$}}) nothing after the closing parenthesis
// on that IR line.
CheckNoArgs()29*67e74705SXin Li __device__ void CheckNoArgs() {
30*67e74705SXin Li   // CHECK: call i32 @vprintf({{.*}}, i8* null){{$}}
31*67e74705SXin Li   printf("hello, world!");
32*67e74705SXin Li }
33*67e74705SXin Li 
34*67e74705SXin Li // Check that printf's alloca happens in the entry block, not inside the if
35*67e74705SXin Li // statement.
// Declared but not defined in this file; it only supplies a condition for the
// `if` below, and its mangled name @_Z3foov is what the second directive in
// CheckAllocaIsInEntryBlock matches.
36*67e74705SXin Li __device__ bool foo();
// Calls printf only inside the `if (foo())` branch. The two directives in the
// body are matched in order, so they require the alloca of %printf_args to
// appear in the emitted IR before the call to foo, even though the printf in
// the source comes after that call.
CheckAllocaIsInEntryBlock()37*67e74705SXin Li __device__ void CheckAllocaIsInEntryBlock() {
38*67e74705SXin Li   // CHECK: alloca %printf_args
39*67e74705SXin Li   // CHECK: call {{.*}} @_Z3foov()
40*67e74705SXin Li   if (foo()) {
    // A single int argument is enough to force an argument buffer to exist.
41*67e74705SXin Li     printf("%d", 42);
42*67e74705SXin Li   }
43*67e74705SXin Li }
44