blob: 6c80055ef467305019e65e57cf35104b1f20048c [file] [log] [blame] [edit]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc < %s -march=nvptx64 -mcpu=sm_90 | FileCheck %s
; RUN: %if ptxas %{ llc < %s -march=nvptx64 -mcpu=sm_90 | %ptxas-verify -arch=sm_90 %}
%struct.64 = type <{ i64 }>
declare i64 @callee(ptr %p);
declare i64 @callee_variadic(ptr %p, ...);
define %struct.64 @test_return_type_mismatch(ptr %p) {
; CHECK-LABEL: test_return_type_mismatch(
; CHECK: {
; CHECK-NEXT: .reg .b64 %rd<32>;
; CHECK-EMPTY:
; CHECK-NEXT: // %bb.0:
; CHECK-NEXT: ld.param.b64 %rd1, [test_return_type_mismatch_param_0];
; CHECK-NEXT: { // callseq 0, 0
; CHECK-NEXT: .param .b64 param0;
; CHECK-NEXT: .param .align 1 .b8 retval0[8];
; CHECK-NEXT: st.param.b64 [param0], %rd1;
; CHECK-NEXT: prototype_0 : .callprototype (.param .align 1 .b8 _[8]) _ (.param .b64 _);
; CHECK-NEXT: mov.b64 %rd2, callee;
; CHECK-NEXT: call (retval0), %rd2, (param0), prototype_0;
; CHECK-NEXT: ld.param.b8 %rd3, [retval0+7];
; CHECK-NEXT: ld.param.b8 %rd4, [retval0+6];
; CHECK-NEXT: ld.param.b8 %rd5, [retval0+5];
; CHECK-NEXT: ld.param.b8 %rd6, [retval0+4];
; CHECK-NEXT: ld.param.b8 %rd7, [retval0+3];
; CHECK-NEXT: ld.param.b8 %rd8, [retval0+2];
; CHECK-NEXT: ld.param.b8 %rd9, [retval0+1];
; CHECK-NEXT: ld.param.b8 %rd10, [retval0];
; CHECK-NEXT: } // callseq 0
; CHECK-NEXT: shl.b64 %rd11, %rd9, 8;
; CHECK-NEXT: or.b64 %rd12, %rd11, %rd10;
; CHECK-NEXT: shl.b64 %rd13, %rd8, 16;
; CHECK-NEXT: shl.b64 %rd14, %rd7, 24;
; CHECK-NEXT: or.b64 %rd15, %rd14, %rd13;
; CHECK-NEXT: or.b64 %rd16, %rd15, %rd12;
; CHECK-NEXT: shl.b64 %rd17, %rd5, 8;
; CHECK-NEXT: or.b64 %rd18, %rd17, %rd6;
; CHECK-NEXT: shl.b64 %rd19, %rd4, 16;
; CHECK-NEXT: shl.b64 %rd20, %rd3, 24;
; CHECK-NEXT: or.b64 %rd21, %rd20, %rd19;
; CHECK-NEXT: or.b64 %rd22, %rd21, %rd18;
; CHECK-NEXT: shl.b64 %rd23, %rd22, 32;
; CHECK-NEXT: or.b64 %rd24, %rd23, %rd16;
; CHECK-NEXT: st.param.b8 [func_retval0], %rd10;
; CHECK-NEXT: shr.u64 %rd25, %rd24, 56;
; CHECK-NEXT: st.param.b8 [func_retval0+7], %rd25;
; CHECK-NEXT: shr.u64 %rd26, %rd24, 48;
; CHECK-NEXT: st.param.b8 [func_retval0+6], %rd26;
; CHECK-NEXT: shr.u64 %rd27, %rd24, 40;
; CHECK-NEXT: st.param.b8 [func_retval0+5], %rd27;
; CHECK-NEXT: shr.u64 %rd28, %rd24, 32;
; CHECK-NEXT: st.param.b8 [func_retval0+4], %rd28;
; CHECK-NEXT: shr.u64 %rd29, %rd24, 24;
; CHECK-NEXT: st.param.b8 [func_retval0+3], %rd29;
; CHECK-NEXT: shr.u64 %rd30, %rd24, 16;
; CHECK-NEXT: st.param.b8 [func_retval0+2], %rd30;
; CHECK-NEXT: shr.u64 %rd31, %rd24, 8;
; CHECK-NEXT: st.param.b8 [func_retval0+1], %rd31;
; CHECK-NEXT: ret;
%ret = call %struct.64 @callee(ptr %p)
ret %struct.64 %ret
}
define i64 @test_param_type_mismatch(ptr %p) {
; CHECK-LABEL: test_param_type_mismatch(
; CHECK: {
; CHECK-NEXT: .reg .b64 %rd<3>;
; CHECK-EMPTY:
; CHECK-NEXT: // %bb.0:
; CHECK-NEXT: { // callseq 1, 0
; CHECK-NEXT: .param .b64 param0;
; CHECK-NEXT: .param .b64 retval0;
; CHECK-NEXT: prototype_1 : .callprototype (.param .b64 _) _ (.param .b64 _);
; CHECK-NEXT: st.param.b64 [param0], 7;
; CHECK-NEXT: mov.b64 %rd1, callee;
; CHECK-NEXT: call (retval0), %rd1, (param0), prototype_1;
; CHECK-NEXT: ld.param.b64 %rd2, [retval0];
; CHECK-NEXT: } // callseq 1
; CHECK-NEXT: st.param.b64 [func_retval0], %rd2;
; CHECK-NEXT: ret;
%ret = call i64 @callee(i64 7)
ret i64 %ret
}
define i64 @test_param_count_mismatch(ptr %p) {
; CHECK-LABEL: test_param_count_mismatch(
; CHECK: {
; CHECK-NEXT: .reg .b64 %rd<4>;
; CHECK-EMPTY:
; CHECK-NEXT: // %bb.0:
; CHECK-NEXT: ld.param.b64 %rd1, [test_param_count_mismatch_param_0];
; CHECK-NEXT: { // callseq 2, 0
; CHECK-NEXT: .param .b64 param0;
; CHECK-NEXT: .param .b64 param1;
; CHECK-NEXT: .param .b64 retval0;
; CHECK-NEXT: st.param.b64 [param0], %rd1;
; CHECK-NEXT: prototype_2 : .callprototype (.param .b64 _) _ (.param .b64 _, .param .b64 _);
; CHECK-NEXT: st.param.b64 [param1], 7;
; CHECK-NEXT: mov.b64 %rd2, callee;
; CHECK-NEXT: call (retval0), %rd2, (param0, param1), prototype_2;
; CHECK-NEXT: ld.param.b64 %rd3, [retval0];
; CHECK-NEXT: } // callseq 2
; CHECK-NEXT: st.param.b64 [func_retval0], %rd3;
; CHECK-NEXT: ret;
%ret = call i64 @callee(ptr %p, i64 7)
ret i64 %ret
}
define %struct.64 @test_return_type_mismatch_variadic(ptr %p) {
; CHECK-LABEL: test_return_type_mismatch_variadic(
; CHECK: {
; CHECK-NEXT: .reg .b64 %rd<32>;
; CHECK-EMPTY:
; CHECK-NEXT: // %bb.0:
; CHECK-NEXT: ld.param.b64 %rd1, [test_return_type_mismatch_variadic_param_0];
; CHECK-NEXT: { // callseq 3, 0
; CHECK-NEXT: .param .b64 param0;
; CHECK-NEXT: .param .align 1 .b8 retval0[8];
; CHECK-NEXT: st.param.b64 [param0], %rd1;
; CHECK-NEXT: prototype_3 : .callprototype (.param .align 1 .b8 _[8]) _ (.param .b64 _);
; CHECK-NEXT: mov.b64 %rd2, callee_variadic;
; CHECK-NEXT: call (retval0), %rd2, (param0), prototype_3;
; CHECK-NEXT: ld.param.b8 %rd3, [retval0+7];
; CHECK-NEXT: ld.param.b8 %rd4, [retval0+6];
; CHECK-NEXT: ld.param.b8 %rd5, [retval0+5];
; CHECK-NEXT: ld.param.b8 %rd6, [retval0+4];
; CHECK-NEXT: ld.param.b8 %rd7, [retval0+3];
; CHECK-NEXT: ld.param.b8 %rd8, [retval0+2];
; CHECK-NEXT: ld.param.b8 %rd9, [retval0+1];
; CHECK-NEXT: ld.param.b8 %rd10, [retval0];
; CHECK-NEXT: } // callseq 3
; CHECK-NEXT: shl.b64 %rd11, %rd9, 8;
; CHECK-NEXT: or.b64 %rd12, %rd11, %rd10;
; CHECK-NEXT: shl.b64 %rd13, %rd8, 16;
; CHECK-NEXT: shl.b64 %rd14, %rd7, 24;
; CHECK-NEXT: or.b64 %rd15, %rd14, %rd13;
; CHECK-NEXT: or.b64 %rd16, %rd15, %rd12;
; CHECK-NEXT: shl.b64 %rd17, %rd5, 8;
; CHECK-NEXT: or.b64 %rd18, %rd17, %rd6;
; CHECK-NEXT: shl.b64 %rd19, %rd4, 16;
; CHECK-NEXT: shl.b64 %rd20, %rd3, 24;
; CHECK-NEXT: or.b64 %rd21, %rd20, %rd19;
; CHECK-NEXT: or.b64 %rd22, %rd21, %rd18;
; CHECK-NEXT: shl.b64 %rd23, %rd22, 32;
; CHECK-NEXT: or.b64 %rd24, %rd23, %rd16;
; CHECK-NEXT: st.param.b8 [func_retval0], %rd10;
; CHECK-NEXT: shr.u64 %rd25, %rd24, 56;
; CHECK-NEXT: st.param.b8 [func_retval0+7], %rd25;
; CHECK-NEXT: shr.u64 %rd26, %rd24, 48;
; CHECK-NEXT: st.param.b8 [func_retval0+6], %rd26;
; CHECK-NEXT: shr.u64 %rd27, %rd24, 40;
; CHECK-NEXT: st.param.b8 [func_retval0+5], %rd27;
; CHECK-NEXT: shr.u64 %rd28, %rd24, 32;
; CHECK-NEXT: st.param.b8 [func_retval0+4], %rd28;
; CHECK-NEXT: shr.u64 %rd29, %rd24, 24;
; CHECK-NEXT: st.param.b8 [func_retval0+3], %rd29;
; CHECK-NEXT: shr.u64 %rd30, %rd24, 16;
; CHECK-NEXT: st.param.b8 [func_retval0+2], %rd30;
; CHECK-NEXT: shr.u64 %rd31, %rd24, 8;
; CHECK-NEXT: st.param.b8 [func_retval0+1], %rd31;
; CHECK-NEXT: ret;
%ret = call %struct.64 (ptr, ...) @callee_variadic(ptr %p)
ret %struct.64 %ret
}
define i64 @test_param_type_mismatch_variadic(ptr %p) {
; CHECK-LABEL: test_param_type_mismatch_variadic(
; CHECK: {
; CHECK-NEXT: .reg .b64 %rd<3>;
; CHECK-EMPTY:
; CHECK-NEXT: // %bb.0:
; CHECK-NEXT: ld.param.b64 %rd1, [test_param_type_mismatch_variadic_param_0];
; CHECK-NEXT: { // callseq 4, 0
; CHECK-NEXT: .param .align 8 .b8 param1[8];
; CHECK-NEXT: .param .b64 param0;
; CHECK-NEXT: .param .b64 retval0;
; CHECK-NEXT: st.param.b64 [param0], %rd1;
; CHECK-NEXT: st.param.b64 [param1], 7;
; CHECK-NEXT: call.uni (retval0), callee_variadic, (param0, param1);
; CHECK-NEXT: ld.param.b64 %rd2, [retval0];
; CHECK-NEXT: } // callseq 4
; CHECK-NEXT: st.param.b64 [func_retval0], %rd2;
; CHECK-NEXT: ret;
%ret = call i64 (ptr, ...) @callee_variadic(ptr %p, i64 7)
ret i64 %ret
}
define i64 @test_param_count_mismatch_variadic(ptr %p) {
; CHECK-LABEL: test_param_count_mismatch_variadic(
; CHECK: {
; CHECK-NEXT: .reg .b64 %rd<3>;
; CHECK-EMPTY:
; CHECK-NEXT: // %bb.0:
; CHECK-NEXT: ld.param.b64 %rd1, [test_param_count_mismatch_variadic_param_0];
; CHECK-NEXT: { // callseq 5, 0
; CHECK-NEXT: .param .align 8 .b8 param1[8];
; CHECK-NEXT: .param .b64 param0;
; CHECK-NEXT: .param .b64 retval0;
; CHECK-NEXT: st.param.b64 [param0], %rd1;
; CHECK-NEXT: st.param.b64 [param1], 7;
; CHECK-NEXT: call.uni (retval0), callee_variadic, (param0, param1);
; CHECK-NEXT: ld.param.b64 %rd2, [retval0];
; CHECK-NEXT: } // callseq 5
; CHECK-NEXT: st.param.b64 [func_retval0], %rd2;
; CHECK-NEXT: ret;
%ret = call i64 (ptr, ...) @callee_variadic(ptr %p, i64 7)
ret i64 %ret
}