79 lines
2.4 KiB
LLVM
79 lines
2.4 KiB
LLVM
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -verify-machineinstrs < %s | FileCheck %s
|
|
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -verify-machineinstrs --amdhsa-code-object-version=5 < %s | FileCheck -check-prefixes=V5 %s
|
|
|
|
; CHECK-LABEL: {{^}}recursive:
|
|
; CHECK: ScratchSize: 16
|
|
define void @recursive() {
|
|
call void @recursive()
|
|
store volatile i32 0, i32 addrspace(1)* undef
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: {{^}}tail_recursive:
|
|
; CHECK: ScratchSize: 0
|
|
define void @tail_recursive() {
|
|
tail call void @tail_recursive()
|
|
ret void
|
|
}
|
|
|
|
define void @calls_tail_recursive() norecurse {
|
|
tail call void @tail_recursive()
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: {{^}}tail_recursive_with_stack:
|
|
define void @tail_recursive_with_stack() {
|
|
%alloca = alloca i32, addrspace(5)
|
|
store volatile i32 0, i32 addrspace(5)* %alloca
|
|
tail call void @tail_recursive_with_stack()
|
|
ret void
|
|
}
|
|
|
|
; For an arbitrary recursive call, report a large number for unknown stack
|
|
; usage for code object v4 and older
|
|
; CHECK-LABEL: {{^}}calls_recursive:
|
|
; CHECK: .amdhsa_private_segment_fixed_size 16400{{$}}
|
|
;
|
|
; V5-LABEL: {{^}}calls_recursive:
|
|
; V5: .amdhsa_private_segment_fixed_size 0{{$}}
|
|
; V5: .amdhsa_uses_dynamic_stack 1
|
|
define amdgpu_kernel void @calls_recursive() {
|
|
call void @recursive()
|
|
ret void
|
|
}
|
|
|
|
; Make sure we do not report a huge stack size for tail recursive
|
|
; functions
|
|
; CHECK-LABEL: {{^}}kernel_indirectly_calls_tail_recursive:
|
|
; CHECK: .amdhsa_private_segment_fixed_size 0{{$}}
|
|
define amdgpu_kernel void @kernel_indirectly_calls_tail_recursive() {
|
|
call void @calls_tail_recursive()
|
|
ret void
|
|
}
|
|
|
|
; TODO: Even though tail_recursive is only called as a tail call, we
|
|
; end up treating it as generally recursive call from the regular call
|
|
; in the kernel.
|
|
|
|
; CHECK-LABEL: {{^}}kernel_calls_tail_recursive:
|
|
; CHECK: .amdhsa_private_segment_fixed_size 16384{{$}}
|
|
;
|
|
; V5-LABEL: {{^}}kernel_calls_tail_recursive:
|
|
; V5: .amdhsa_private_segment_fixed_size 0{{$}}
|
|
; V5: .amdhsa_uses_dynamic_stack 1
|
|
define amdgpu_kernel void @kernel_calls_tail_recursive() {
|
|
call void @tail_recursive()
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: {{^}}kernel_calls_tail_recursive_with_stack:
|
|
; CHECK: .amdhsa_private_segment_fixed_size 16384{{$}}
|
|
;
|
|
; V5-LABEL: {{^}}kernel_calls_tail_recursive_with_stack:
|
|
; V5: .amdhsa_private_segment_fixed_size 8{{$}}
|
|
; V5: .amdhsa_uses_dynamic_stack 1
|
|
define amdgpu_kernel void @kernel_calls_tail_recursive_with_stack() {
|
|
call void @tail_recursive_with_stack()
|
|
ret void
|
|
}
|