forked from OSchip/llvm-project
130 lines
4.6 KiB
LLVM
130 lines
4.6 KiB
LLVM
; RUN: opt -passes=openmp-opt -debug-only=openmp-opt -disable-output < %s 2>&1 | FileCheck %s
|
|
; RUN: opt -passes=openmp-opt -pass-remarks-analysis=openmp-opt -disable-output < %s 2>&1 | FileCheck %s --check-prefix=REMARKS
|
|
; REQUIRES: asserts
|
|
; ModuleID = 'single_threaded_exeuction.c'
|
|
|
|
%struct.ident_t = type { i32, i32, i32, i32, i8* }
|
|
|
|
@0 = private unnamed_addr constant [1 x i8] c"\00", align 1
|
|
@1 = private unnamed_addr constant %struct.ident_t { i32 0, i32 2, i32 0, i32 0, i8* getelementptr inbounds ([1 x i8], [1 x i8]* @0, i32 0, i32 0) }, align 8
|
|
@kernel_exec_mode = weak constant i8 1
|
|
|
|
|
|
; CHECK-NOT: [openmp-opt] Basic block @kernel entry is executed by a single thread.
|
|
; CHECK: [openmp-opt] Basic block @kernel if.then is executed by a single thread.
|
|
; CHECK-NOT: [openmp-opt] Basic block @kernel if.else is executed by a single thread.
|
|
; CHECK-NOT: [openmp-opt] Basic block @kernel if.end is executed by a single thread.
|
|
define void @kernel() {
|
|
%call = call i32 @__kmpc_target_init(%struct.ident_t* nonnull @1, i8 1, i1 false, i1 false)
|
|
%cmp = icmp eq i32 %call, -1
|
|
br i1 %cmp, label %if.then, label %if.else
|
|
if.then:
|
|
br label %if.end
|
|
if.else:
|
|
br label %if.end
|
|
if.end:
|
|
call void @__kmpc_target_deinit(%struct.ident_t* null, i8 1, i1 true)
|
|
ret void
|
|
}
|
|
|
|
; REMARKS: remark: single_threaded_execution.c:1:0: Could not internalize function. Some optimizations may not be possible.
|
|
; REMARKS-NOT: remark: single_threaded_execution.c:1:0: Could not internalize function. Some optimizations may not be possible.
|
|
|
|
; CHECK-NOT: [openmp-opt] Basic block @nvptx entry is executed by a single thread.
|
|
; CHECK-DAG: [openmp-opt] Basic block @nvptx if.then is executed by a single thread.
|
|
; CHECK-NOT: [openmp-opt] Basic block @nvptx if.end is executed by a single thread.
|
|
; Function Attrs: noinline
|
|
define void @nvptx() {
|
|
entry:
|
|
%call = call i32 @llvm.nvvm.read.ptx.sreg.tid.x()
|
|
%cmp = icmp eq i32 %call, 0
|
|
br i1 %cmp, label %if.then, label %if.end
|
|
|
|
if.then:
|
|
call void @foo()
|
|
call void @bar()
|
|
call void @baz()
|
|
call void @cold()
|
|
br label %if.end
|
|
|
|
if.end:
|
|
ret void
|
|
}
|
|
|
|
; CHECK-NOT: [openmp-opt] Basic block @amdgcn entry is executed by a single thread.
|
|
; CHECK-DAG: [openmp-opt] Basic block @amdgcn if.then is executed by a single thread.
|
|
; CHECK-NOT: [openmp-opt] Basic block @amdgcn if.end is executed by a single thread.
|
|
; Function Attrs: noinline
|
|
define void @amdgcn() {
|
|
entry:
|
|
%call = call i32 @llvm.amdgcn.workitem.id.x()
|
|
%cmp = icmp eq i32 %call, 0
|
|
br i1 %cmp, label %if.then, label %if.end
|
|
|
|
if.then:
|
|
call void @foo()
|
|
call void @bar()
|
|
call void @baz()
|
|
call void @cold()
|
|
br label %if.end
|
|
|
|
if.end:
|
|
ret void
|
|
}
|
|
|
|
; CHECK: [openmp-opt] Basic block @foo entry is executed by a single thread.
|
|
; Function Attrs: noinline
|
|
define internal void @foo() {
|
|
entry:
|
|
ret void
|
|
}
|
|
|
|
; CHECK: [openmp-opt] Basic block @bar.internalized entry is executed by a single thread.
|
|
; Function Attrs: noinline
|
|
define void @bar() {
|
|
entry:
|
|
ret void
|
|
}
|
|
|
|
; CHECK-NOT: [openmp-opt] Basic block @baz entry is executed by a single thread.
|
|
; Function Attrs: noinline
|
|
define weak void @baz() !dbg !8 {
|
|
entry:
|
|
ret void
|
|
}
|
|
|
|
; CHECK-NOT: [openmp-opt] Basic block @cold entry is executed by a single thread.
|
|
; Function Attrs: cold convergent noinline nounwind optnone mustprogress
|
|
define weak void @cold() #0 !dbg !9 {
|
|
entry:
|
|
ret void
|
|
}
|
|
|
|
declare i32 @llvm.nvvm.read.ptx.sreg.tid.x()
|
|
|
|
declare i32 @llvm.amdgcn.workitem.id.x()
|
|
|
|
declare void @__kmpc_kernel_prepare_parallel(i8*)
|
|
|
|
declare i32 @__kmpc_target_init(%struct.ident_t*, i8, i1, i1)
|
|
|
|
declare void @__kmpc_target_deinit(%struct.ident_t*, i8, i1)
|
|
|
|
attributes #0 = { cold noinline }
|
|
|
|
!llvm.dbg.cu = !{!0}
|
|
!llvm.module.flags = !{!3, !4, !5, !6}
|
|
!nvvm.annotations = !{!7}
|
|
|
|
!0 = distinct !DICompileUnit(language: DW_LANG_C99, file: !1, producer: "clang version 12.0.0", isOptimized: false, runtimeVersion: 0, emissionKind: FullDebug, enums: !2, splitDebugInlining: false, nameTableKind: None)
|
|
!1 = !DIFile(filename: "single_threaded_execution.c", directory: "/tmp/single_threaded_execution.c")
|
|
!2 = !{}
|
|
!3 = !{i32 2, !"Debug Info Version", i32 3}
|
|
!4 = !{i32 1, !"wchar_size", i32 4}
|
|
!5 = !{i32 7, !"openmp", i32 50}
|
|
!6 = !{i32 7, !"openmp-device", i32 50}
|
|
!7 = !{void ()* @kernel, !"kernel", i32 1}
|
|
!8 = distinct !DISubprogram(name: "bar", scope: !1, file: !1, line: 8, type: !10, scopeLine: 1, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !0, retainedNodes: !2)
|
|
!9 = distinct !DISubprogram(name: "cold", scope: !1, file: !1, line: 8, type: !10, scopeLine: 2, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !0, retainedNodes: !2)
|
|
!10 = !DISubroutineType(types: !2)
|