Issue |
126949
|
Summary |
[OMPIRBuilder] - Empty target task proxy function generated by OMPIRBuilder (`emitTargetTaskProxyFunction`)
|
Labels |
openmp,
mlir,
llvm:openmpirbuilder
|
Assignees |
|
Reporter |
bhandarkar-pranav
|
Reproducer:
```
$> mlir-translate -mlir-to-llvmir ${LLVM_PROJECT_DIR}/mlir/test/Target/LLVMIR/omptarget-depend-host-only
$> cat ${LLVM_PROJECT_DIR}/mlir/test/Target/LLVMIR/omptarget-depend-host-only.mlir
// RUN: mlir-translate -mlir-to-llvmir %s | FileCheck %s
module attributes {omp.is_target_device = false} {
llvm.func @omp_target_depend_() {
%0 = llvm.mlir.constant(39 : index) : i64
%1 = llvm.mlir.constant(1 : index) : i64
%2 = llvm.mlir.constant(40 : index) : i64
%3 = omp.map.bounds lower_bound(%1 : i64) upper_bound(%0 : i64) extent(%2 : i64) stride(%1 : i64) start_idx(%1 : i64)
%4 = llvm.mlir.addressof @_QFEa : !llvm.ptr
%5 = omp.map.info var_ptr(%4 : !llvm.ptr, !llvm.array<40 x i32>) map_clauses(from) capture(ByRef) bounds(%3) -> !llvm.ptr {name = "a"}
omp.target depend(taskdependin -> %4 : !llvm.ptr) map_entries(%5 -> %arg0 : !llvm.ptr) {
%6 = llvm.mlir.constant(100 : index) : i32
llvm.store %6, %arg0 : i32, !llvm.ptr
omp.terminator
}
llvm.return
}
llvm.mlir.global internal @_QFEa() {addr_space = 0 : i32} : !llvm.array<40 x i32> {
%0 = llvm.mlir.zero : !llvm.array<40 x i32>
llvm.return %0 : !llvm.array<40 x i32>
}
}
// CHECK: define void @omp_target_depend_()
// CHECK-NOT: define {{.*}} @
// CHECK-NOT: call i32 @__tgt_target_kernel({{.*}})
// CHECK: call void @__omp_offloading_[[DEV:.*]]_[[FIL:.*]]_omp_target_depend__l[[LINE:.*]](ptr {{.*}})
// CHECK-NEXT: ret void
// CHECK: define internal void @__omp_offloading_[[DEV]]_[[FIL]]_omp_target_depend__l[[LINE]](ptr %[[ADDR_A:.*]])
// CHECK: store i32 100, ptr %[[ADDR_A]], align 4
```
Two problems in the output
1. Empty target task proxy function `@.omp_target_task_proxy_func`
```
define internal void @.omp_target_task_proxy_func(i32 %thread.id, ptr %task) {
entry:
ret void
}
```
2. After 1 is fixed, we'll end up with dual execution of the kernel because we hit a corner case (single basic block task bodies) in `OpenMPIRBuilder::OutlineInfo::collectBlocks` such that the entire task body is not outlined in the target task.
```
codeRepl: ; preds = %entry
%omp_global_thread_num = call i32 @__kmpc_global_thread_num(ptr @2)
%5 = call ptr @__kmpc_omp_task_alloc(ptr @2, i32 %omp_global_thread_num, i32 0, i64 40, i64 0, ptr @.omp_target_task_proxy_func)
call void @__kmpc_omp_wait_deps(ptr @2, i32 %omp_global_thread_num, i32 1, ptr %.dep.arr.addr, i32 0, ptr null)
call void @__kmpc_omp_task_begin_if0(ptr @2, i32 %omp_global_thread_num, ptr %5)
call void @.omp_target_task_proxy_func(i32 %omp_global_thread_num, ptr %5) ;;; first execution of the kernel once problem 1 is fixed.
call void @__kmpc_omp_task_complete_if0(ptr @2, i32 %omp_global_thread_num, ptr %5)
br label %target.task.body
target.task.body: ; preds = %codeRepl
call void @__omp_offloading_10307_a581555_omp_target_depend__l11(ptr @_QFEa) ;;;; Second execution of the kernel when problem 1 is fixed
ret void
}
```
_______________________________________________
llvm-bugs mailing list
llvm-bugs@lists.llvm.org
https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-bugs