The following works with PARALLEL but not with TARGET.
OpenMP states the following is supposed to work:
A = 5; // == this->A
B = 6; // == this->B
C[44] = 7; // == this->C; assume 'int C[100]'
#pragma omp <parallel|target> firstprivate(A,C) private(B)
{
A += 5; // Now: A is 10.
B = 7;
C[44] += 7; // Now: C[44] is 14.
// It is unspecified what value this->{A,B,C} has
}
// {A,B,C[44]} == this->{A,B,C[44]} are still {5,6,7}
* * *
In the C++ FE, that's handled by creating a temporary variable: v = create_temporary_var
(TREE_TYPE (m)); with SET_DECL_VALUE_EXPR (v, m); DECL_OMP_PRIVATIZED_MEMBER(v)
where 'm' is, e.g., 'this->A' - and a bunch of 'if
(DECL_OMP_PRIVATIZED_MEMBER(decl))'
checks in the g++ FE only. For PARALLEL, the VALUE_EXPR survives until omp-low.cc,
which handles this for (first)privatizing. But for TARGET, in
gimplify.cc, the following call in gimplify_omp_workshare (16813)
gimple *g = gimplify_and_return_first (OMP_BODY (expr), &body);
will turn the 'A' in the body into 'this->A'.
* * *
Thus, while after omplower there is the expected
#pragma omp target ... firstprivate(A) and also D.3081 =
.omp_data_i->A; A = ...; what actually gets used is D.3084
= .omp_data_i->D.3046; this = D.3084;
D.2996 = this->A; which unsurprisingly breaks.
* * *
This can be "fixed" by using the following patch. With that patch, the
-fdump-tree-omplower looks fine. But it does then fail with: during RTL
pass: expand g2.cpp:11:7: internal compiler error: in make_decl_rtl, at
varasm.cc:1443
for the 'A' with 'B = A' (where B is a non-member var) and 'A' is still
as the value expr 'this->A'.

--- a/gcc/gimplify.cc
+++ b/gcc/gimplify.cc
@@ -3285,12 +3285,15 @@ gimplify_var_or_parm_decl (tree *expr_p)
   if (gimplify_omp_ctxp && omp_notice_variable (gimplify_omp_ctxp, decl, true))
     return GS_ALL_DONE;
 
+  if (!flag_openmp) // Assume: C++'s DECL_OMP_PRIVATIZED_MEMBER (decl)
+    {
   /* If the decl is an alias for another expression, substitute it now.  */
   if (DECL_HAS_VALUE_EXPR_P (decl))
     {
       *expr_p = unshare_expr (DECL_VALUE_EXPR (decl));
       return GS_OK;
     }
+    }
 
   return GS_ALL_DONE;
 }

* * *
Any idea / suggestion how to handle
this best? One way I see would be to add a lang-hook here to check for
DECL_OMP_PRIVATIZED_MEMBER, similar to the hack above. And
then ensure that the DECL_VALUE_EXPR points to the var decl
in the target region (i.e. some hacking in omp-low.cc).
I have no idea whether that would work - nor whether that would be
the way forward. Thoughts?
Tobias
// Reproducer: (first)privatizing a non-static data member ('A', i.e.
// 'this->A') on OpenMP 'parallel' and 'target' constructs from inside a
// member function.
//
// Build-time switches:
//   TEMPL   - nonzero: 't' becomes a class template over T; otherwise T is
//             defined as 'int'.
//   PRIVATE - nonzero: every 'firstprivate' clause below is rewritten to
//             'private' by the macro.
#if TEMPL
template <typename T>
#else
#define T int
#endif
#if PRIVATE
#define firstprivate private
#endif
struct t {
  T A;

  // Runs four regions (two 'parallel', two 'target').  Each region
  //   - checks that its own copy of A starts with the value A had on entry,
  //   - overwrites that copy and stores it into the local B,
  // and afterwards the enclosing code checks that this->A is unchanged and
  // that B received the value written inside the region.  Every violated
  // expectation prints one "ERROR <region><suffix>" line; "OK" is printed
  // when the final this->A check passes.
  //
  // NOTE: in the PRIVATE build the privatized copy is not initialized from
  // this->A, so the "inside" checks are only meaningful for 'firstprivate'.
  void f()
  {
    T B = 49;

    // Region 1: parallel, A == 7 on entry.
    A = 7;
    #pragma omp parallel firstprivate(A) if(0) shared(B) default(none)
    {
      if (A != 7) __builtin_printf("ERROR 1b: %d (!= 7) inside omp parallel\n", A);
      A = 5;
      B = A;
    }
    if (A != 7) __builtin_printf("ERROR 1: %d (!= 7) omp parallel\n", A);
    if (B != 5) __builtin_printf("ERROR 1a: %d\n", B);

    // Region 2: parallel, A == 8 on entry.
    A = 8; B = 49;
    #pragma omp parallel firstprivate(A)if(0) shared(B) default(none)
    {
      if (A != 8) __builtin_printf("ERROR 2b: %d (!= 8) inside omp parallel\n", A);
      A = 6;
      B = A;
    }
    if (A != 8) __builtin_printf("ERROR 2: %d (!= 8) omp parallel\n", A);
    if (B != 6) __builtin_printf("ERROR 2a: %d\n", B);

    // Region 3: target, A == 8 on entry, so the firstprivate copy must be 8.
    A = 8; B = 49;
    #pragma omp target firstprivate(A) map(from:B) defaultmap(none)
    {
      if (A != 8) __builtin_printf("ERROR 3b: %d (!= 8) inside omp target\n", A);
      A = 7;
      B = A;
    }
    if (A != 8) __builtin_printf("ERROR 3: %d (!= 8) omp target\n", A);
    if (B != 7) __builtin_printf("ERROR 3a: %d\n", B);

    // Region 4: target, A == 9 on entry, so the firstprivate copy must be 9.
    A = 9; B = 49;
    #pragma omp target firstprivate(A) map(from:B) defaultmap(none)
    {
      if (A != 9) __builtin_printf("ERROR 4b: %d (!= 9) inside omp target\n", A);
      A = 8;
      B = A;
    }
    if (A != 9) __builtin_printf("ERROR 4: %d (!= 9) omp target\n", A); else __builtin_printf("OK\n");
    if (B != 8) __builtin_printf("ERROR 4a: %d\n", B);
  }
};
void bar() {
#if TEMPL
struct t<int> x;
#else
struct t x;
#endif
x.f();
}
// Program entry point: runs the reproducer once.
int main()
{
  bar();
  return 0;
}