Hi! The ugly part is that OpenMP 5.1 made omp_all_memory a reserved identifier which isn't allowed to be used anywhere but in the depend clause, this is against how everything else has been handled in OpenMP so far (where some identifiers could have special meaning in some OpenMP clauses or pragmas but not elsewhere). The patch handles it by making it a conditional keyword (for -fopenmp only) and emitting a better diagnostics when it is used in a primary expression. Having a nicer diagnostics when e.g. trying to do int omp_all_memory; or int *omp_all_memory[10]; etc. would mean changing too many spots and hooking into name lookups to reject declaring any such symbols would be too ugly and I'm afraid there are way too many spots where one can introduce a name (variables, functions, namespaces, struct, enum, enumerators, template arguments, ...).
Otherwise, the handling is quite simple, normal depend clauses lower into addresses of variables being handed over to the library, for omp_all_memory I'm using NULL pointers. omp_all_memory can only be used with inout or out depend kinds and means that a task is dependent on all previously created sibling tasks that have any dependency (of any depend kind) and that any later created sibling tasks will be dependent on it if they have any dependency. Bootstrapped/regtested on x86_64-linux and i686-linux, committed to trunk. 2022-05-12 Jakub Jelinek <ja...@redhat.com> gcc/ * gimplify.cc (gimplify_omp_depend): Don't build_fold_addr_expr if null_pointer_node. (gimplify_scan_omp_clauses): Likewise. * tree-pretty-print.cc (dump_omp_clause): Print null_pointer_node as omp_all_memory. gcc/c-family/ * c-common.h (enum rid): Add RID_OMP_ALL_MEMORY. * c-omp.cc (c_finish_omp_depobj): Don't build_fold_addr_expr if null_pointer_node. gcc/c/ * c-parser.cc (c_parse_init): Register omp_all_memory as keyword if flag_openmp. (c_parser_postfix_expression): Diagnose uses of omp_all_memory in postfix expressions. (c_parser_omp_variable_list): Handle omp_all_memory in depend clause. * c-typeck.cc (c_finish_omp_clauses): Handle omp_all_memory keyword in depend clause as null_pointer_node, diagnose invalid uses. gcc/cp/ * lex.cc (init_reswords): Register omp_all_memory as keyword if flag_openmp. * parser.cc (cp_parser_primary_expression): Diagnose uses of omp_all_memory in postfix expressions. (cp_parser_omp_var_list_no_open): Handle omp_all_memory in depend clause. * semantics.cc (finish_omp_clauses): Handle omp_all_memory keyword in depend clause as null_pointer_node, diagnose invalid uses. * pt.cc (tsubst_omp_clause_decl): Pass through omp_all_memory. gcc/testsuite/ * c-c++-common/gomp/all-memory-1.c: New test. * c-c++-common/gomp/all-memory-2.c: New test. * c-c++-common/gomp/all-memory-3.c: New test. * g++.dg/gomp/all-memory-1.C: New test. * g++.dg/gomp/all-memory-2.C: New test. libgomp/ * libgomp.h (struct gomp_task): Add depend_all_memory member. * task.c (gomp_init_task): Initialize depend_all_memory. (gomp_task_handle_depend): Handle omp_all_memory. (gomp_task_run_post_handle_depend_hash): Clear parent->depend_all_memory if equal to current task. (gomp_task_maybe_wait_for_dependencies): Handle omp_all_memory. * testsuite/libgomp.c-c++-common/depend-1.c: New test. * testsuite/libgomp.c-c++-common/depend-2.c: New test. * testsuite/libgomp.c-c++-common/depend-3.c: New test. --- gcc/gimplify.cc.jj 2022-05-09 09:09:20.402472032 +0200 +++ gcc/gimplify.cc 2022-05-11 09:32:01.961698970 +0200 @@ -8623,7 +8623,8 @@ gimplify_omp_depend (tree *list_p, gimpl } if (error_operand_p (TREE_VALUE (t))) return 2; - TREE_VALUE (t) = build_fold_addr_expr (TREE_VALUE (t)); + if (TREE_VALUE (t) != null_pointer_node) + TREE_VALUE (t) = build_fold_addr_expr (TREE_VALUE (t)); r = build4 (ARRAY_REF, ptr_type_node, array, cnts[i], NULL_TREE, NULL_TREE); tem = build2_loc (OMP_CLAUSE_LOCATION (c), MODIFY_EXPR, @@ -8650,7 +8651,8 @@ gimplify_omp_depend (tree *list_p, gimpl } if (error_operand_p (OMP_CLAUSE_DECL (c))) return 2; - OMP_CLAUSE_DECL (c) = build_fold_addr_expr (OMP_CLAUSE_DECL (c)); + if (OMP_CLAUSE_DECL (c) != null_pointer_node) + OMP_CLAUSE_DECL (c) = build_fold_addr_expr (OMP_CLAUSE_DECL (c)); if (gimplify_expr (&OMP_CLAUSE_DECL (c), pre_p, NULL, is_gimple_val, fb_rvalue) == GS_ERROR) return 2; @@ -10346,12 +10348,15 @@ gimplify_scan_omp_clauses (tree *list_p, remove = true; break; } - OMP_CLAUSE_DECL (c) = build_fold_addr_expr (OMP_CLAUSE_DECL (c)); - if (gimplify_expr (&OMP_CLAUSE_DECL (c), pre_p, NULL, - is_gimple_val, fb_rvalue) == GS_ERROR) + if (OMP_CLAUSE_DECL (c) != null_pointer_node) { - remove = true; - break; + OMP_CLAUSE_DECL (c) = build_fold_addr_expr (OMP_CLAUSE_DECL (c)); + if (gimplify_expr (&OMP_CLAUSE_DECL (c), pre_p, NULL, + is_gimple_val, fb_rvalue) == GS_ERROR) + { + remove = true; + break; + } } if (code == OMP_TASK) ctx->has_depend = true; --- gcc/tree-pretty-print.cc.jj 2022-05-06 08:43:16.499060072 +0200 +++ gcc/tree-pretty-print.cc 2022-05-11 09:32:02.122696768 +0200 @@ -850,7 +850,10 @@ dump_omp_clause (pretty_printer *pp, tre pp_string (pp, name); pp_colon (pp); } - dump_generic_node (pp, t, spc, flags, false); + if (t == null_pointer_node) + pp_string (pp, "omp_all_memory"); + else + dump_generic_node (pp, t, spc, flags, false); pp_right_paren (pp); } break; --- gcc/c-family/c-common.h.jj 2022-05-09 18:20:05.036884184 +0200 +++ gcc/c-family/c-common.h 2022-05-11 09:32:02.114696878 +0200 @@ -219,6 +219,9 @@ enum rid RID_AT_INTERFACE, RID_AT_IMPLEMENTATION, + /* OpenMP */ + RID_OMP_ALL_MEMORY, + /* Named address support, mapping the keyword to a particular named address number. Named address space 0 is reserved for the generic address. If there are more than 254 named addresses, the addr_space_t type will need --- gcc/c-family/c-omp.cc.jj 2022-03-14 10:34:34.124924371 +0100 +++ gcc/c-family/c-omp.cc 2022-05-11 19:55:26.364606451 +0200 @@ -757,7 +757,7 @@ c_finish_omp_depobj (location_t loc, tre t = build2 (COMPOUND_EXPR, TREE_TYPE (t1), TREE_OPERAND (t, 0), t1); } - else + else if (t != null_pointer_node) t = build_fold_addr_expr (t); break; default: --- gcc/c/c-parser.cc.jj 2022-05-09 18:20:05.041884116 +0200 +++ gcc/c/c-parser.cc 2022-05-11 09:32:02.103697028 +0200 @@ -165,6 +165,14 @@ c_parse_init (void) C_SET_RID_CODE (id, RID_FIRST_INT_N + i); C_IS_RESERVED_WORD (id) = 1; } + + if (flag_openmp) + { + id = get_identifier ("omp_all_memory"); + C_SET_RID_CODE (id, RID_OMP_ALL_MEMORY); + C_IS_RESERVED_WORD (id) = 1; + ridpointers [RID_OMP_ALL_MEMORY] = id; + } } /* A parser structure recording information about the state and @@ -10202,6 +10210,13 @@ c_parser_postfix_expression (c_parser *p case RID_GENERIC: expr = c_parser_generic_selection (parser); break; + case RID_OMP_ALL_MEMORY: + gcc_assert (flag_openmp); + c_parser_consume_token (parser); + error_at (loc, "%<omp_all_memory%> may only be used in OpenMP " + "%<depend%> clause"); + expr.set_error (); + break; default: c_parser_error (parser, "expected expression"); expr.set_error (); @@ -13025,7 +13040,19 @@ c_parser_omp_variable_list (c_parser *pa if (c_parser_next_token_is_not (parser, CPP_NAME) || c_parser_peek_token (parser)->id_kind != C_ID_ID) { - struct c_expr expr = c_parser_expr_no_commas (parser, NULL); + struct c_expr expr; + if (kind == OMP_CLAUSE_DEPEND + && c_parser_next_token_is_keyword (parser, + RID_OMP_ALL_MEMORY) + && (c_parser_peek_2nd_token (parser)->type == CPP_COMMA + || (c_parser_peek_2nd_token (parser)->type + == CPP_CLOSE_PAREN))) + { + expr.value = ridpointers[RID_OMP_ALL_MEMORY]; + c_parser_consume_token (parser); + } + else + expr = c_parser_expr_no_commas (parser, NULL); if (expr.value != error_mark_node) { tree u = build_omp_clause (clause_loc, kind); --- gcc/c/c-typeck.cc.jj 2022-05-06 08:43:16.485060264 +0200 +++ gcc/c/c-typeck.cc 2022-05-11 09:32:02.078697370 +0200 @@ -14832,6 +14832,18 @@ c_finish_omp_clauses (tree clauses, enum } if (t == error_mark_node) remove = true; + else if (OMP_CLAUSE_CODE (c) == OMP_CLAUSE_DEPEND + && t == ridpointers[RID_OMP_ALL_MEMORY]) + { + if (OMP_CLAUSE_DEPEND_KIND (c) != OMP_CLAUSE_DEPEND_OUT + && OMP_CLAUSE_DEPEND_KIND (c) != OMP_CLAUSE_DEPEND_INOUT) + { + error_at (OMP_CLAUSE_LOCATION (c), + "%<omp_all_memory%> used with %<depend%> kind " + "other than %<out%> or %<inout%>"); + remove = true; + } + } else if (!lvalue_p (t)) { error_at (OMP_CLAUSE_LOCATION (c), @@ -14873,24 +14885,32 @@ c_finish_omp_clauses (tree clauses, enum } if (!remove) { - tree addr = build_unary_op (OMP_CLAUSE_LOCATION (c), ADDR_EXPR, - t, false); - if (addr == error_mark_node) - remove = true; + if (t == ridpointers[RID_OMP_ALL_MEMORY]) + t = null_pointer_node; else { + tree addr = build_unary_op (OMP_CLAUSE_LOCATION (c), + ADDR_EXPR, t, false); + if (addr == error_mark_node) + { + remove = true; + break; + } t = build_indirect_ref (OMP_CLAUSE_LOCATION (c), addr, RO_UNARY_STAR); if (t == error_mark_node) - remove = true; - else if (TREE_CODE (OMP_CLAUSE_DECL (c)) == TREE_LIST - && TREE_PURPOSE (OMP_CLAUSE_DECL (c)) - && (TREE_CODE (TREE_PURPOSE (OMP_CLAUSE_DECL (c))) - == TREE_VEC)) - TREE_VALUE (OMP_CLAUSE_DECL (c)) = t; - else - OMP_CLAUSE_DECL (c) = t; + { + remove = true; + break; + } } + if (TREE_CODE (OMP_CLAUSE_DECL (c)) == TREE_LIST + && TREE_PURPOSE (OMP_CLAUSE_DECL (c)) + && (TREE_CODE (TREE_PURPOSE (OMP_CLAUSE_DECL (c))) + == TREE_VEC)) + TREE_VALUE (OMP_CLAUSE_DECL (c)) = t; + else + OMP_CLAUSE_DECL (c) = t; } break; --- gcc/cp/lex.cc.jj 2022-05-09 18:20:05.069883739 +0200 +++ gcc/cp/lex.cc 2022-05-11 09:32:01.999698450 +0200 @@ -273,6 +273,14 @@ init_reswords (void) C_SET_RID_CODE (id, RID_FIRST_INT_N + i); set_identifier_kind (id, cik_keyword); } + + if (flag_openmp) + { + id = get_identifier ("omp_all_memory"); + C_SET_RID_CODE (id, RID_OMP_ALL_MEMORY); + set_identifier_kind (id, cik_keyword); + ridpointers [RID_OMP_ALL_MEMORY] = id; + } } static void --- gcc/cp/parser.cc.jj 2022-05-10 18:33:14.027038061 +0200 +++ gcc/cp/parser.cc 2022-05-11 09:32:02.054697698 +0200 @@ -5876,6 +5876,14 @@ cp_parser_primary_expression (cp_parser case RID_AT_SELECTOR: return cp_parser_objc_expression (parser); + case RID_OMP_ALL_MEMORY: + gcc_assert (flag_openmp); + cp_lexer_consume_token (parser->lexer); + error_at (token->location, + "%<omp_all_memory%> may only be used in OpenMP " + "%<depend%> clause"); + return error_mark_node; + case RID_TEMPLATE: if (parser->in_function_body && (cp_lexer_peek_nth_token (parser->lexer, 2)->type @@ -36732,6 +36740,15 @@ cp_parser_omp_var_list_no_open (cp_parse decl = cp_parser_primary_expression (parser, false, false, false, &idk); } + else if (kind == OMP_CLAUSE_DEPEND + && cp_parser_is_keyword (token, RID_OMP_ALL_MEMORY) + && (cp_lexer_nth_token_is (parser->lexer, 2, CPP_COMMA) + || cp_lexer_nth_token_is (parser->lexer, 2, + CPP_CLOSE_PAREN))) + { + decl = ridpointers[RID_OMP_ALL_MEMORY]; + cp_lexer_consume_token (parser->lexer); + } else { name = cp_parser_id_expression (parser, /*template_p=*/false, --- gcc/cp/semantics.cc.jj 2022-05-09 09:09:20.248474154 +0200 +++ gcc/cp/semantics.cc 2022-05-11 09:32:02.011698286 +0200 @@ -7815,6 +7815,20 @@ finish_omp_clauses (tree clauses, enum c } if (t == error_mark_node) remove = true; + else if (OMP_CLAUSE_CODE (c) == OMP_CLAUSE_DEPEND + && t == ridpointers[RID_OMP_ALL_MEMORY]) + { + if (OMP_CLAUSE_DEPEND_KIND (c) != OMP_CLAUSE_DEPEND_OUT + && OMP_CLAUSE_DEPEND_KIND (c) != OMP_CLAUSE_DEPEND_INOUT) + { + error_at (OMP_CLAUSE_LOCATION (c), + "%<omp_all_memory%> used with %<depend%> kind " + "other than %<out%> or %<inout%>"); + remove = true; + } + if (processing_template_decl) + break; + } else if (processing_template_decl && TREE_CODE (t) != OVERLOAD) break; else if (!lvalue_p (t)) @@ -7867,24 +7881,32 @@ finish_omp_clauses (tree clauses, enum c } if (!remove) { - tree addr = cp_build_addr_expr (t, tf_warning_or_error); - if (addr == error_mark_node) - remove = true; + if (t == ridpointers[RID_OMP_ALL_MEMORY]) + t = null_pointer_node; else { + tree addr = cp_build_addr_expr (t, tf_warning_or_error); + if (addr == error_mark_node) + { + remove = true; + break; + } t = cp_build_indirect_ref (OMP_CLAUSE_LOCATION (c), addr, RO_UNARY_STAR, tf_warning_or_error); if (t == error_mark_node) - remove = true; - else if (TREE_CODE (OMP_CLAUSE_DECL (c)) == TREE_LIST - && TREE_PURPOSE (OMP_CLAUSE_DECL (c)) - && (TREE_CODE (TREE_PURPOSE (OMP_CLAUSE_DECL (c))) - == TREE_VEC)) - TREE_VALUE (OMP_CLAUSE_DECL (c)) = t; - else - OMP_CLAUSE_DECL (c) = t; + { + remove = true; + break; + } } + if (TREE_CODE (OMP_CLAUSE_DECL (c)) == TREE_LIST + && TREE_PURPOSE (OMP_CLAUSE_DECL (c)) + && (TREE_CODE (TREE_PURPOSE (OMP_CLAUSE_DECL (c))) + == TREE_VEC)) + TREE_VALUE (OMP_CLAUSE_DECL (c)) = t; + else + OMP_CLAUSE_DECL (c) = t; } break; case OMP_CLAUSE_DETACH: --- gcc/cp/pt.cc.jj 2022-05-10 18:33:14.050037757 +0200 +++ gcc/cp/pt.cc 2022-05-11 09:32:01.989698587 +0200 @@ -17601,8 +17601,8 @@ static tree tsubst_omp_clause_decl (tree decl, tree args, tsubst_flags_t complain, tree in_decl, tree *iterator_cache) { - if (decl == NULL_TREE) - return NULL_TREE; + if (decl == NULL_TREE || decl == ridpointers[RID_OMP_ALL_MEMORY]) + return decl; /* Handle OpenMP iterators. */ if (TREE_CODE (decl) == TREE_LIST --- gcc/testsuite/c-c++-common/gomp/all-memory-1.c.jj 2022-05-11 09:32:02.055697684 +0200 +++ gcc/testsuite/c-c++-common/gomp/all-memory-1.c 2022-05-11 09:32:02.055697684 +0200 @@ -0,0 +1,52 @@ +int omp_all_memory; /* { dg-error "expected" } */ + +void +foo (void) +{ + int p = (&omp_all_memory)[0]; /* { dg-error "'omp_all_memory' may only be used in OpenMP 'depend' clause" } */ +} + +void +bar (void) +{ + int *omp_all_memory; /* { dg-error "expected" } */ +} + +void +baz (void) +{ + struct omp_all_memory { int a; }; /* { dg-error "expected" } */ +} + +void +qux (void) +{ + union omp_all_memory { int a; }; /* { dg-error "expected" } */ +} + +void +corge (void) +{ + enum omp_all_memory { OAM; }; /* { dg-error "expected" } */ +} + +void +garply (void) +{ + enum E { omp_all_memory }; } /* { dg-error "expected" } */ + +void +boo (void) +{ + int x, y; + #pragma omp task private (omp_all_memory) /* { dg-error "expected" } */ + ; + #pragma omp task depend(inout: *&omp_all_memory) /* { dg-error "'omp_all_memory' may only be used in OpenMP 'depend' clause" } */ + ; + #pragma omp task depend(inout: omp_all_memory[0]) /* { dg-error "'omp_all_memory' may only be used in OpenMP 'depend' clause" } */ + ; + #pragma omp task depend(in: omp_all_memory) /* { dg-error "'omp_all_memory' used with 'depend' kind other than 'out' or 'inout'" } */ + ; + #pragma omp task depend(mutexinoutset: omp_all_memory) /* { dg-error "'omp_all_memory' used with 'depend' kind other than 'out' or 'inout'" } */ + ; +} --- gcc/testsuite/c-c++-common/gomp/all-memory-2.c.jj 2022-05-11 09:32:02.054697698 +0200 +++ gcc/testsuite/c-c++-common/gomp/all-memory-2.c 2022-05-11 09:32:02.054697698 +0200 @@ -0,0 +1,55 @@ +/* { dg-options "-fno-openmp" } */ + +int omp_all_memory; /* { dg-bogus "expected" } */ + +void +foo (void) +{ + int p = (&omp_all_memory)[0]; /* { dg-bogus "'omp_all_memory' may only be used in OpenMP 'depend' clause" } */ +} + +void +bar (void) +{ + int *omp_all_memory; /* { dg-bogus "expected" } */ +} + +void +baz (void) +{ + struct omp_all_memory { int a; }; /* { dg-bogus "expected" } */ +} + +void +qux (void) +{ + union omp_all_memory { int a; }; /* { dg-bogus "expected" } */ +} + +void +corge (void) +{ + enum omp_all_memory { OAM }; /* { dg-bogus "expected" } */ +} + +void +garply (void) +{ + enum E { omp_all_memory }; /* { dg-bogus "expected" } */ +} + +void +boo (void) +{ + int x, y; + #pragma omp task private (omp_all_memory) + ; + #pragma omp task depend(inout: *&omp_all_memory) + ; + #pragma omp task depend(inout: omp_all_memory[0]) + ; + #pragma omp task depend(in: omp_all_memory) + ; + #pragma omp task depend(mutexinoutset: omp_all_memory) + ; +} --- gcc/testsuite/c-c++-common/gomp/all-memory-3.c.jj 2022-05-11 09:32:02.055697684 +0200 +++ gcc/testsuite/c-c++-common/gomp/all-memory-3.c 2022-05-11 09:32:02.054697698 +0200 @@ -0,0 +1,22 @@ +typedef struct __attribute__((__aligned__ (sizeof (void *)))) omp_depend_t { + char __omp_depend_t__[2 * sizeof (void *)]; +} omp_depend_t; + +omp_depend_t z; + +void +foo (void) +{ + int x = 0, y = 0; + #pragma omp task depend(out: omp_all_memory) + ; + #pragma omp task depend(inout: omp_all_memory) + ; + #pragma omp task depend(out: x, omp_all_memory, y) + ; + #pragma omp task depend(inout: omp_all_memory, y) + ; + #pragma omp task depend(out: x, omp_all_memory) + ; + #pragma omp depobj (z) depend (inout: omp_all_memory) +} --- gcc/testsuite/g++.dg/gomp/all-memory-1.C.jj 2022-05-11 09:32:02.055697684 +0200 +++ gcc/testsuite/g++.dg/gomp/all-memory-1.C 2022-05-11 09:32:02.055697684 +0200 @@ -0,0 +1,24 @@ +namespace A +{ + namespace omp_all_memory // { dg-error "expected" } + { + } +} + +namespace B +{ + template <int N> + void omp_all_memory () {} // { dg-error "expected" } +} + +namespace C +{ + template <int N> + struct omp_all_memory {}; // { dg-error "expected" } +} + +namespace D +{ + template <int omp_all_memory> // { dg-error "expected" } + struct S {}; +} --- gcc/testsuite/g++.dg/gomp/all-memory-2.C.jj 2022-05-11 09:32:02.055697684 +0200 +++ gcc/testsuite/g++.dg/gomp/all-memory-2.C 2022-05-11 09:32:02.055697684 +0200 @@ -0,0 +1,26 @@ +// { dg-options "-fno-openmp" } + +namespace A +{ + namespace omp_all_memory // { dg-bogus "expected" } + { + } +} + +namespace B +{ + template <int N> + void omp_all_memory () {} // { dg-bogus "expected" } +} + +namespace C +{ + template <int N> + struct omp_all_memory {}; // { dg-bogus "expected" } +} + +namespace D +{ + template <int omp_all_memory> // { dg-bogus "expected" } + struct S {}; +} --- libgomp/libgomp.h.jj 2022-05-06 08:43:16.527059688 +0200 +++ libgomp/libgomp.h 2022-05-11 09:37:32.259180692 +0200 @@ -574,6 +574,8 @@ struct gomp_task struct gomp_dependers_vec *dependers; struct htab *depend_hash; struct gomp_taskwait *taskwait; + /* Last depend({,in}out:omp_all_memory) child if any. */ + struct gomp_task *depend_all_memory; /* Number of items in DEPEND. */ size_t depend_count; /* Number of tasks this task depends on. Once this counter reaches --- libgomp/task.c.jj 2022-05-06 08:43:16.564059180 +0200 +++ libgomp/task.c 2022-05-11 18:23:12.939939207 +0200 @@ -80,6 +80,7 @@ gomp_init_task (struct gomp_task *task, task->dependers = NULL; task->depend_hash = NULL; task->taskwait = NULL; + task->depend_all_memory = NULL; task->depend_count = 0; task->completion_sem = NULL; task->deferred_p = false; @@ -171,6 +172,7 @@ gomp_task_handle_depend (struct gomp_tas size_t ndepend = (uintptr_t) depend[0]; size_t i; hash_entry_type ent; + bool all_memory = false; if (ndepend) { @@ -181,6 +183,7 @@ gomp_task_handle_depend (struct gomp_tas { task->depend[i].addr = depend[2 + i]; task->depend[i].is_in = i >= nout; + all_memory |= i < nout && depend[2 + i] == NULL; } } else @@ -201,6 +204,8 @@ gomp_task_handle_depend (struct gomp_tas { case GOMP_DEPEND_OUT: case GOMP_DEPEND_INOUT: + all_memory |= d[0] == NULL; + break; case GOMP_DEPEND_MUTEXINOUTSET: break; case GOMP_DEPEND_IN: @@ -226,8 +231,126 @@ gomp_task_handle_depend (struct gomp_tas task->depend[n++].is_in = 1; } } - task->depend_count = ndepend; task->num_dependees = 0; + if (__builtin_expect (parent->depend_all_memory && ndepend, false)) + { + struct gomp_task *tsk = parent->depend_all_memory; + if (tsk->dependers == NULL) + { + tsk->dependers + = gomp_malloc (sizeof (struct gomp_dependers_vec) + + 6 * sizeof (struct gomp_task *)); + tsk->dependers->n_elem = 1; + tsk->dependers->allocated = 6; + tsk->dependers->elem[0] = task; + } + else + { + if (tsk->dependers->n_elem == tsk->dependers->allocated) + { + tsk->dependers->allocated + = tsk->dependers->allocated * 2 + 2; + tsk->dependers + = gomp_realloc (tsk->dependers, + sizeof (struct gomp_dependers_vec) + + (tsk->dependers->allocated + * sizeof (struct gomp_task *))); + } + tsk->dependers->elem[tsk->dependers->n_elem++] = task; + } + task->num_dependees++; + } + if (__builtin_expect (all_memory, false)) + { + /* A task with depend(inout: omp_all_memory) depends on all previous + sibling tasks which have any dependencies and all later sibling + tasks which have any dependencies depend on it. */ + task->depend_count = 1; + task->depend[0].addr = NULL; + task->depend[0].next = NULL; + task->depend[0].prev = NULL; + task->depend[0].task = task; + task->depend[0].redundant = true; + task->depend[0].redundant_out = false; + if (parent->depend_hash) + { + /* Inlined htab_traverse + htab_clear. All newer siblings can + just depend on this task. Add dependencies on all previous + sibling tasks with dependencies and make them redundant and + clear the hash table. */ + hash_entry_type *slot = &parent->depend_hash->entries[0]; + hash_entry_type *end = slot + htab_size (parent->depend_hash); + for (; slot != end; ++slot) + { + if (*slot == HTAB_EMPTY_ENTRY) + continue; + if (*slot != HTAB_DELETED_ENTRY) + { + for (ent = *slot; ent; ent = ent->next) + { + struct gomp_task *tsk = ent->task; + + if (ent->redundant_out) + break; + + ent->redundant = true; + if (tsk->dependers == NULL) + { + tsk->dependers + = gomp_malloc (sizeof (struct gomp_dependers_vec) + + 6 * sizeof (struct gomp_task *)); + tsk->dependers->n_elem = 1; + tsk->dependers->allocated = 6; + tsk->dependers->elem[0] = task; + task->num_dependees++; + continue; + } + /* We already have some other dependency on tsk from + earlier depend clause. */ + else if (tsk->dependers->n_elem + && (tsk->dependers->elem[tsk->dependers->n_elem + - 1] == task)) + continue; + else if (tsk->dependers->n_elem + == tsk->dependers->allocated) + { + tsk->dependers->allocated + = tsk->dependers->allocated * 2 + 2; + tsk->dependers + = gomp_realloc (tsk->dependers, + sizeof (struct gomp_dependers_vec) + + (tsk->dependers->allocated + * sizeof (struct gomp_task *))); + } + tsk->dependers->elem[tsk->dependers->n_elem++] = task; + task->num_dependees++; + } + while (ent) + { + ent->redundant = true; + ent = ent->next; + } + } + *slot = HTAB_EMPTY_ENTRY; + } + if (htab_size (parent->depend_hash) <= 32) + { + parent->depend_hash->n_elements = 0; + parent->depend_hash->n_deleted = 0; + } + else + { + /* Shrink the hash table if it would be too large. + We don't want to walk e.g. megabytes of empty hash + table for every depend(inout: omp_all_memory). */ + free (parent->depend_hash); + parent->depend_hash = htab_create (12); + } + } + parent->depend_all_memory = task; + return; + } + task->depend_count = ndepend; if (parent->depend_hash == NULL) parent->depend_hash = htab_create (2 * ndepend > 12 ? 2 * ndepend : 12); for (i = 0; i < ndepend; i++) @@ -1175,6 +1298,8 @@ gomp_task_run_post_handle_depend_hash (s struct gomp_task *parent = child_task->parent; size_t i; + if (parent->depend_all_memory == child_task) + parent->depend_all_memory = NULL; for (i = 0; i < child_task->depend_count; i++) if (!child_task->depend[i].redundant) { @@ -1738,6 +1863,17 @@ gomp_task_maybe_wait_for_dependencies (v n = 5; } gomp_mutex_lock (&team->task_lock); + if (__builtin_expect (task->depend_all_memory && ndepend, false)) + { + struct gomp_task *tsk = task->depend_all_memory; + if (!tsk->parent_depends_on) + { + tsk->parent_depends_on = true; + ++num_awaited; + if (tsk->num_dependees == 0 && tsk->kind == GOMP_TASK_WAITING) + priority_queue_upgrade_task (tsk, task); + } + } for (i = 0; i < ndepend; i++) { elem.addr = depend[i + n]; @@ -1760,6 +1896,36 @@ gomp_task_maybe_wait_for_dependencies (v } elem.addr = d[0]; } + if (__builtin_expect (elem.addr == NULL && !elem.is_in, false)) + { + size_t size = htab_size (task->depend_hash); + if (htab_elements (task->depend_hash) * 8 < size && size > 32) + htab_expand (task->depend_hash); + + /* depend(inout: omp_all_memory) - depend on all previous + sibling tasks that do have dependencies. Inlined + htab_traverse. */ + hash_entry_type *slot = &task->depend_hash->entries[0]; + hash_entry_type *end = slot + htab_size (task->depend_hash); + for (; slot != end; ++slot) + { + if (*slot == HTAB_EMPTY_ENTRY || *slot == HTAB_DELETED_ENTRY) + continue; + for (ent = *slot; ent; ent = ent->next) + { + struct gomp_task *tsk = ent->task; + if (!tsk->parent_depends_on) + { + tsk->parent_depends_on = true; + ++num_awaited; + if (tsk->num_dependees == 0 + && tsk->kind == GOMP_TASK_WAITING) + priority_queue_upgrade_task (tsk, task); + } + } + } + break; + } ent = htab_find (task->depend_hash, &elem); for (; ent; ent = ent->next) if (elem.is_in && ent->is_in) --- libgomp/testsuite/libgomp.c-c++-common/depend-1.c.jj 2022-05-11 18:33:35.192808599 +0200 +++ libgomp/testsuite/libgomp.c-c++-common/depend-1.c 2022-05-11 18:31:46.649226878 +0200 @@ -0,0 +1,110 @@ +#include <stdlib.h> +#include <unistd.h> + +void +test (int ifval) +{ + int a[8], b[8], i; + for (i = 0; i < 8; i++) + { + a[i] = i; + b[i] = 2 * i; + } + #pragma omp parallel + #pragma omp single + { + #pragma omp task shared(a) depend(in: a[0]) + { + usleep (5000); + a[0] = 42; + } + #pragma omp task shared(a) depend(out: a[1]) + { + usleep (5000); + a[1] = 43; + } + #pragma omp task shared(a) depend(inout: a[2]) + { + usleep (5000); + a[2] = 44; + } + #pragma omp task shared(a) depend(mutexinoutset: a[3]) + { + usleep (5000); + a[3] = 45; + } + #pragma omp task shared(a) + { + usleep (15000); + a[4] = 46; + } + #pragma omp task shared(b) depend(in: b[0]) + { + usleep (5000); + b[0] = 47; + } + #pragma omp task shared(b) depend(in: b[4]) + { + usleep (5000); + b[4] = 48; + } + /* None of the above tasks depend on each other. + The following task depends on all but the a[4] = 46; one. */ + #pragma omp task shared(a, b) depend(out: omp_all_memory) private(i) if(ifval) + { + if (a[0] != 42 || a[1] != 43 || a[2] != 44 || a[3] != 45 + || a[5] != 5 || a[6] != 6 || a[7] != 7 + || b[0] != 47 || b[1] != 2 || b[2] != 4 || b[3] != 6 + || b[4] != 48 || b[5] != 10 || b[6] != 12 || b[7] != 14) + abort (); + for (i = 0; i < 8; ++i) + if (i != 4) + a[i] = 3 * i + 7; + for (i = 0; i < 8; ++i) + b[i] = 4 * i - 7; + } + /* The following task depends on both b[0] = 47; and + above omp_all_memory tasks, but as the latter depends on + the former, effectively it is dependent just on the omp_all_memory + task. */ + #pragma omp task shared(b) depend(inout: b[0]) + { + usleep (5000); + b[0] = 49; + } + /* The following task depends on all the above except a[4] = 46; one, + but it can be reduced to dependency on the above omp_all_memory + one and b[0] = 49; one. */ + #pragma omp task shared(a, b) depend(inout: b[7], omp_all_memory, b[6]) \ + private(i) if(ifval) + { + for (i = 0; i < 8; ++i) + if (i != 4) + { + if (a[i] != 3 * i + 7) + abort (); + a[i] = 5 * i + 50; + } + if (b[0] != 49) + abort (); + b[0] = 6 * i + 57; + for (i = 1; i < 8; ++i) + { + if (b[i] != 4 * i - 7) + abort (); + b[i] = 6 * i + 57; + } + } + #pragma omp taskwait + if (a[4] != 46) + abort (); + } +} + +int +main () +{ + test (1); + test (0); + return 0; +} --- libgomp/testsuite/libgomp.c-c++-common/depend-2.c.jj 2022-05-11 18:33:38.220769039 +0200 +++ libgomp/testsuite/libgomp.c-c++-common/depend-2.c 2022-05-11 18:42:21.406932767 +0200 @@ -0,0 +1,116 @@ +#include <omp.h> +#include <stdlib.h> +#include <unistd.h> + +void +test (int ifval) +{ + int a[8], b[8], i; + omp_depend_t d1, d2; + #pragma omp depobj (d1) depend(inout: omp_all_memory) + #pragma omp depobj (d2) depend(out: omp_all_memory) + for (i = 0; i < 8; i++) + { + a[i] = i; + b[i] = 2 * i; + } + #pragma omp parallel + #pragma omp single + { + #pragma omp task shared(a) depend(in: a[0]) + { + usleep (5000); + a[0] = 42; + } + #pragma omp task shared(a) depend(out: a[1]) + { + usleep (5000); + a[1] = 43; + } + #pragma omp task shared(a) depend(inout: a[2]) + { + usleep (5000); + a[2] = 44; + } + #pragma omp task shared(a) depend(mutexinoutset: a[3]) + { + usleep (5000); + a[3] = 45; + } + #pragma omp task shared(a) + { + usleep (15000); + a[4] = 46; + } + #pragma omp task shared(b) depend(in: b[0]) + { + usleep (5000); + b[0] = 47; + } + #pragma omp task shared(b) depend(in: b[4]) + { + usleep (5000); + b[4] = 48; + } + /* None of the above tasks depend on each other. + The following task depends on all but the a[4] = 46; one. */ + #pragma omp task shared(a, b) depend(depobj: d1) private(i) if(ifval) + { + if (a[0] != 42 || a[1] != 43 || a[2] != 44 || a[3] != 45 + || a[5] != 5 || a[6] != 6 || a[7] != 7 + || b[0] != 47 || b[1] != 2 || b[2] != 4 || b[3] != 6 + || b[4] != 48 || b[5] != 10 || b[6] != 12 || b[7] != 14) + abort (); + for (i = 0; i < 8; ++i) + if (i != 4) + a[i] = 3 * i + 7; + for (i = 0; i < 8; ++i) + b[i] = 4 * i - 7; + } + /* The following task depends on both b[0] = 47; and + above omp_all_memory tasks, but as the latter depends on + the former, effectively it is dependent just on the omp_all_memory + task. */ + #pragma omp task shared(b) depend(inout: b[0]) + { + usleep (5000); + b[0] = 49; + } + /* The following task depends on all the above except a[4] = 46; one, + but it can be reduced to dependency on the above omp_all_memory + one and b[0] = 49; one. */ + #pragma omp task shared(a, b) depend(inout: b[6]) depend(depobj: d2) \ + depend(out: b[7]) private(i) if(ifval) + { + for (i = 0; i < 8; ++i) + if (i != 4) + { + if (a[i] != 3 * i + 7) + abort (); + a[i] = 5 * i + 50; + } + if (b[0] != 49) + abort (); + b[0] = 6 * i + 57; + for (i = 1; i < 8; ++i) + { + if (b[i] != 4 * i - 7) + abort (); + b[i] = 6 * i + 57; + } + } + #pragma omp taskwait + if (a[4] != 46) + abort (); + } + #pragma omp depobj (d2) destroy + #pragma omp depobj (d1) destroy +} + +int +main () +{ + test (1); + test (0); + return 0; +} --- libgomp/testsuite/libgomp.c-c++-common/depend-3.c.jj 2022-05-11 18:37:06.347049578 +0200 +++ libgomp/testsuite/libgomp.c-c++-common/depend-3.c 2022-05-11 18:38:48.789710985 +0200 @@ -0,0 +1,103 @@ +#include <stdlib.h> +#include <unistd.h> + +int +main () +{ + int a[8], b[8], i; + for (i = 0; i < 8; i++) + { + a[i] = i; + b[i] = 2 * i; + } + #pragma omp parallel + #pragma omp single + { + #pragma omp task shared(a) depend(in: a[0]) + { + usleep (5000); + a[0] = 42; + } + #pragma omp task shared(a) depend(out: a[1]) + { + usleep (5000); + a[1] = 43; + } + #pragma omp task shared(a) depend(inout: a[2]) + { + usleep (5000); + a[2] = 44; + } + #pragma omp task shared(a) depend(mutexinoutset: a[3]) + { + usleep (5000); + a[3] = 45; + } + #pragma omp task shared(a) + { + usleep (15000); + a[4] = 46; + } + #pragma omp task shared(b) depend(in: b[0]) + { + usleep (5000); + b[0] = 47; + } + #pragma omp task shared(b) depend(in: b[4]) + { + usleep (5000); + b[4] = 48; + } + /* None of the above tasks depend on each other. + The following task depends on all but the a[4] = 46; one. */ + #pragma omp task shared(a, b) depend(iterator (j=0:7), inout: omp_all_memory) private(i) + { + if (a[0] != 42 || a[1] != 43 || a[2] != 44 || a[3] != 45 + || a[5] != 5 || a[6] != 6 || a[7] != 7 + || b[0] != 47 || b[1] != 2 || b[2] != 4 || b[3] != 6 + || b[4] != 48 || b[5] != 10 || b[6] != 12 || b[7] != 14) + abort (); + for (i = 0; i < 8; ++i) + if (i != 4) + a[i] = 3 * i + 7; + for (i = 0; i < 8; ++i) + b[i] = 4 * i - 7; + } + /* The following task depends on both b[0] = 47; and + above omp_all_memory tasks, but as the latter depends on + the former, effectively it is dependent just on the omp_all_memory + task. */ + #pragma omp task shared(b) depend(inout: b[0]) + { + usleep (5000); + b[0] = 49; + } + /* The following task depends on all the above except a[4] = 46; one, + but it can be reduced to dependency on the above omp_all_memory + one and b[0] = 49; one. */ + #pragma omp task shared(a, b) depend(inout: b[7]) depend(iterator(j=4:5), out: omp_all_memory) \ + depend(inout: b[6]) private(i) + { + for (i = 0; i < 8; ++i) + if (i != 4) + { + if (a[i] != 3 * i + 7) + abort (); + a[i] = 5 * i + 50; + } + if (b[0] != 49) + abort (); + b[0] = 6 * i + 57; + for (i = 1; i < 8; ++i) + { + if (b[i] != 4 * i - 7) + abort (); + b[i] = 6 * i + 57; + } + } + #pragma omp taskwait + if (a[4] != 46) + abort (); + } + return 0; +} Jakub