The patch fixes the following 2 issues: .MASK_STORE_LANES (&a, 4B, max_mask_34, vect_array.12);
here we fail to return the last argument as the stored value. ivtmp_32 = ivtmp_31 + POLY_INT_CST [4, 4]; here we are missing a bail-out in vect_recog_over_widening_pattern. gcc/ChangeLog: PR tree-optimization/97079 * internal-fn.c (internal_fn_stored_value_index): Handle also .MASK_STORE_LANES. * tree-vect-patterns.c (vect_recog_over_widening_pattern): Bail out for POLY_INT_CST. gcc/testsuite/ChangeLog: PR tree-optimization/97079 * gcc.target/aarch64/sve/pr97079.c: New test. I'm running the tests on x86_64-linux-gnu, and I would appreciate it if someone could run them on an SVE aarch64 machine. Ready for master? Thanks, Martin --- gcc/internal-fn.c | 1 + .../gcc.target/aarch64/sve/pr97079.c | 22 +++++++++++++++++++ gcc/tree-vect-patterns.c | 2 ++ 3 files changed, 25 insertions(+) create mode 100644 gcc/testsuite/gcc.target/aarch64/sve/pr97079.c diff --git a/gcc/internal-fn.c b/gcc/internal-fn.c index 92cb3cd845a..792d2ca568a 100644 --- a/gcc/internal-fn.c +++ b/gcc/internal-fn.c @@ -3795,6 +3795,7 @@ internal_fn_stored_value_index (internal_fn fn) switch (fn) { case IFN_MASK_STORE: + case IFN_MASK_STORE_LANES: case IFN_SCATTER_STORE: case IFN_MASK_SCATTER_STORE: case IFN_LEN_STORE: diff --git a/gcc/testsuite/gcc.target/aarch64/sve/pr97079.c b/gcc/testsuite/gcc.target/aarch64/sve/pr97079.c new file mode 100644 index 00000000000..06e6a7cde94 --- /dev/null +++ b/gcc/testsuite/gcc.target/aarch64/sve/pr97079.c @@ -0,0 +1,22 @@ +/* { dg-do compile } */ +/* { dg-options "-O3 -march=armv8.2-a+sve" } */ + +void g(void); + +int a[8][3]; +int b; +void c(void) +{ + int d[] = {7, 3}; + int *e = a[0]; + int f; + b = 0; + for (; b < 8; b++) + { + f = 0; + for (; f < 3; f++) + a[b][f] = 0; + } + g(); + *e = (long)d; +} diff --git a/gcc/tree-vect-patterns.c b/gcc/tree-vect-patterns.c index 71e4e106202..6302bc42f46 100644 --- a/gcc/tree-vect-patterns.c +++ b/gcc/tree-vect-patterns.c @@ -1571,6 +1571,8 @@ vect_recog_over_widening_pattern (vec_info *vinfo, tree op = gimple_op (last_stmt, first_op + i); if (TREE_CODE 
(op) == INTEGER_CST) unprom[i].set_op (op, vect_constant_def); + else if (TREE_CODE (op) == POLY_INT_CST) + return NULL; else if (TREE_CODE (op) == SSA_NAME) { bool op_single_use_p = true; -- 2.28.0