Use the counted_by atribute info in builtin object size to compute the subobject size for flexible array members.
gcc/ChangeLog: PR C/108896 * tree-object-size.cc (addr_object_size): Use the counted_by attribute info. * tree.cc (component_ref_has_counted_by_p): New function. (component_ref_get_counted_by): New function. * tree.h (component_ref_has_counted_by_p): New prototype. (component_ref_get_counted_by): New prototype. gcc/testsuite/ChangeLog: PR C/108896 * gcc.dg/flex-array-counted-by-2.c: New test. * gcc.dg/flex-array-counted-by-3.c: New test. --- .../gcc.dg/flex-array-counted-by-2.c | 74 ++++++ .../gcc.dg/flex-array-counted-by-3.c | 210 ++++++++++++++++++ gcc/tree-object-size.cc | 37 ++- gcc/tree.cc | 95 +++++++- gcc/tree.h | 10 + 5 files changed, 418 insertions(+), 8 deletions(-) create mode 100644 gcc/testsuite/gcc.dg/flex-array-counted-by-2.c create mode 100644 gcc/testsuite/gcc.dg/flex-array-counted-by-3.c diff --git a/gcc/testsuite/gcc.dg/flex-array-counted-by-2.c b/gcc/testsuite/gcc.dg/flex-array-counted-by-2.c new file mode 100644 index 000000000000..ec580c1f1f01 --- /dev/null +++ b/gcc/testsuite/gcc.dg/flex-array-counted-by-2.c @@ -0,0 +1,74 @@ +/* test the attribute counted_by and its usage in + * __builtin_dynamic_object_size. */ +/* { dg-do run } */ +/* { dg-options "-O2" } */ + +#include "builtin-object-size-common.h" + +#define expect(p, _v) do { \ + size_t v = _v; \ + if (p == v) \ + __builtin_printf ("ok: %s == %zd\n", #p, p); \ + else \ + { \ + __builtin_printf ("WAT: %s == %zd (expected %zd)\n", #p, p, v); \ + FAIL (); \ + } \ +} while (0); + +struct flex { + int b; + int c[]; +} *array_flex; + +struct annotated { + int b; + int c[] __attribute__ ((counted_by (b))); +} *array_annotated; + +struct nested_annotated { + struct { + union { + int b; + float f; + }; + int n; + }; + int c[] __attribute__ ((counted_by (b))); +} *array_nested_annotated; + +void __attribute__((__noinline__)) setup (int normal_count, int attr_count) +{ + array_flex + = (struct flex *)malloc (sizeof (struct flex) + + normal_count * sizeof (int)); + array_flex->b = normal_count; + + array_annotated + = (struct annotated *)malloc (sizeof (struct annotated) + + attr_count * sizeof (int)); + array_annotated->b = attr_count; + + array_nested_annotated + = (struct nested_annotated *)malloc (sizeof (struct nested_annotated) + + attr_count * sizeof (int)); + array_nested_annotated->b = attr_count; + + return; +} + +void __attribute__((__noinline__)) test () +{ + expect(__builtin_dynamic_object_size(array_flex->c, 1), -1); + expect(__builtin_dynamic_object_size(array_annotated->c, 1), + array_annotated->b * sizeof (int)); + expect(__builtin_dynamic_object_size(array_nested_annotated->c, 1), + array_nested_annotated->b * sizeof (int)); +} + +int main(int argc, char *argv[]) +{ + setup (10,10); + test (); + DONE (); +} diff --git a/gcc/testsuite/gcc.dg/flex-array-counted-by-3.c b/gcc/testsuite/gcc.dg/flex-array-counted-by-3.c new file mode 100644 index 000000000000..a0c3cb88ec71 --- /dev/null +++ b/gcc/testsuite/gcc.dg/flex-array-counted-by-3.c @@ -0,0 +1,210 @@ +/* test the attribute counted_by and its usage in +__builtin_dynamic_object_size: what's the correct behavior when the +allocation size mismatched with the value of counted_by attribute? */ +/* { dg-do run } */ +/* { dg-options "-O -fstrict-flex-arrays=3" } */ + +#include "builtin-object-size-common.h" + +struct annotated { + size_t foo; + char others; + char array[] __attribute__((counted_by (foo))); +}; + +#define expect(p, _v) do { \ + size_t v = _v; \ + if (p == v) \ + __builtin_printf ("ok: %s == %zd\n", #p, p); \ + else \ + { \ + __builtin_printf ("WAT: %s == %zd (expected %zd)\n", #p, p, v); \ + FAIL (); \ + } \ +} while (0); + +#define noinline __attribute__((__noinline__)) +#define SIZE_BUMP 10 +#define MAX(a, b) ((a) > (b) ? (a) : (b)) +#define MIN(a, b) ((a) < (b) ? (a) : (b)) + +/* In general, Due to type casting, the type for the pointee of a pointer + does not say anything about the object it points to, + So, __builtin_object_size can not directly use the type of the pointee + to decide the size of the object the pointer points to. + + there are only two reliable ways: + A. observed allocations (call to the allocation functions in the routine) + B. observed accesses (read or write access to the location of the + pointer points to) + + that provide information about the type/existence of an object at + the corresponding address. + + for A, we use the "alloc_size" attribute for the corresponding allocation + functions to determine the object size; + + For B, we use the SIZE info of the TYPE attached to the corresponding access. + (We treat counted_by attribute as a complement to the SIZE info of the TYPE + for FMA) + + The only other way in C which ensures that a pointer actually points + to an object of the correct type is 'static': + + void foo(struct P *p[static 1]); + + See https://gcc.gnu.org/pipermail/gcc-patches/2023-July/624814.html + for more details. */ + +/* in the following function, malloc allocated more space than the value + of counted_by attribute. Then what's the correct behavior we expect + the __builtin_dynamic_object_size should have for each of the cases? */ + +static struct annotated * noinline alloc_buf_more (size_t index) +{ + struct annotated *p; + size_t allocated_size + = MAX (sizeof (struct annotated), + (__builtin_offsetof (struct annotated, array[0]) + + (index + SIZE_BUMP) * sizeof (char))); + p = (struct annotated *) malloc (allocated_size); + + p->foo = index; + + /*when checking the observed access p->array, we have info on both + observered allocation and observed access, + A. from observed allocation: + allocated_size - offsetof (struct annotated, array[0]) + B. from observed access: p->foo * sizeof (char) + */ + + /* for size in the whole object: always uses A. */ + /* for size in the sub-object: chose the smaller of A and B. + * Please see https://gcc.gnu.org/pipermail/gcc-patches/2023-July/625891.html + * for details on why. */ + + /* for MAXIMUM size in the whole object: use the allocation size + for the whole object. */ + expect(__builtin_dynamic_object_size(p->array, 0), + allocated_size - __builtin_offsetof (struct annotated, array[0])); + + /* for MAXIMUM size in the sub-object. use the smaller of A and B. */ + expect(__builtin_dynamic_object_size(p->array, 1), + MIN (allocated_size - __builtin_offsetof (struct annotated, array[0]), + (p->foo) * sizeof(char))); + + /* for MINIMUM size in the whole object: use the allocation size + for the whole object. */ + expect(__builtin_dynamic_object_size(p->array, 2), + allocated_size - __builtin_offsetof (struct annotated, array[0])); + + /* for MINIMUM size in the sub-object: use the smaller of A and B. */ + expect(__builtin_dynamic_object_size(p->array, 3), + MIN (allocated_size - __builtin_offsetof (struct annotated, array[0]), + (p->foo) * sizeof(char))); + + /*when checking the pointer p, we only have info on the observed allocation. + So, the object size info can only been obtained from the call to malloc. + for both MAXIMUM and MINIMUM: A = (index + SIZE_BUMP) * sizeof (char) */ + expect(__builtin_dynamic_object_size(p, 0), allocated_size); + expect(__builtin_dynamic_object_size(p, 1), allocated_size); + expect(__builtin_dynamic_object_size(p, 2), allocated_size); + expect(__builtin_dynamic_object_size(p, 3), allocated_size); + return p; +} + +/* in the following function, malloc allocated less space than the value + of counted_by attribute. Then what's the correct behavior we expect + the __builtin_dynamic_object_size should have for each of the cases? + NOTE: this is an user error, GCC should issue warnings for such case. + this is a seperate issue we should address later. */ + +static struct annotated * noinline alloc_buf_less (size_t index) +{ + struct annotated *p; + size_t allocated_size + = MAX (sizeof (struct annotated), + (__builtin_offsetof (struct annotated, array[0]) + + (index) * sizeof (char))); + p = (struct annotated *) malloc (allocated_size); + + p->foo = index + SIZE_BUMP; + + /*when checking the observed access p->array, we have info on both + observered allocation and observed access, + A. from observed allocation: + allocated_size - offsetof (struct annotated, array[0]) + B. from observed access: p->foo * sizeof (char) + */ + + /* for size in the whole object: always uses A. */ + /* for size in the sub-object: chose the smaller of A and B. + * Please see https://gcc.gnu.org/pipermail/gcc-patches/2023-July/625891.html + * for details on why. */ + + /* for MAXIMUM size in the whole object: use the allocation size + for the whole object. */ + expect(__builtin_dynamic_object_size(p->array, 0), + allocated_size - __builtin_offsetof (struct annotated, array[0])); + + /* for MAXIMUM size in the sub-object. use the smaller of A and B. */ + expect(__builtin_dynamic_object_size(p->array, 1), + MIN (allocated_size - __builtin_offsetof (struct annotated, array[0]), + (p->foo) * sizeof(char))); + + /* for MINIMUM size in the whole object: use the allocation size + for the whole object. */ + expect(__builtin_dynamic_object_size(p->array, 2), + allocated_size - __builtin_offsetof (struct annotated, array[0])); + + /* for MINIMUM size in the sub-object: use the smaller of A and B. */ + expect(__builtin_dynamic_object_size(p->array, 3), + MIN (allocated_size - __builtin_offsetof (struct annotated, array[0]), + (p->foo) * sizeof(char))); + + /*when checking the pointer p, we only have info on the observed + allocation. So, the object size info can only been obtained from + the call to malloc. */ + expect(__builtin_dynamic_object_size(p, 0), allocated_size); + expect(__builtin_dynamic_object_size(p, 1), allocated_size); + expect(__builtin_dynamic_object_size(p, 2), allocated_size); + expect(__builtin_dynamic_object_size(p, 3), allocated_size); + return p; +} + +int main () +{ + struct annotated *p, *q; + p = alloc_buf_more (10); + q = alloc_buf_less (10); + + /*when checking the observed access p->array, we only have info on the + observed access, i.e, the TYPE_SIZE info from the access. We don't have + info on the whole object. */ + expect(__builtin_dynamic_object_size(p->array, 0), -1); + expect(__builtin_dynamic_object_size(p->array, 1), p->foo * sizeof(char)); + expect(__builtin_dynamic_object_size(p->array, 2), 0); + expect(__builtin_dynamic_object_size(p->array, 3), p->foo * sizeof(char)); + /*when checking the pointer p, we have no observed allocation nor observed + access, therefore, we cannot determine the size info here. */ + expect(__builtin_dynamic_object_size(p, 0), -1); + expect(__builtin_dynamic_object_size(p, 1), -1); + expect(__builtin_dynamic_object_size(p, 2), 0); + expect(__builtin_dynamic_object_size(p, 3), 0); + + /*when checking the observed access p->array, we only have info on the + observed access, i.e, the TYPE_SIZE info from the access. We don't have + info on the whole object. */ + expect(__builtin_dynamic_object_size(q->array, 0), -1); + expect(__builtin_dynamic_object_size(q->array, 1), q->foo * sizeof(char)); + expect(__builtin_dynamic_object_size(q->array, 2), 0); + expect(__builtin_dynamic_object_size(q->array, 3), q->foo * sizeof(char)); + /*when checking the pointer p, we have no observed allocation nor observed + access, therefore, we cannot determine the size info here. */ + expect(__builtin_dynamic_object_size(q, 0), -1); + expect(__builtin_dynamic_object_size(q, 1), -1); + expect(__builtin_dynamic_object_size(q, 2), 0); + expect(__builtin_dynamic_object_size(q, 3), 0); + + DONE (); +} diff --git a/gcc/tree-object-size.cc b/gcc/tree-object-size.cc index a62af0500563..cf7843c5684b 100644 --- a/gcc/tree-object-size.cc +++ b/gcc/tree-object-size.cc @@ -585,6 +585,7 @@ addr_object_size (struct object_size_info *osi, const_tree ptr, if (pt_var != TREE_OPERAND (ptr, 0)) { tree var; + tree counted_by_ref = NULL_TREE; if (object_size_type & OST_SUBOBJECT) { @@ -600,11 +601,12 @@ addr_object_size (struct object_size_info *osi, const_tree ptr, var = TREE_OPERAND (var, 0); if (var != pt_var && TREE_CODE (var) == ARRAY_REF) var = TREE_OPERAND (var, 0); - if (! TYPE_SIZE_UNIT (TREE_TYPE (var)) + if (! component_ref_has_counted_by_p (var) + && ((! TYPE_SIZE_UNIT (TREE_TYPE (var)) || ! tree_fits_uhwi_p (TYPE_SIZE_UNIT (TREE_TYPE (var))) || (pt_var_size && TREE_CODE (pt_var_size) == INTEGER_CST && tree_int_cst_lt (pt_var_size, - TYPE_SIZE_UNIT (TREE_TYPE (var))))) + TYPE_SIZE_UNIT (TREE_TYPE (var))))))) var = pt_var; else if (var != pt_var && TREE_CODE (pt_var) == MEM_REF) { @@ -612,6 +614,7 @@ addr_object_size (struct object_size_info *osi, const_tree ptr, /* For &X->fld, compute object size if fld isn't a flexible array member. */ bool is_flexible_array_mem_ref = false; + while (v && v != pt_var) switch (TREE_CODE (v)) { @@ -660,6 +663,8 @@ addr_object_size (struct object_size_info *osi, const_tree ptr, /* Now the ref is to an array type. */ gcc_assert (TREE_CODE (TREE_TYPE (v)) == ARRAY_TYPE); is_flexible_array_mem_ref = array_ref_flexible_size_p (v); + counted_by_ref = component_ref_get_counted_by (v); + while (v != pt_var && TREE_CODE (v) == COMPONENT_REF) if (TREE_CODE (TREE_TYPE (TREE_OPERAND (v, 0))) != UNION_TYPE @@ -673,8 +678,11 @@ addr_object_size (struct object_size_info *osi, const_tree ptr, == RECORD_TYPE) { /* compute object size only if v is not a - flexible array member. */ - if (!is_flexible_array_mem_ref) + flexible array member or the flexible array member + has a known element count indicated by the user + through attribute counted_by. */ + if (!is_flexible_array_mem_ref + || counted_by_ref) { v = NULL_TREE; break; @@ -707,9 +715,24 @@ addr_object_size (struct object_size_info *osi, const_tree ptr, if (var != pt_var) { - var_size = TYPE_SIZE_UNIT (TREE_TYPE (var)); - if (!TREE_CONSTANT (var_size)) - var_size = get_or_create_ssa_default_def (cfun, var_size); + if (!counted_by_ref) + { + var_size = TYPE_SIZE_UNIT (TREE_TYPE (var)); + if (!TREE_CONSTANT (var_size)) + var_size = get_or_create_ssa_default_def (cfun, var_size); + } + else + { + gcc_assert (TREE_CODE (var) == COMPONENT_REF + && TREE_CODE (TREE_TYPE (var)) == ARRAY_TYPE); + tree element_size = TYPE_SIZE_UNIT (TREE_TYPE (TREE_TYPE (var))); + var_size + = size_binop (MULT_EXPR, + fold_convert (sizetype, counted_by_ref), + fold_convert (sizetype, element_size)); + if (!todo) + todo = TODO_update_ssa_only_virtuals; + } if (!var_size) return false; } diff --git a/gcc/tree.cc b/gcc/tree.cc index fcd36ae0cd74..3b6ddcbdcbf8 100644 --- a/gcc/tree.cc +++ b/gcc/tree.cc @@ -12745,6 +12745,32 @@ array_ref_element_size (tree exp) return SUBSTITUTE_PLACEHOLDER_IN_EXPR (TYPE_SIZE_UNIT (elmt_type), exp); } +/* For a component_ref that has an array type ARRAY_REF, return TRUE when + an counted_by attribute attached to the corresponding FIELD_DECL. + return FALSE otherwise. */ +bool +component_ref_has_counted_by_p (tree array_ref) +{ + if (TREE_CODE (array_ref) != COMPONENT_REF) + return false; + + if (TREE_CODE (TREE_TYPE (array_ref)) != ARRAY_TYPE) + return false; + + tree struct_object = TREE_OPERAND (array_ref, 0); + tree struct_type = TREE_TYPE (struct_object); + + if (!RECORD_OR_UNION_TYPE_P (struct_type)) + return false; + tree field_decl = TREE_OPERAND (array_ref, 1); + tree attr_counted_by = lookup_attribute ("counted_by", + DECL_ATTRIBUTES (field_decl)); + + if (!attr_counted_by) + return false; + return true; +} + /* Given a field list, FIELDLIST, of a structure/union, return a TREE_LIST, with each TREE_VALUE a FIELD_DECL stepping down the chain to the FIELD whose name is FIELDNAME, which is the last TREE_VALUE of the list. @@ -12771,7 +12797,7 @@ get_named_field (tree fieldlist, const char *fieldname) fields inside it recursively. */ else if (RECORD_OR_UNION_TYPE_P (TREE_TYPE (field))) if ((named_field = get_named_field (TYPE_FIELDS (TREE_TYPE (field)), - fieldname)) != NULL_TREE) + fieldname)) != NULL_TREE) { named_field = tree_cons (NULL_TREE, field, named_field); break; @@ -12784,6 +12810,73 @@ get_named_field (tree fieldlist, const char *fieldname) return named_field; } +/* For a component_ref that has an array type ARRAY_REF, get the object that + represents its counted_by per the attribute counted_by attached to + the corresponding FIELD_DECL. return NULL_TREE when cannot find such + object. + For example, if: + + struct P { + int k; + int x[] __attribute__ ((counted_by (k))); + } *p; + + for the following reference: + + p->x[b] + + the object that represents its element count will be: + + p->k + + So, when component_ref_get_counted_by (p->x[b]) is called, p->k should be + returned. +*/ + +tree +component_ref_get_counted_by (tree array_ref) +{ + if (! component_ref_has_counted_by_p (array_ref)) + return NULL_TREE; + + tree struct_object = TREE_OPERAND (array_ref, 0); + tree struct_type = TREE_TYPE (struct_object); + tree field_decl = TREE_OPERAND (array_ref, 1); + tree attr_counted_by = lookup_attribute ("counted_by", + DECL_ATTRIBUTES (field_decl)); + gcc_assert (attr_counted_by); + + /* If there is an counted_by attribute attached to the field, + get the field that maps to the counted_by. */ + + const char *fieldname + = IDENTIFIER_POINTER (TREE_VALUE (TREE_VALUE (attr_counted_by))); + + tree counted_by_field = get_named_field (TYPE_FIELDS (struct_type), + fieldname); + + gcc_assert (counted_by_field); + + /* generate the tree node that represent the counted_by of this array + ref. This is a (possible nested) COMPONENT_REF to the counted_by_field + of the containing structure. */ + + tree counted_by_ref = NULL_TREE; + tree object = struct_object; + do + { + tree field = TREE_VALUE (counted_by_field); + + counted_by_ref = build3 (COMPONENT_REF, + TREE_TYPE (field), + unshare_expr (object), field, + NULL_TREE); + object = counted_by_ref; + counted_by_field = TREE_CHAIN (counted_by_field); + } + while (counted_by_field); + return counted_by_ref; +} /* Return a tree representing the lower bound of the array mentioned in EXP, an ARRAY_REF or an ARRAY_RANGE_REF. */ diff --git a/gcc/tree.h b/gcc/tree.h index 4859becaa1e7..07eed7219835 100644 --- a/gcc/tree.h +++ b/gcc/tree.h @@ -5619,11 +5619,21 @@ extern tree get_base_address (tree t); of EXP, an ARRAY_REF or an ARRAY_RANGE_REF. */ extern tree array_ref_element_size (tree); +/* Give a component_ref that has an array type, return true when an + attribute counted_by attached to the corresponding FIELD_DECL. */ +extern bool component_ref_has_counted_by_p (tree); + /* Given a field list, FIELDLIST, of a structure/union, return the FIELD whose name is FIELDNAME, return NULL_TREE if such field is not found. searching nested anonymous structure/union recursively. */ extern tree get_named_field (tree, const char *); +/* Give a component_ref that has an array type, return the object that + represents its counted_by per the attribute counted_by attached to + the corresponding FIELD_DECL. return NULL_TREE when cannot find such + object. */ +extern tree component_ref_get_counted_by (tree); + /* Return a typenode for the "standard" C type with a given name. */ extern tree get_typenode_from_name (const char *); -- 2.31.1