c++: make initializer_list array static again [PR110070]

After the maybe_init_list_as_* patches, I noticed that we were putting the
array of strings into .rodata, but then memcpying it into an automatic
array, which is pointless; we should be able to use it directly.

This doesn't happen automatically because TREE_ADDRESSABLE is set (since
r12-657 for PR100464), and so gimplify_init_constructor won't promote the
variable to static.  Theoretically we could do escape analysis to recognize
that the address, though taken, never leaves the function; that would allow
promotion when we're only using the address for indexing within the
function, as in initlist-opt2.C.  But this would be a new pass.

And in initlist-opt1.C, we're passing the array address to another function,
so it definitely escapes; it's only safe in this case because it's calling a
standard library function that we know only uses it for indexing.  So, a
flag seems needed.  I first thought to put the flag on the TARGET_EXPR, but
the VAR_DECL seems more appropriate.

In a previous revision of the patch I called this flag DECL_NOT_OBSERVABLE,
but I think DECL_MERGEABLE is a better name, especially if we're going to
apply it to the backing array of initializer_list, which is observable.  I
then also check it in places that check for -fmerge-all-constants, so that
multiple equivalent initializer-lists can also be combined.  And then it
seemed to make sense for [[no_unique_address]] to have this meaning for
user-written variables.

I think the note in [dcl.init.list]/6 intended to allow this kind of merging
for initializer_lists, but it didn't actually work; for an explicit array
with the same initializer, if the address escapes the program could tell
whether the same variable in two frames have the same address.  P2752 is
trying to correct this defect, so I'm going to assume that this is the
intent.

	PR c++/110070
	PR c++/105838

gcc/ChangeLog:

	* tree.h (DECL_MERGEABLE): New.
	* tree-core.h (struct tree_decl_common): Mention it.
	* gimplify.cc (gimplify_init_constructor): Check it.
	* cgraph.cc (symtab_node::address_can_be_compared_p): Likewise.
	* varasm.cc (categorize_decl_for_section): Likewise.

gcc/cp/ChangeLog:

	* call.cc (maybe_init_list_as_array): Set DECL_MERGEABLE.
	(convert_like_internal) [ck_list]: Set it.
	(set_up_extended_ref_temp): Copy it.
	* tree.cc (handle_no_unique_addr_attribute): Set it.

gcc/testsuite/ChangeLog:

	* g++.dg/tree-ssa/initlist-opt1.C: Check for static array.
	* g++.dg/tree-ssa/initlist-opt2.C: Likewise.
	* g++.dg/tree-ssa/initlist-opt4.C: New test.
	* g++.dg/opt/icf1.C: New test.
	* g++.dg/opt/icf2.C: New test.
	* g++.dg/opt/icf3.C: New test.
	* g++.dg/tree-ssa/array-temp1.C: Revert r12-657 change.
This commit is contained in:
Jason Merrill 2022-12-07 11:40:53 -05:00
parent 99566c0c6b
commit 4d935f52b0
14 changed files with 104 additions and 8 deletions

View file

@ -158,7 +158,7 @@ symtab_node::address_can_be_compared_p ()
flag_merge_constants permits us to assume the same on readonly vars. */
if (is_a <varpool_node *> (this)
&& (DECL_IN_CONSTANT_POOL (decl)
|| (flag_merge_constants >= 2
|| ((flag_merge_constants >= 2 || DECL_MERGEABLE (decl))
&& TREE_READONLY (decl) && !TREE_THIS_VOLATILE (decl))))
return false;
return true;

View file

@ -4274,7 +4274,9 @@ maybe_init_list_as_array (tree elttype, tree init)
init_elttype = cp_build_qualified_type (init_elttype, TYPE_QUAL_CONST);
tree arr = build_array_of_n_type (init_elttype, CONSTRUCTOR_NELTS (init));
return finish_compound_literal (arr, init, tf_none);
arr = finish_compound_literal (arr, init, tf_none);
DECL_MERGEABLE (TARGET_EXPR_SLOT (arr)) = true;
return arr;
}
/* If we were going to call e.g. vector(initializer_list<string>) starting
@ -8558,6 +8560,8 @@ convert_like_internal (conversion *convs, tree expr, tree fn, int argnum,
(elttype, cp_type_quals (elttype) | TYPE_QUAL_CONST);
array = build_array_of_n_type (elttype, len);
array = finish_compound_literal (array, new_ctor, complain);
/* This is dubious now, should be blessed by P2752. */
DECL_MERGEABLE (TARGET_EXPR_SLOT (array)) = true;
/* Take the address explicitly rather than via decay_conversion
to avoid the error about taking the address of a temporary. */
array = cp_build_addr_expr (array, complain);
@ -13571,8 +13575,13 @@ set_up_extended_ref_temp (tree decl, tree expr, vec<tree, va_gc> **cleanups,
VAR. */
if (TREE_CODE (expr) != TARGET_EXPR)
expr = get_target_expr (expr);
else if (TREE_ADDRESSABLE (expr))
TREE_ADDRESSABLE (var) = 1;
else
{
if (TREE_ADDRESSABLE (expr))
TREE_ADDRESSABLE (var) = 1;
if (DECL_MERGEABLE (TARGET_EXPR_SLOT (expr)))
DECL_MERGEABLE (var) = true;
}
if (TREE_CODE (decl) == FIELD_DECL
&& extra_warnings && !warning_suppressed_p (decl))

View file

@ -5045,7 +5045,14 @@ handle_no_unique_addr_attribute (tree* node,
int /*flags*/,
bool* no_add_attrs)
{
if (TREE_CODE (*node) != FIELD_DECL)
if (TREE_CODE (*node) == VAR_DECL)
{
DECL_MERGEABLE (*node) = true;
if (pedantic)
warning (OPT_Wattributes, "%qE attribute can only be applied to "
"non-static data members", name);
}
else if (TREE_CODE (*node) != FIELD_DECL)
{
warning (OPT_Wattributes, "%qE attribute can only be applied to "
"non-static data members", name);

View file

@ -5253,7 +5253,8 @@ gimplify_init_constructor (tree *expr_p, gimple_seq *pre_p, gimple_seq *post_p,
&& TREE_READONLY (object)
&& VAR_P (object)
&& !DECL_REGISTER (object)
&& (flag_merge_constants >= 2 || !TREE_ADDRESSABLE (object))
&& (flag_merge_constants >= 2 || !TREE_ADDRESSABLE (object)
|| DECL_MERGEABLE (object))
/* For ctors that have many repeated nonzero elements
represented through RANGE_EXPRs, prefer initializing
those through runtime loops over copies of large amounts

View file

@ -0,0 +1,16 @@
// Test that -fipa-icf combines i and j.
// { dg-do run { target c++11 } }
// { dg-options -fipa-icf }
[[no_unique_address]] extern const int i[] = { 1,2,3 };
[[no_unique_address]] extern const int j[] = { 1,2,3 };
[[gnu::noipa]] void f (const void *a, const void *b)
{
if (a != b) __builtin_abort();
}
int main()
{
f (&i, &j);
}

View file

@ -0,0 +1,17 @@
// Test that -fipa-icf combines the backing arrays for a and b.
// { dg-do run { target c++11 } }
// { dg-options -fipa-icf }
#include <initializer_list>
[[gnu::noipa]] void f (const void *a, const void *b)
{
if (a != b) __builtin_abort();
}
int main()
{
auto a = { 1, 2 };
auto b = { 1, 2 };
f (a.begin(), b.begin());
}

View file

@ -0,0 +1,17 @@
// Test that -fipa-icf combines the backing arrays for a and b.
// { dg-do run { target c++11 } }
// { dg-options -fipa-icf }
#include <initializer_list>
template <class T>
[[gnu::noipa]] void f (std::initializer_list<T> a,
std::initializer_list<T> b)
{
if (a.begin() != b.begin()) __builtin_abort();
}
int main()
{
f ({1,2}, {1,2});
}

View file

@ -13,3 +13,9 @@ int f()
using AR = const int[];
return AR{ 1,42,3,4,5,6,7,8,9,0 }[5];
}
int g()
{
std::initializer_list<int> a = {1,42,3};
return a.begin()[0];
}

View file

@ -4,6 +4,7 @@
// Test that we do range-initialization from const char *.
// { dg-final { scan-tree-dump {_M_range_initialize<const char\* const\*>} "gimple" } }
// { dg-final { scan-tree-dump {static const char.*72} "gimple" } }
#include <string>
#include <vector>

View file

@ -4,6 +4,8 @@
// Test that we do range-initialization from const char *.
// { dg-final { scan-tree-dump {_M_range_initialize<const char\* const\*>} "gimple" } }
// And that the backing array is static.
// { dg-final { scan-tree-dump {static const char.*72} "gimple" } }
#include <string>
#include <vector>

View file

@ -0,0 +1,13 @@
// PR c++/110070
// { dg-additional-options -fdump-tree-gimple }
// { dg-do compile { target c++11 } }
// { dg-final { scan-tree-dump {static const int [^\n]*\[4\] = } "gimple" } }
#include <initializer_list>
extern void ext(int);
void foo()
{
for (int i: {1,2,4,6})
ext(i);
}

View file

@ -1803,7 +1803,8 @@ struct GTY(()) tree_decl_common {
In VAR_DECL, PARM_DECL and RESULT_DECL, this is
DECL_HAS_VALUE_EXPR_P. */
unsigned decl_flag_2 : 1;
/* In FIELD_DECL, this is DECL_PADDING_P. */
/* In FIELD_DECL, this is DECL_PADDING_P.
In VAR_DECL, this is DECL_MERGEABLE. */
unsigned decl_flag_3 : 1;
/* Logically, these two would go in a theoretical base shared by var and
parm decl. */

View file

@ -3233,6 +3233,12 @@ extern void decl_fini_priority_insert (tree, priority_type);
#define DECL_NONALIASED(NODE) \
(VAR_DECL_CHECK (NODE)->base.nothrow_flag)
/* In a VAR_DECL, nonzero if this variable is not required to have a distinct
address from other variables with the same constant value. In other words,
consider -fmerge-all-constants to be on for this VAR_DECL. */
#define DECL_MERGEABLE(NODE) \
(VAR_DECL_CHECK (NODE)->decl_common.decl_flag_3)
/* This field is used to reference anything in decl.result and is meant only
for use by the garbage collector. */
#define DECL_RESULT_FLD(NODE) \

View file

@ -7032,7 +7032,7 @@ categorize_decl_for_section (const_tree decl, int reloc)
}
else if (reloc & targetm.asm_out.reloc_rw_mask ())
ret = reloc == 1 ? SECCAT_DATA_REL_RO_LOCAL : SECCAT_DATA_REL_RO;
else if (reloc || flag_merge_constants < 2
else if (reloc || (flag_merge_constants < 2 && !DECL_MERGEABLE (decl))
|| ((flag_sanitize & SANITIZE_ADDRESS)
/* PR 81697: for architectures that use section anchors we
need to ignore DECL_RTL_SET_P (decl) for string constants