[PATCH v23 02/33] c-family, c++: Look up built-in traits via identifier node
Ken Matsui
kmatsui@cs.washington.edu
Fri Oct 20 20:00:51 GMT 2023
On Fri, Oct 20, 2023 at 12:12 PM Patrick Palka <ppalka@redhat.com> wrote:
>
> On Fri, Oct 20, 2023 at 10:02 AM Ken Matsui <kmatsui@gcc.gnu.org> wrote:
> >
> > Since RID_MAX soon reaches 255 and all built-in traits are used approximately
> > once in a C++ translation unit, this patch removes all RID values for built-in
> > traits and uses the identifier node to look up the specific trait. Rather
> > than holding traits as keywords, we set all trait identifiers as cik_trait,
> > which is a new cp_identifier_kind. As cik_reserved_for_udlit was unused and
> > cp_identifier_kind is 3 bits, we replaced the unused field with the new
> > cik_trait. Also, the later patch handles a subsequent token to the built-in
> > identifier so that we accept the use of non-function-like built-in trait
> > identifiers.
>
> Thanks a lot, patches 1-31 in this series LGTM.
>
Thank you!!!
>
>
>
> >
> > gcc/c-family/ChangeLog:
> >
> > * c-common.cc (c_common_reswords): Remove all mappings of
> > built-in traits.
> > * c-common.h (enum rid): Remove all RID values for built-in traits.
> >
> > gcc/cp/ChangeLog:
> >
> > * cp-objcp-common.cc (names_builtin_p): Remove all RID value
> > cases for built-in traits. Check for built-in traits via
> > the new cik_trait kind.
> > * cp-tree.h (enum cp_trait_kind): Set its underlying type to
> > addr_space_t.
> > (struct cp_trait): New struct to hold trait information.
> > (cp_traits): New array to hold a mapping to all traits.
> > (cik_reserved_for_udlit): Rename to ...
> > (cik_trait): ... this.
> > (IDENTIFIER_ANY_OP_P): Exclude cik_trait.
> > (IDENTIFIER_TRAIT_P): New macro to detect cik_trait.
> > * lex.cc (cp_traits): Define its values, declared in cp-tree.h.
> > (init_cp_traits): New function to set cik_trait and
> > IDENTIFIER_CP_INDEX for all built-in trait identifiers.
> > (cxx_init): Call init_cp_traits function.
> > * parser.cc (cp_lexer_lookup_trait): New function to look up a
> > built-in trait by IDENTIFIER_CP_INDEX.
> > (cp_lexer_lookup_trait_expr): Likewise, look up an
> > expression-yielding built-in trait.
> > (cp_lexer_lookup_trait_type): Likewise, look up a type-yielding
> > built-in trait.
> > (cp_keyword_starts_decl_specifier_p): Remove all RID value cases
> > for built-in traits.
> > (cp_lexer_next_token_is_decl_specifier_keyword): Handle
> > type-yielding built-in traits.
> > (cp_parser_primary_expression): Remove all RID value cases for
> > built-in traits. Handle expression-yielding built-in traits.
> > (cp_parser_trait): Handle cp_trait instead of enum rid.
> > (cp_parser_simple_type_specifier): Remove all RID value cases
> > for built-in traits. Handle type-yielding built-in traits.
> >
> > Co-authored-by: Patrick Palka <ppalka@redhat.com>
> > Signed-off-by: Ken Matsui <kmatsui@gcc.gnu.org>
> > ---
> > gcc/c-family/c-common.cc | 7 ---
> > gcc/c-family/c-common.h | 5 --
> > gcc/cp/cp-objcp-common.cc | 8 +--
> > gcc/cp/cp-tree.h | 32 +++++++++---
> > gcc/cp/lex.cc | 34 ++++++++++++
> > gcc/cp/parser.cc | 105 +++++++++++++++++++++++---------------
> > 6 files changed, 126 insertions(+), 65 deletions(-)
> >
> > diff --git a/gcc/c-family/c-common.cc b/gcc/c-family/c-common.cc
> > index f044db5b797..21fd333ef57 100644
> > --- a/gcc/c-family/c-common.cc
> > +++ b/gcc/c-family/c-common.cc
> > @@ -508,13 +508,6 @@ const struct c_common_resword c_common_reswords[] =
> > { "wchar_t", RID_WCHAR, D_CXXONLY },
> > { "while", RID_WHILE, 0 },
> >
> > -#define DEFTRAIT(TCC, CODE, NAME, ARITY) \
> > - { NAME, RID_##CODE, D_CXXONLY },
> > -#include "cp/cp-trait.def"
> > -#undef DEFTRAIT
> > - /* An alias for __is_same. */
> > - { "__is_same_as", RID_IS_SAME, D_CXXONLY },
> > -
> > /* C++ transactional memory. */
> > { "synchronized", RID_SYNCHRONIZED, D_CXX_OBJC | D_TRANSMEM },
> > { "atomic_noexcept", RID_ATOMIC_NOEXCEPT, D_CXXONLY | D_TRANSMEM },
> > diff --git a/gcc/c-family/c-common.h b/gcc/c-family/c-common.h
> > index 1fdba7ef3ea..051a442e0f4 100644
> > --- a/gcc/c-family/c-common.h
> > +++ b/gcc/c-family/c-common.h
> > @@ -168,11 +168,6 @@ enum rid
> > RID_BUILTIN_LAUNDER,
> > RID_BUILTIN_BIT_CAST,
> >
> > -#define DEFTRAIT(TCC, CODE, NAME, ARITY) \
> > - RID_##CODE,
> > -#include "cp/cp-trait.def"
> > -#undef DEFTRAIT
> > -
> > /* C++11 */
> > RID_CONSTEXPR, RID_DECLTYPE, RID_NOEXCEPT, RID_NULLPTR, RID_STATIC_ASSERT,
> >
> > diff --git a/gcc/cp/cp-objcp-common.cc b/gcc/cp/cp-objcp-common.cc
> > index 93b027b80ce..b1adacfec07 100644
> > --- a/gcc/cp/cp-objcp-common.cc
> > +++ b/gcc/cp/cp-objcp-common.cc
> > @@ -421,6 +421,10 @@ names_builtin_p (const char *name)
> > }
> > }
> >
> > + /* Check for built-in traits. */
> > + if (IDENTIFIER_TRAIT_P (id))
> > + return true;
> > +
> > /* Also detect common reserved C++ words that aren't strictly built-in
> > functions. */
> > switch (C_RID_CODE (id))
> > @@ -434,10 +438,6 @@ names_builtin_p (const char *name)
> > case RID_BUILTIN_ASSOC_BARRIER:
> > case RID_BUILTIN_BIT_CAST:
> > case RID_OFFSETOF:
> > -#define DEFTRAIT(TCC, CODE, NAME, ARITY) \
> > - case RID_##CODE:
> > -#include "cp-trait.def"
> > -#undef DEFTRAIT
> > return true;
> > default:
> > break;
> > diff --git a/gcc/cp/cp-tree.h b/gcc/cp/cp-tree.h
> > index efcd2de54e5..e62e4df4db0 100644
> > --- a/gcc/cp/cp-tree.h
> > +++ b/gcc/cp/cp-tree.h
> > @@ -1226,7 +1226,7 @@ enum cp_identifier_kind {
> > cik_simple_op = 4, /* Non-assignment operator name. */
> > cik_assign_op = 5, /* An assignment operator name. */
> > cik_conv_op = 6, /* Conversion operator name. */
> > - cik_reserved_for_udlit = 7, /* Not yet in use */
> > + cik_trait = 7, /* Built-in trait name. */
> > cik_max
> > };
> >
> > @@ -1271,9 +1271,9 @@ enum cp_identifier_kind {
> > & IDENTIFIER_KIND_BIT_0 (NODE))
> >
> > /* True if this identifier is for any operator name (including
> > - conversions). Value 4, 5, 6 or 7. */
> > + conversions). Value 4, 5, or 6. */
> > #define IDENTIFIER_ANY_OP_P(NODE) \
> > - (IDENTIFIER_KIND_BIT_2 (NODE))
> > + (IDENTIFIER_KIND_BIT_2 (NODE) && !IDENTIFIER_TRAIT_P (NODE))
> >
> > /* True if this identifier is for an overloaded operator. Values 4, 5. */
> > #define IDENTIFIER_OVL_OP_P(NODE) \
> > @@ -1286,12 +1286,18 @@ enum cp_identifier_kind {
> > & IDENTIFIER_KIND_BIT_0 (NODE))
> >
> > /* True if this identifier is the name of a type-conversion
> > - operator. Value 7. */
> > + operator. Value 6. */
> > #define IDENTIFIER_CONV_OP_P(NODE) \
> > (IDENTIFIER_ANY_OP_P (NODE) \
> > & IDENTIFIER_KIND_BIT_1 (NODE) \
> > & (!IDENTIFIER_KIND_BIT_0 (NODE)))
> >
> > +/* True if this identifier is the name of a built-in trait. */
> > +#define IDENTIFIER_TRAIT_P(NODE) \
> > + (IDENTIFIER_KIND_BIT_0 (NODE) \
> > + && IDENTIFIER_KIND_BIT_1 (NODE) \
> > + && IDENTIFIER_KIND_BIT_2 (NODE))
> > +
> > /* True if this identifier is a new or delete operator. */
> > #define IDENTIFIER_NEWDEL_OP_P(NODE) \
> > (IDENTIFIER_OVL_OP_P (NODE) \
> > @@ -1375,16 +1381,26 @@ struct GTY (()) tree_argument_pack_select {
> > int index;
> > };
> >
> > -/* The different kinds of traits that we encounter. */
> > -
> > -enum cp_trait_kind
> > -{
> > +/* The different kinds of traits that we encounter. The size is limited to
> > + addr_space_t since a trait is looked up by IDENTIFIER_CP_INDEX. */
> > +enum cp_trait_kind : addr_space_t {
> > #define DEFTRAIT(TCC, CODE, NAME, ARITY) \
> > CPTK_##CODE,
> > #include "cp-trait.def"
> > #undef DEFTRAIT
> > };
> >
> > +/* The trait type. */
> > +struct cp_trait {
> > + const char *name;
> > + cp_trait_kind kind;
> > + short arity;
> > + bool type;
> > +};
> > +
> > +/* The trait table indexed by cp_trait_kind. */
> > +extern const struct cp_trait cp_traits[];
> > +
> > /* The types that we are processing. */
> > #define TRAIT_EXPR_TYPE1(NODE) \
> > (((struct tree_trait_expr *)TRAIT_EXPR_CHECK (NODE))->type1)
> > diff --git a/gcc/cp/lex.cc b/gcc/cp/lex.cc
> > index 64bcfb18196..a939e2e5f13 100644
> > --- a/gcc/cp/lex.cc
> > +++ b/gcc/cp/lex.cc
> > @@ -35,6 +35,7 @@ along with GCC; see the file COPYING3. If not see
> > #include "langhooks.h"
> >
> > static int interface_strcmp (const char *);
> > +static void init_cp_traits (void);
> > static void init_cp_pragma (void);
> >
> > static tree parse_strconst_pragma (const char *, int);
> > @@ -97,6 +98,19 @@ ovl_op_info_t ovl_op_info[2][OVL_OP_MAX] =
> > unsigned char ovl_op_mapping[MAX_TREE_CODES];
> > unsigned char ovl_op_alternate[OVL_OP_MAX];
> >
> > +/* The trait table, declared in cp-tree.h. */
> > +const cp_trait cp_traits[] =
> > +{
> > +#define DEFTRAIT(TCC, CODE, NAME, ARITY) \
> > + { NAME, CPTK_##CODE, ARITY, (TCC == tcc_type) },
> > +#include "cp-trait.def"
> > +#undef DEFTRAIT
> > +};
> > +/* The trait table cannot have more than 255 (addr_space_t) entries since
> > + the index is retrieved through IDENTIFIER_CP_INDEX. */
> > +static_assert(ARRAY_SIZE (cp_traits) <= 255,
> > + "cp_traits array cannot have more than 255 entries");
> > +
> > /* Get the name of the kind of identifier T. */
> >
> > const char *
> > @@ -283,6 +297,25 @@ init_reswords (void)
> > }
> > }
> >
> > +/* Initialize the C++ traits. */
> > +static void
> > +init_cp_traits (void)
> > +{
> > + tree id;
> > +
> > + for (unsigned int i = 0; i < ARRAY_SIZE (cp_traits); ++i)
> > + {
> > + id = get_identifier (cp_traits[i].name);
> > + IDENTIFIER_CP_INDEX (id) = cp_traits[i].kind;
> > + set_identifier_kind (id, cik_trait);
> > + }
> > +
> > + /* An alias for __is_same. */
> > + id = get_identifier ("__is_same_as");
> > + IDENTIFIER_CP_INDEX (id) = CPTK_IS_SAME;
> > + set_identifier_kind (id, cik_trait);
> > +}
> > +
> > static void
> > init_cp_pragma (void)
> > {
> > @@ -324,6 +357,7 @@ cxx_init (void)
> > input_location = BUILTINS_LOCATION;
> >
> > init_reswords ();
> > + init_cp_traits ();
> > init_tree ();
> > init_cp_semantics ();
> > init_operators ();
> > diff --git a/gcc/cp/parser.cc b/gcc/cp/parser.cc
> > index 59b9852895e..f87d4c0a855 100644
> > --- a/gcc/cp/parser.cc
> > +++ b/gcc/cp/parser.cc
> > @@ -246,6 +246,12 @@ static void cp_lexer_start_debugging
> > (cp_lexer *) ATTRIBUTE_UNUSED;
> > static void cp_lexer_stop_debugging
> > (cp_lexer *) ATTRIBUTE_UNUSED;
> > +static const cp_trait *cp_lexer_lookup_trait
> > + (const cp_token *);
> > +static const cp_trait *cp_lexer_lookup_trait_expr
> > + (const cp_token *);
> > +static const cp_trait *cp_lexer_lookup_trait_type
> > + (const cp_token *);
> >
> > static cp_token_cache *cp_token_cache_new
> > (cp_token *, cp_token *);
> > @@ -1167,12 +1173,6 @@ cp_keyword_starts_decl_specifier_p (enum rid keyword)
> > case RID_CONSTEVAL:
> > return true;
> >
> > -#define DEFTRAIT_TYPE(CODE, NAME, ARITY) \
> > - case RID_##CODE:
> > -#include "cp-trait.def"
> > -#undef DEFTRAIT_TYPE
> > - return true;
> > -
> > default:
> > if (keyword >= RID_FIRST_INT_N
> > && keyword < RID_FIRST_INT_N + NUM_INT_N_ENTS
> > @@ -1182,6 +1182,44 @@ cp_keyword_starts_decl_specifier_p (enum rid keyword)
> > }
> > }
> >
> > +/* Looks up the corresponding built-in trait if a given token is
> > + a built-in trait. Otherwise, returns nullptr. */
> > +
> > +static const cp_trait *
> > +cp_lexer_lookup_trait (const cp_token *token)
> > +{
> > + if (token->type == CPP_NAME && IDENTIFIER_TRAIT_P (token->u.value))
> > + return &cp_traits[IDENTIFIER_CP_INDEX (token->u.value)];
> > +
> > + return nullptr;
> > +}
> > +
> > +/* Similarly, but only if the token is an expression-yielding
> > + built-in trait. */
> > +
> > +static const cp_trait *
> > +cp_lexer_lookup_trait_expr (const cp_token *token)
> > +{
> > + const cp_trait *trait = cp_lexer_lookup_trait (token);
> > + if (trait && !trait->type)
> > + return trait;
> > +
> > + return nullptr;
> > +}
> > +
> > +/* Similarly, but only if the token is a type-yielding
> > + built-in trait. */
> > +
> > +static const cp_trait *
> > +cp_lexer_lookup_trait_type (const cp_token *token)
> > +{
> > + const cp_trait *trait = cp_lexer_lookup_trait (token);
> > + if (trait && trait->type)
> > + return trait;
> > +
> > + return nullptr;
> > +}
> > +
> > /* Return true if the next token is a keyword for a decl-specifier. */
> >
> > static bool
> > @@ -1190,6 +1228,8 @@ cp_lexer_next_token_is_decl_specifier_keyword (cp_lexer *lexer)
> > cp_token *token;
> >
> > token = cp_lexer_peek_token (lexer);
> > + if (cp_lexer_lookup_trait_type (token))
> > + return true;
> > return cp_keyword_starts_decl_specifier_p (token->keyword);
> > }
> >
> > @@ -2854,7 +2894,7 @@ static void cp_parser_late_parsing_default_args
> > static tree cp_parser_sizeof_operand
> > (cp_parser *, enum rid);
> > static cp_expr cp_parser_trait
> > - (cp_parser *, enum rid);
> > + (cp_parser *, const cp_trait *);
> > static bool cp_parser_declares_only_class_p
> > (cp_parser *);
> > static void cp_parser_set_storage_class
> > @@ -6029,12 +6069,6 @@ cp_parser_primary_expression (cp_parser *parser,
> > case RID_OFFSETOF:
> > return cp_parser_builtin_offsetof (parser);
> >
> > -#define DEFTRAIT_EXPR(CODE, NAME, ARITY) \
> > - case RID_##CODE:
> > -#include "cp-trait.def"
> > -#undef DEFTRAIT_EXPR
> > - return cp_parser_trait (parser, token->keyword);
> > -
> > // C++ concepts
> > case RID_REQUIRES:
> > return cp_parser_requires_expression (parser);
> > @@ -6073,6 +6107,9 @@ cp_parser_primary_expression (cp_parser *parser,
> > `::' as the beginning of a qualified-id, or the "operator"
> > keyword. */
> > case CPP_NAME:
> > + if (const cp_trait* trait = cp_lexer_lookup_trait_expr (token))
> > + return cp_parser_trait (parser, trait);
> > + /* FALLTHRU */
> > case CPP_SCOPE:
> > case CPP_TEMPLATE_ID:
> > case CPP_NESTED_NAME_SPECIFIER:
> > @@ -11041,28 +11078,13 @@ cp_parser_builtin_offsetof (cp_parser *parser)
> > /* Parse a builtin trait expression or type. */
> >
> > static cp_expr
> > -cp_parser_trait (cp_parser* parser, enum rid keyword)
> > +cp_parser_trait (cp_parser* parser, const cp_trait* trait)
> > {
> > - cp_trait_kind kind;
> > + const cp_trait_kind kind = trait->kind;
> > tree type1, type2 = NULL_TREE;
> > - bool binary = false;
> > - bool variadic = false;
> > - bool type = false;
> > -
> > - switch (keyword)
> > - {
> > -#define DEFTRAIT(TCC, CODE, NAME, ARITY) \
> > - case RID_##CODE: \
> > - kind = CPTK_##CODE; \
> > - binary = (ARITY == 2); \
> > - variadic = (ARITY == -1); \
> > - type = (TCC == tcc_type); \
> > - break;
> > -#include "cp-trait.def"
> > -#undef DEFTRAIT
> > - default:
> > - gcc_unreachable ();
> > - }
> > + const bool binary = (trait->arity == 2);
> > + const bool variadic = (trait->arity == -1);
> > + const bool type = trait->type;
> >
> > /* Get location of initial token. */
> > location_t start_loc = cp_lexer_peek_token (parser->lexer)->location;
> > @@ -20089,20 +20111,21 @@ cp_parser_simple_type_specifier (cp_parser* parser,
> >
> > return type;
> >
> > -#define DEFTRAIT_TYPE(CODE, NAME, ARITY) \
> > - case RID_##CODE:
> > -#include "cp-trait.def"
> > -#undef DEFTRAIT_TYPE
> > - type = cp_parser_trait (parser, token->keyword);
> > + default:
> > + break;
> > + }
> > +
> > + /* If token is a type-yielding built-in trait, parse it. */
> > + const cp_trait* trait = cp_lexer_lookup_trait_type (token);
> > + if (trait)
> > + {
> > + type = cp_parser_trait (parser, trait);
> > if (decl_specs)
> > cp_parser_set_decl_spec_type (decl_specs, type,
> > token,
> > /*type_definition_p=*/false);
> >
> > return type;
> > -
> > - default:
> > - break;
> > }
> >
> > /* If token is an already-parsed decltype not followed by ::,
> > --
> > 2.42.0
> >
>
More information about the Libstdc++
mailing list