X-Git-Url: http://drtracing.org/?a=blobdiff_plain;f=gdb%2Fmacroexp.c;h=e132a3bc26ca62f1e98236c94f13587aa337bfea;hb=7f31862a8d9f3eea51fc58bd66abeb70c730feaf;hp=8102bc081f00b366a9e12e4a1487a6f73a755b71;hpb=ccb3ac8a121682a5fc5fd767f80872ef3e5c7b47;p=deliverable%2Fbinutils-gdb.git diff --git a/gdb/macroexp.c b/gdb/macroexp.c index 8102bc081f..e132a3bc26 100644 --- a/gdb/macroexp.c +++ b/gdb/macroexp.c @@ -1,5 +1,5 @@ /* C preprocessor macro expansion for GDB. - Copyright (C) 2002, 2007, 2008 Free Software Foundation, Inc. + Copyright (C) 2002-2016 Free Software Foundation, Inc. Contributed by Red Hat, Inc. This file is part of GDB. @@ -22,7 +22,7 @@ #include "bcache.h" #include "macrotab.h" #include "macroexp.h" -#include "gdb_assert.h" +#include "c-lang.h" @@ -112,6 +112,17 @@ free_buffer (struct macro_buffer *b) xfree (b->text); } +/* Like free_buffer, but return the text as an xstrdup()d string. + This only exists to try to make the API relatively clean. */ + +static char * +free_buffer_return_text (struct macro_buffer *b) +{ + gdb_assert (! b->shared); + gdb_assert (b->size); + /* Nothing to do. */ + return b->text; +} /* A cleanup function for macro buffers. */ static void @@ -135,7 +146,7 @@ resize_buffer (struct macro_buffer *b, int n) while (b->size <= n) b->size *= 2; - b->text = xrealloc (b->text, b->size); + b->text = (char *) xrealloc (b->text, b->size); } @@ -204,7 +215,7 @@ set_token (struct macro_buffer *tok, char *start, char *end) init_shared_buffer (tok, start, end - start); tok->last_token = 0; - /* Presumed; get_identifier may overwrite this. */ + /* Presumed; get_identifier may overwrite this. */ tok->is_identifier = 0; } @@ -278,20 +289,22 @@ get_pp_number (struct macro_buffer *tok, char *p, char *end) { if (p < end && (macro_is_digit (*p) - || *p == '.')) + || (*p == '.' + && p + 2 <= end + && macro_is_digit (p[1])))) { char *tok_start = p; while (p < end) { - if (macro_is_digit (*p) - || macro_is_identifier_nondigit (*p) - || *p == '.') - p++; - else if (p + 2 <= end - && strchr ("eEpP.", *p) - && (p[1] == '+' || p[1] == '-')) + if (p + 2 <= end + && strchr ("eEpP", *p) + && (p[1] == '+' || p[1] == '-')) p += 2; + else if (macro_is_digit (*p) + || macro_is_identifier_nondigit (*p) + || *p == '.') + p++; else break; } @@ -318,26 +331,27 @@ get_character_constant (struct macro_buffer *tok, char *p, char *end) way GDB's C/C++ lexer does. So we call parse_escape in utils.c to handle escape sequences. */ if ((p + 1 <= end && *p == '\'') - || (p + 2 <= end && p[0] == 'L' && p[1] == '\'')) + || (p + 2 <= end + && (p[0] == 'L' || p[0] == 'u' || p[0] == 'U') + && p[1] == '\'')) { char *tok_start = p; - char *body_start; + int char_count = 0; if (*p == '\'') p++; - else if (*p == 'L') + else if (*p == 'L' || *p == 'u' || *p == 'U') p += 2; else - gdb_assert (0); + gdb_assert_not_reached ("unexpected character constant"); - body_start = p; for (;;) { if (p >= end) error (_("Unmatched single quote.")); else if (*p == '\'') { - if (p == body_start) + if (!char_count) error (_("A character constant must contain at least one " "character.")); p++; @@ -345,11 +359,17 @@ get_character_constant (struct macro_buffer *tok, char *p, char *end) } else if (*p == '\\') { - p++; - parse_escape (&p); + const char *s, *o; + + s = o = ++p; + char_count += c_parse_escape (&s, NULL); + p += s - o; } else - p++; + { + p++; + char_count++; + } } set_token (tok, tok_start, p); @@ -368,25 +388,25 @@ static int get_string_literal (struct macro_buffer *tok, char *p, char *end) { if ((p + 1 <= end - && *p == '\"') + && *p == '"') || (p + 2 <= end - && p[0] == 'L' - && p[1] == '\"')) + && (p[0] == 'L' || p[0] == 'u' || p[0] == 'U') + && p[1] == '"')) { char *tok_start = p; - if (*p == '\"') + if (*p == '"') p++; - else if (*p == 'L') + else if (*p == 'L' || *p == 'u' || *p == 'U') p += 2; else - gdb_assert (0); + gdb_assert_not_reached ("unexpected string literal"); for (;;) { if (p >= end) error (_("Unterminated string in expression.")); - else if (*p == '\"') + else if (*p == '"') { p++; break; @@ -396,8 +416,11 @@ get_string_literal (struct macro_buffer *tok, char *p, char *end) "constants.")); else if (*p == '\\') { - p++; - parse_escape (&p); + const char *s, *o; + + s = o = ++p; + c_parse_escape (&s, NULL); + p += s - o; } else p++; @@ -516,6 +539,7 @@ get_token (struct macro_buffer *tok, { /* How many characters did we consume, including whitespace? */ int consumed = p - src->text + tok->len; + src->text += consumed; src->len -= consumed; return 1; @@ -625,6 +649,67 @@ append_tokens_without_splicing (struct macro_buffer *dest, _("unable to avoid splicing tokens during macro expansion")); } +/* Stringify an argument, and insert it into DEST. ARG is the text to + stringify; it is LEN bytes long. */ + +static void +stringify (struct macro_buffer *dest, const char *arg, int len) +{ + /* Trim initial whitespace from ARG. */ + while (len > 0 && macro_is_whitespace (*arg)) + { + ++arg; + --len; + } + + /* Trim trailing whitespace from ARG. */ + while (len > 0 && macro_is_whitespace (arg[len - 1])) + --len; + + /* Insert the string. */ + appendc (dest, '"'); + while (len > 0) + { + /* We could try to handle strange cases here, like control + characters, but there doesn't seem to be much point. */ + if (macro_is_whitespace (*arg)) + { + /* Replace a sequence of whitespace with a single space. */ + appendc (dest, ' '); + while (len > 1 && macro_is_whitespace (arg[1])) + { + ++arg; + --len; + } + } + else if (*arg == '\\' || *arg == '"') + { + appendc (dest, '\\'); + appendc (dest, *arg); + } + else + appendc (dest, *arg); + ++arg; + --len; + } + appendc (dest, '"'); + dest->last_token = dest->len; +} + +/* See macroexp.h. */ + +char * +macro_stringify (const char *str) +{ + struct macro_buffer buffer; + int len = strlen (str); + + init_buffer (&buffer, len); + stringify (&buffer, str, len); + appendc (&buffer, '\0'); + + return free_buffer_return_text (&buffer); +} /* Expanding macros! */ @@ -647,7 +732,7 @@ struct macro_name_list { particular macro, and otherwise delegates the decision to another function/baton pair. But that makes the linked list of excluded macros chained through untyped baton pointers, which will make it - harder to debug. :( */ + harder to debug. :( */ static int currently_rescanning (struct macro_name_list *list, const char *name) { @@ -674,6 +759,11 @@ currently_rescanning (struct macro_name_list *list, const char *name) If SRC doesn't contain a properly terminated argument list, then raise an error. + + For a variadic macro, NARGS holds the number of formal arguments to + the macro. For a GNU-style variadic macro, this should be the + number of named arguments. For a non-variadic macro, NARGS should + be -1. Otherwise, return a pointer to the first element of an array of macro buffers referring to the argument texts, and set *ARGC_P to @@ -694,7 +784,8 @@ currently_rescanning (struct macro_name_list *list, const char *name) following the invocation. */ static struct macro_buffer * -gather_arguments (const char *name, struct macro_buffer *src, int *argc_p) +gather_arguments (const char *name, struct macro_buffer *src, + int nargs, int *argc_p) { struct macro_buffer tok; int args_len, args_size; @@ -706,6 +797,7 @@ gather_arguments (const char *name, struct macro_buffer *src, int *argc_p) paren. */ { struct macro_buffer temp; + init_shared_buffer (&temp, src->text, src->len); if (! get_token (&tok, &temp) @@ -722,7 +814,7 @@ gather_arguments (const char *name, struct macro_buffer *src, int *argc_p) args_len = 0; args_size = 6; - args = (struct macro_buffer *) xmalloc (sizeof (*args) * args_size); + args = XNEWVEC (struct macro_buffer, args_size); for (;;) { @@ -733,7 +825,7 @@ gather_arguments (const char *name, struct macro_buffer *src, int *argc_p) if (args_len >= args_size) { args_size *= 2; - args = xrealloc (args, sizeof (*args) * args_size); + args = XRESIZEVEC (struct macro_buffer, args, args_size); } /* Initialize the next argument. */ @@ -744,8 +836,6 @@ gather_arguments (const char *name, struct macro_buffer *src, int *argc_p) depth = 0; for (;;) { - char *start = src->text; - if (! get_token (&tok, src)) error (_("Malformed argument list for macro `%s'."), name); @@ -760,6 +850,21 @@ gather_arguments (const char *name, struct macro_buffer *src, int *argc_p) the end of the argument list. */ if (depth == 0) { + /* In the varargs case, the last argument may be + missing. Add an empty argument in this case. */ + if (nargs != -1 && args_len == nargs - 1) + { + /* Make sure we have room for the argument. */ + if (args_len >= args_size) + { + args_size++; + args = XRESIZEVEC (struct macro_buffer, args, + args_size); + } + arg = &args[args_len++]; + set_token (arg, src->text, src->text); + } + discard_cleanups (back_to); *argc_p = args_len; return args; @@ -769,8 +874,11 @@ gather_arguments (const char *name, struct macro_buffer *src, int *argc_p) } /* If tok is a comma at top level, then that's the end of - the current argument. */ - else if (tok.len == 1 && tok.text[0] == ',' && depth == 0) + the current argument. However, if we are handling a + variadic macro and we are computing the last argument, we + want to include the comma and remaining tokens. */ + else if (tok.len == 1 && tok.text[0] == ',' && depth == 0 + && (nargs == -1 || args_len < nargs)) break; /* Extend the current argument to enclose this token. If @@ -801,17 +909,58 @@ static void scan (struct macro_buffer *dest, void *lookup_baton); +/* A helper function for substitute_args. + + ARGV is a vector of all the arguments; ARGC is the number of + arguments. IS_VARARGS is true if the macro being substituted is a + varargs macro; in this case VA_ARG_NAME is the name of the + "variable" argument. VA_ARG_NAME is ignored if IS_VARARGS is + false. + + If the token TOK is the name of a parameter, return the parameter's + index. If TOK is not an argument, return -1. */ + +static int +find_parameter (const struct macro_buffer *tok, + int is_varargs, const struct macro_buffer *va_arg_name, + int argc, const char * const *argv) +{ + int i; + + if (! tok->is_identifier) + return -1; + + for (i = 0; i < argc; ++i) + if (tok->len == strlen (argv[i]) + && !memcmp (tok->text, argv[i], tok->len)) + return i; + + if (is_varargs && tok->len == va_arg_name->len + && ! memcmp (tok->text, va_arg_name->text, tok->len)) + return argc - 1; + + return -1; +} + /* Given the macro definition DEF, being invoked with the actual arguments given by ARGC and ARGV, substitute the arguments into the replacement list, and store the result in DEST. + IS_VARARGS should be true if DEF is a varargs macro. In this case, + VA_ARG_NAME should be the name of the "variable" argument -- either + __VA_ARGS__ for c99-style varargs, or the final argument name, for + GNU-style varargs. If IS_VARARGS is false, this parameter is + ignored. + If it is necessary to expand macro invocations in one of the arguments, use LOOKUP_FUNC and LOOKUP_BATON to find the macro definitions, and don't expand invocations of the macros listed in NO_LOOP. */ + static void substitute_args (struct macro_buffer *dest, struct macro_definition *def, + int is_varargs, const struct macro_buffer *va_arg_name, int argc, struct macro_buffer *argv, struct macro_name_list *no_loop, macro_lookup_ftype *lookup_func, @@ -819,6 +968,17 @@ substitute_args (struct macro_buffer *dest, { /* A macro buffer for the macro's replacement list. */ struct macro_buffer replacement_list; + /* The token we are currently considering. */ + struct macro_buffer tok; + /* The replacement list's pointer from just before TOK was lexed. */ + char *original_rl_start; + /* We have a single lookahead token to handle token splicing. */ + struct macro_buffer lookahead; + /* The lookahead token might not be valid. */ + int lookahead_valid; + /* The replacement list's pointer from just before LOOKAHEAD was + lexed. */ + char *lookahead_rl_start; init_shared_buffer (&replacement_list, (char *) def->replacement, strlen (def->replacement)); @@ -826,16 +986,14 @@ substitute_args (struct macro_buffer *dest, gdb_assert (dest->len == 0); dest->last_token = 0; + original_rl_start = replacement_list.text; + if (! get_token (&tok, &replacement_list)) + return; + lookahead_rl_start = replacement_list.text; + lookahead_valid = get_token (&lookahead, &replacement_list); + for (;;) { - struct macro_buffer tok; - char *original_rl_start = replacement_list.text; - int substituted = 0; - - /* Find the next token in the replacement list. */ - if (! get_token (&tok, &replacement_list)) - break; - /* Just for aesthetics. If we skipped some whitespace, copy that to DEST. */ if (tok.text > original_rl_start) @@ -847,46 +1005,163 @@ substitute_args (struct macro_buffer *dest, /* Is this token the stringification operator? */ if (tok.len == 1 && tok.text[0] == '#') - error (_("Stringification is not implemented yet.")); + { + int arg; - /* Is this token the splicing operator? */ - if (tok.len == 2 - && tok.text[0] == '#' - && tok.text[1] == '#') - error (_("Token splicing is not implemented yet.")); + if (!lookahead_valid) + error (_("Stringification operator requires an argument.")); - /* Is this token an identifier? */ - if (tok.is_identifier) - { - int i; - - /* Is it the magic varargs parameter? */ - if (tok.len == 11 - && ! memcmp (tok.text, "__VA_ARGS__", 11)) - error (_("Variable-arity macros not implemented yet.")); - - /* Is it one of the parameters? */ - for (i = 0; i < def->argc; i++) - if (tok.len == strlen (def->argv[i]) - && ! memcmp (tok.text, def->argv[i], tok.len)) - { - struct macro_buffer arg_src; - - /* Expand any macro invocations in the argument text, - and append the result to dest. Remember that scan - mutates its source, so we need to scan a new buffer - referring to the argument's text, not the argument - itself. */ - init_shared_buffer (&arg_src, argv[i].text, argv[i].len); - scan (dest, &arg_src, no_loop, lookup_func, lookup_baton); - substituted = 1; - break; - } - } + arg = find_parameter (&lookahead, is_varargs, va_arg_name, + def->argc, def->argv); + if (arg == -1) + error (_("Argument to stringification operator must name " + "a macro parameter.")); - /* If it wasn't a parameter, then just copy it across. */ - if (! substituted) - append_tokens_without_splicing (dest, &tok); + stringify (dest, argv[arg].text, argv[arg].len); + + /* Read one token and let the loop iteration code handle the + rest. */ + lookahead_rl_start = replacement_list.text; + lookahead_valid = get_token (&lookahead, &replacement_list); + } + /* Is this token the splicing operator? */ + else if (tok.len == 2 + && tok.text[0] == '#' + && tok.text[1] == '#') + error (_("Stray splicing operator")); + /* Is the next token the splicing operator? */ + else if (lookahead_valid + && lookahead.len == 2 + && lookahead.text[0] == '#' + && lookahead.text[1] == '#') + { + int finished = 0; + int prev_was_comma = 0; + + /* Note that GCC warns if the result of splicing is not a + token. In the debugger there doesn't seem to be much + benefit from doing this. */ + + /* Insert the first token. */ + if (tok.len == 1 && tok.text[0] == ',') + prev_was_comma = 1; + else + { + int arg = find_parameter (&tok, is_varargs, va_arg_name, + def->argc, def->argv); + + if (arg != -1) + appendmem (dest, argv[arg].text, argv[arg].len); + else + appendmem (dest, tok.text, tok.len); + } + + /* Apply a possible sequence of ## operators. */ + for (;;) + { + if (! get_token (&tok, &replacement_list)) + error (_("Splicing operator at end of macro")); + + /* Handle a comma before a ##. If we are handling + varargs, and the token on the right hand side is the + varargs marker, and the final argument is empty or + missing, then drop the comma. This is a GNU + extension. There is one ambiguous case here, + involving pedantic behavior with an empty argument, + but we settle that in favor of GNU-style (GCC uses an + option). If we aren't dealing with varargs, we + simply insert the comma. */ + if (prev_was_comma) + { + if (! (is_varargs + && tok.len == va_arg_name->len + && !memcmp (tok.text, va_arg_name->text, tok.len) + && argv[argc - 1].len == 0)) + appendmem (dest, ",", 1); + prev_was_comma = 0; + } + + /* Insert the token. If it is a parameter, insert the + argument. If it is a comma, treat it specially. */ + if (tok.len == 1 && tok.text[0] == ',') + prev_was_comma = 1; + else + { + int arg = find_parameter (&tok, is_varargs, va_arg_name, + def->argc, def->argv); + + if (arg != -1) + appendmem (dest, argv[arg].text, argv[arg].len); + else + appendmem (dest, tok.text, tok.len); + } + + /* Now read another token. If it is another splice, we + loop. */ + original_rl_start = replacement_list.text; + if (! get_token (&tok, &replacement_list)) + { + finished = 1; + break; + } + + if (! (tok.len == 2 + && tok.text[0] == '#' + && tok.text[1] == '#')) + break; + } + + if (prev_was_comma) + { + /* We saw a comma. Insert it now. */ + appendmem (dest, ",", 1); + } + + dest->last_token = dest->len; + if (finished) + lookahead_valid = 0; + else + { + /* Set up for the loop iterator. */ + lookahead = tok; + lookahead_rl_start = original_rl_start; + lookahead_valid = 1; + } + } + else + { + /* Is this token an identifier? */ + int substituted = 0; + int arg = find_parameter (&tok, is_varargs, va_arg_name, + def->argc, def->argv); + + if (arg != -1) + { + struct macro_buffer arg_src; + + /* Expand any macro invocations in the argument text, + and append the result to dest. Remember that scan + mutates its source, so we need to scan a new buffer + referring to the argument's text, not the argument + itself. */ + init_shared_buffer (&arg_src, argv[arg].text, argv[arg].len); + scan (dest, &arg_src, no_loop, lookup_func, lookup_baton); + substituted = 1; + } + + /* If it wasn't a parameter, then just copy it across. */ + if (! substituted) + append_tokens_without_splicing (dest, &tok); + } + + if (! lookahead_valid) + break; + + tok = lookahead; + original_rl_start = lookahead_rl_start; + + lookahead_rl_start = replacement_list.text; + lookahead_valid = get_token (&lookahead, &replacement_list); } } @@ -895,7 +1170,7 @@ substitute_args (struct macro_buffer *dest, its expansion to DEST. SRC is the input text following the ID token. We are currently rescanning the expansions of the macros named in NO_LOOP; don't re-expand them. Use LOOKUP_FUNC and - LOOKUP_BATON to find definitions for any nested macro references. + LOOKUP_BATON to find definitions for any nested macro references. Return 1 if we decided to expand it, zero otherwise. (If it's a function-like macro name that isn't followed by an argument list, @@ -937,13 +1212,40 @@ expand (const char *id, struct macro_buffer *argv = NULL; struct macro_buffer substituted; struct macro_buffer substituted_src; - - if (def->argc >= 1 - && strcmp (def->argv[def->argc - 1], "...") == 0) - error (_("Varargs macros not implemented yet.")); + struct macro_buffer va_arg_name = {0}; + int is_varargs = 0; + + if (def->argc >= 1) + { + if (strcmp (def->argv[def->argc - 1], "...") == 0) + { + /* In C99-style varargs, substitution is done using + __VA_ARGS__. */ + init_shared_buffer (&va_arg_name, "__VA_ARGS__", + strlen ("__VA_ARGS__")); + is_varargs = 1; + } + else + { + int len = strlen (def->argv[def->argc - 1]); + + if (len > 3 + && strcmp (def->argv[def->argc - 1] + len - 3, "...") == 0) + { + /* In GNU-style varargs, the name of the + substitution parameter is the name of the formal + argument without the "...". */ + init_shared_buffer (&va_arg_name, + (char *) def->argv[def->argc - 1], + len - 3); + is_varargs = 1; + } + } + } make_cleanup (free_current_contents, &argv); - argv = gather_arguments (id, src, &argc); + argv = gather_arguments (id, src, is_varargs ? def->argc : -1, + &argc); /* If we couldn't find any argument list, then we don't expand this macro. */ @@ -957,12 +1259,16 @@ expand (const char *id, this macro. */ if (argc != def->argc) { + if (is_varargs && argc >= def->argc - 1) + { + /* Ok. */ + } /* Remember that a sequence of tokens like "foo()" is a valid invocation of a macro expecting either zero or one arguments. */ - if (! (argc == 1 - && argv[0].len == 0 - && def->argc == 0)) + else if (! (argc == 1 + && argv[0].len == 0 + && def->argc == 0)) error (_("Wrong number of arguments to macro `%s' " "(expected %d, got %d)."), id, def->argc, argc); @@ -976,8 +1282,8 @@ expand (const char *id, expand an argument until we see how it's being used. */ init_buffer (&substituted, 0); make_cleanup (cleanup_macro_buffer, &substituted); - substitute_args (&substituted, def, argc, argv, no_loop, - lookup_func, lookup_baton); + substitute_args (&substituted, def, is_varargs, &va_arg_name, + argc, argv, no_loop, lookup_func, lookup_baton); /* Now `substituted' is the macro's replacement list, with all argument values substituted into it properly. Re-scan it for @@ -1025,8 +1331,9 @@ maybe_expand (struct macro_buffer *dest, { /* Make a null-terminated copy of it, since that's what our lookup function expects. */ - char *id = xmalloc (src_first->len + 1); + char *id = (char *) xmalloc (src_first->len + 1); struct cleanup *back_to = make_cleanup (xfree, id); + memcpy (id, src_first->text, src_first->len); id[src_first->len] = 0; @@ -1133,7 +1440,7 @@ macro_expand_once (const char *source, char * -macro_expand_next (char **lexptr, +macro_expand_next (const char **lexptr, macro_lookup_ftype *lookup_func, void *lookup_baton) { @@ -1141,7 +1448,7 @@ macro_expand_next (char **lexptr, struct cleanup *back_to; /* Set up SRC to refer to the input text, pointed to by *lexptr. */ - init_shared_buffer (&src, *lexptr, strlen (*lexptr)); + init_shared_buffer (&src, (char *) *lexptr, strlen (*lexptr)); /* Set up DEST to receive the expansion, if there is one. */ init_buffer (&dest, 0);