| /* Check calls to formatted I/O functions (-Wformat). |
| Copyright (C) 1992-2021 Free Software Foundation, Inc. |
| |
| This file is part of GCC. |
| |
| GCC is free software; you can redistribute it and/or modify it under |
| the terms of the GNU General Public License as published by the Free |
| Software Foundation; either version 3, or (at your option) any later |
| version. |
| |
| GCC is distributed in the hope that it will be useful, but WITHOUT ANY |
| WARRANTY; without even the implied warranty of MERCHANTABILITY or |
| FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
| for more details. |
| |
| You should have received a copy of the GNU General Public License |
| along with GCC; see the file COPYING3. If not see |
| <http://www.gnu.org/licenses/>. */ |
| |
| #include "config.h" |
| #include "system.h" |
| #include "coretypes.h" |
| #include "tm.h" |
| #include "c-target.h" |
| #include "c-common.h" |
| #include "alloc-pool.h" |
| #include "stringpool.h" |
| #include "c-objc.h" |
| #include "intl.h" |
| #include "langhooks.h" |
| #include "c-format.h" |
| #include "diagnostic.h" |
| #include "substring-locations.h" |
| #include "selftest.h" |
| #include "selftest-diagnostic.h" |
| #include "builtins.h" |
| #include "attribs.h" |
| #include "gcc-rich-location.h" |
| |
| /* Handle attributes associated with format checking. */ |
| |
| /* This must be in the same order as format_types, except for |
| format_type_error. Target-specific format types do not have |
| matching enum values. */ |
| enum format_type { printf_format_type, asm_fprintf_format_type, |
| gcc_diag_format_type, gcc_tdiag_format_type, |
| gcc_cdiag_format_type, |
| gcc_cxxdiag_format_type, gcc_gfc_format_type, |
| gcc_dump_printf_format_type, |
| gcc_objc_string_format_type, |
| format_type_error = -1}; |
| |
| struct function_format_info |
| { |
| enum format_type format_type; /* type of format (printf, scanf, etc.) */ |
| /* IS_RAW is relevant only for GCC diagnostic format functions. |
| It is set for "raw" formatting functions like pp_printf that |
| are not intended to produce complete diagnostics according to |
| GCC guidelines, and clear for others like error and warning |
| whose format string is checked for proper quoting and spelling. */ |
| bool is_raw; |
| unsigned HOST_WIDE_INT format_num; /* number of format argument */ |
| unsigned HOST_WIDE_INT first_arg_num; /* number of first arg (zero for varargs) */ |
| }; |
| |
| /* Initialized in init_dynamic_diag_info. */ |
| static GTY(()) tree local_tree_type_node; |
| static GTY(()) tree local_event_ptr_node; |
| static GTY(()) tree local_gimple_ptr_node; |
| static GTY(()) tree local_cgraph_node_ptr_node; |
| static GTY(()) tree locus; |
| |
| static bool decode_format_attr (const_tree, tree, tree, function_format_info *, |
| bool); |
| static format_type decode_format_type (const char *, bool * = NULL); |
| |
| static bool check_format_string (const_tree argument, |
| unsigned HOST_WIDE_INT format_num, |
| int flags, bool *no_add_attrs, |
| int expected_format_type); |
| static tree get_constant (const_tree fntype, const_tree atname, tree expr, |
| int argno, unsigned HOST_WIDE_INT *value, |
| int flags, bool validated_p); |
| static const char *convert_format_name_to_system_name (const char *attr_name); |
| |
| static int first_target_format_type; |
| static const char *format_name (int format_num); |
| static int format_flags (int format_num); |
| |
| /* Emit a warning as per format_warning_va, but construct the substring_loc |
| for the character at offset (CHAR_IDX - 1) within a string constant |
| FORMAT_STRING_CST at FMT_STRING_LOC. */ |
| |
| ATTRIBUTE_GCC_DIAG (5,6) |
| static bool |
| format_warning_at_char (location_t fmt_string_loc, tree format_string_cst, |
| int char_idx, int opt, const char *gmsgid, ...) |
| { |
| va_list ap; |
| va_start (ap, gmsgid); |
| tree string_type = TREE_TYPE (format_string_cst); |
| |
| /* The callers are of the form: |
| format_warning (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| where format_chars has already been incremented, so that |
| CHAR_IDX is one character beyond where the warning should |
| be emitted. Fix it. */ |
| char_idx -= 1; |
| |
| substring_loc fmt_loc (fmt_string_loc, string_type, char_idx, char_idx, |
| char_idx); |
| format_string_diagnostic_t diag (fmt_loc, NULL, UNKNOWN_LOCATION, NULL, |
| NULL); |
| bool warned = diag.emit_warning_va (opt, gmsgid, &ap); |
| va_end (ap); |
| |
| return warned; |
| } |
| |
| |
| /* Emit a warning as per format_warning_va, but construct the substring_loc |
| for the substring at offset (POS1, POS2 - 1) within a string constant |
| FORMAT_STRING_CST at FMT_STRING_LOC. */ |
| |
| ATTRIBUTE_GCC_DIAG (6,7) |
| static bool |
| format_warning_substr (location_t fmt_string_loc, tree format_string_cst, |
| int pos1, int pos2, int opt, const char *gmsgid, ...) |
| { |
| va_list ap; |
| va_start (ap, gmsgid); |
| tree string_type = TREE_TYPE (format_string_cst); |
| |
| pos2 -= 1; |
| |
| substring_loc fmt_loc (fmt_string_loc, string_type, pos1, pos1, pos2); |
| format_string_diagnostic_t diag (fmt_loc, NULL, UNKNOWN_LOCATION, NULL, |
| NULL); |
| bool warned = diag.emit_warning_va (opt, gmsgid, &ap); |
| va_end (ap); |
| |
| return warned; |
| } |
| |
| |
| /* Check that we have a pointer to a string suitable for use as a format. |
| The default is to check for a char type. |
| For objective-c dialects, this is extended to include references to string |
| objects validated by objc_string_ref_type_p (). |
| Targets may also provide a string object type that can be used within c and |
| c++ and shared with their respective objective-c dialects. In this case the |
| reference to a format string is checked for validity via a hook. |
| |
| The function returns true if strref points to any string type valid for the |
| language dialect and target. */ |
| |
| bool |
| valid_format_string_type_p (tree strref) |
| { |
| return (strref != NULL |
| && TREE_CODE (strref) == POINTER_TYPE |
| && (TYPE_MAIN_VARIANT (TREE_TYPE (strref)) == char_type_node |
| || objc_string_ref_type_p (strref) |
| || (*targetcm.string_object_ref_type_p) ((const_tree) strref))); |
| } |
| |
| /* Handle a "format_arg" attribute; arguments as in |
| struct attribute_spec.handler. */ |
| tree |
| handle_format_arg_attribute (tree *node, tree atname, |
| tree args, int flags, bool *no_add_attrs) |
| { |
| tree type = *node; |
| /* Note that TREE_VALUE (args) is changed in place below. */ |
| tree *format_num_expr = &TREE_VALUE (args); |
| unsigned HOST_WIDE_INT format_num = 0; |
| |
| if (tree val = get_constant (type, atname, *format_num_expr, 0, &format_num, |
| 0, false)) |
| *format_num_expr = val; |
| else |
| { |
| *no_add_attrs = true; |
| return NULL_TREE; |
| } |
| |
| if (prototype_p (type)) |
| { |
| /* The format arg can be any string reference valid for the language and |
| target. We cannot be more specific in this case. */ |
| if (!check_format_string (type, format_num, flags, no_add_attrs, -1)) |
| return NULL_TREE; |
| } |
| |
| if (!valid_format_string_type_p (TREE_TYPE (type))) |
| { |
| if (!(flags & (int) ATTR_FLAG_BUILT_IN)) |
| error ("function does not return string type"); |
| *no_add_attrs = true; |
| return NULL_TREE; |
| } |
| |
| return NULL_TREE; |
| } |
| |
| /* Verify that the format_num argument is actually a string reference suitable, |
| for the language dialect and target (in case the format attribute is in |
| error). When we know the specific reference type expected, this is also |
| checked. */ |
| static bool |
| check_format_string (const_tree fntype, unsigned HOST_WIDE_INT format_num, |
| int flags, bool *no_add_attrs, int expected_format_type) |
| { |
| unsigned HOST_WIDE_INT i; |
| bool is_objc_sref, is_target_sref, is_char_ref; |
| tree ref; |
| int fmt_flags; |
| function_args_iterator iter; |
| |
| i = 1; |
| FOREACH_FUNCTION_ARGS (fntype, ref, iter) |
| { |
| if (i == format_num) |
| break; |
| i++; |
| } |
| |
| if (!ref |
| || !valid_format_string_type_p (ref)) |
| { |
| if (!(flags & (int) ATTR_FLAG_BUILT_IN)) |
| error ("format string argument is not a string type"); |
| *no_add_attrs = true; |
| return false; |
| } |
| |
| /* We only know that we want a suitable string reference. */ |
| if (expected_format_type < 0) |
| return true; |
| |
| /* Now check that the arg matches the expected type. */ |
| is_char_ref = |
| (TYPE_MAIN_VARIANT (TREE_TYPE (ref)) == char_type_node); |
| |
| fmt_flags = format_flags (expected_format_type); |
| is_objc_sref = is_target_sref = false; |
| if (!is_char_ref) |
| is_objc_sref = objc_string_ref_type_p (ref); |
| |
| if (!(fmt_flags & FMT_FLAG_PARSE_ARG_CONVERT_EXTERNAL)) |
| { |
| if (is_char_ref) |
| return true; /* OK, we expected a char and found one. */ |
| else |
| { |
| /* We expected a char but found an extended string type. */ |
| if (is_objc_sref) |
| error ("found a %qs reference but the format argument should" |
| " be a string", format_name (gcc_objc_string_format_type)); |
| else |
| error ("found a %qT but the format argument should be a string", |
| ref); |
| *no_add_attrs = true; |
| return false; |
| } |
| } |
| |
| /* We expect a string object type as the format arg. */ |
| if (is_char_ref) |
| { |
| error ("format argument should be a %qs reference but" |
| " a string was found", format_name (expected_format_type)); |
| *no_add_attrs = true; |
| return false; |
| } |
| |
| /* We will assert that objective-c will support either its own string type |
| or the target-supplied variant. */ |
| if (!is_objc_sref) |
| is_target_sref = (*targetcm.string_object_ref_type_p) ((const_tree) ref); |
| |
| if (expected_format_type == (int) gcc_objc_string_format_type |
| && (is_objc_sref || is_target_sref)) |
| return true; |
| |
| /* We will allow a target string ref to match only itself. */ |
| if (first_target_format_type |
| && expected_format_type >= first_target_format_type |
| && is_target_sref) |
| return true; |
| else |
| { |
| error ("format argument should be a %qs reference", |
| format_name (expected_format_type)); |
| *no_add_attrs = true; |
| return false; |
| } |
| |
| gcc_unreachable (); |
| } |
| |
| /* Under the control of FLAGS, verify EXPR is a valid constant that |
| refers to a positional argument ARGNO having a string type (char* |
| or, for targets like Darwin, a pointer to struct CFString) to |
| a function type FNTYPE declared with attribute ATNAME. |
| If valid, store the constant's integer value in *VALUE and return |
| the value. |
| If VALIDATED_P is true assert the validation is successful. |
| Returns the converted constant value on success, null otherwise. */ |
| |
| static tree |
| get_constant (const_tree fntype, const_tree atname, tree expr, int argno, |
| unsigned HOST_WIDE_INT *value, int flags, bool validated_p) |
| { |
| /* Require the referenced argument to have a string type. For targets |
| like Darwin, also accept pointers to struct CFString. */ |
| if (tree val = positional_argument (fntype, atname, expr, STRING_CST, |
| argno, flags)) |
| { |
| *value = TREE_INT_CST_LOW (val); |
| return val; |
| } |
| |
| gcc_assert (!validated_p); |
| return NULL_TREE; |
| } |
| |
| /* Decode the arguments to a "format" attribute into a |
| function_format_info structure. It is already known that the list |
| is of the right length. If VALIDATED_P is true, then these |
| attributes have already been validated and must not be erroneous; |
| if false, it will give an error message. Returns true if the |
| attributes are successfully decoded, false otherwise. */ |
| |
| static bool |
| decode_format_attr (const_tree fntype, tree atname, tree args, |
| function_format_info *info, bool validated_p) |
| { |
| tree format_type_id = TREE_VALUE (args); |
| /* Note that TREE_VALUE (args) is changed in place below. Ditto |
| for the value of the next element on the list. */ |
| tree *format_num_expr = &TREE_VALUE (TREE_CHAIN (args)); |
| tree *first_arg_num_expr = &TREE_VALUE (TREE_CHAIN (TREE_CHAIN (args))); |
| |
| if (TREE_CODE (format_type_id) != IDENTIFIER_NODE) |
| { |
| gcc_assert (!validated_p); |
| error ("unrecognized format specifier"); |
| return false; |
| } |
| else |
| { |
| const char *p = IDENTIFIER_POINTER (format_type_id); |
| |
| info->format_type = decode_format_type (p, &info->is_raw); |
| |
| if (!c_dialect_objc () |
| && info->format_type == gcc_objc_string_format_type) |
| { |
| gcc_assert (!validated_p); |
| warning (OPT_Wformat_, "%qE is only allowed in Objective-C dialects", |
| format_type_id); |
| info->format_type = format_type_error; |
| return false; |
| } |
| |
| if (info->format_type == format_type_error) |
| { |
| gcc_assert (!validated_p); |
| warning (OPT_Wformat_, "%qE is an unrecognized format function type", |
| format_type_id); |
| return false; |
| } |
| } |
| |
| if (tree val = get_constant (fntype, atname, *format_num_expr, |
| 2, &info->format_num, 0, validated_p)) |
| *format_num_expr = val; |
| else |
| return false; |
| |
| if (tree val = get_constant (fntype, atname, *first_arg_num_expr, |
| 3, &info->first_arg_num, |
| (POSARG_ZERO | POSARG_ELLIPSIS), validated_p)) |
| *first_arg_num_expr = val; |
| else |
| return false; |
| |
| if (info->first_arg_num != 0 && info->first_arg_num <= info->format_num) |
| { |
| gcc_assert (!validated_p); |
| error ("format string argument follows the arguments to be formatted"); |
| return false; |
| } |
| |
| return true; |
| } |
| |
| /* Check a call to a format function against a parameter list. */ |
| |
| /* The C standard version C++ is treated as equivalent to |
| or inheriting from, for the purpose of format features supported. */ |
| #define CPLUSPLUS_STD_VER (cxx_dialect < cxx11 ? STD_C94 : STD_C99) |
| /* The C standard version we are checking formats against when pedantic. */ |
| #define C_STD_VER ((int) (c_dialect_cxx () \ |
| ? CPLUSPLUS_STD_VER \ |
| : (flag_isoc2x \ |
| ? STD_C2X \ |
| : (flag_isoc99 \ |
| ? STD_C99 \ |
| : (flag_isoc94 ? STD_C94 : STD_C89))))) |
| /* The name to give to the standard version we are warning about when |
| pedantic. FEATURE_VER is the version in which the feature warned out |
| appeared, which is higher than C_STD_VER. */ |
| #define C_STD_NAME(FEATURE_VER) (c_dialect_cxx () \ |
| ? (cxx_dialect < cxx11 ? "ISO C++98" \ |
| : "ISO C++11") \ |
| : ((FEATURE_VER) == STD_EXT \ |
| ? "ISO C" \ |
| : ((FEATURE_VER) == STD_C2X \ |
| ? "ISO C17" \ |
| : "ISO C90"))) |
| /* Adjust a C standard version, which may be STD_C9L, to account for |
| -Wno-long-long. Returns other standard versions unchanged. */ |
| #define ADJ_STD(VER) ((int) ((VER) == STD_C9L \ |
| ? (warn_long_long ? STD_C99 : STD_C89) \ |
| : (VER))) |
| |
| /* Enum describing the kind of specifiers present in the format and |
| requiring an argument. */ |
| enum format_specifier_kind { |
| CF_KIND_FORMAT, |
| CF_KIND_FIELD_WIDTH, |
| CF_KIND_FIELD_PRECISION |
| }; |
| |
| static const char *kind_descriptions[] = { |
| N_("format"), |
| N_("field width specifier"), |
| N_("field precision specifier") |
| }; |
| |
| /* Structure describing details of a type expected in format checking, |
| and the type to check against it. */ |
| struct format_wanted_type |
| { |
| /* The type wanted. */ |
| tree wanted_type; |
| /* The name of this type to use in diagnostics. */ |
| const char *wanted_type_name; |
| /* Should be type checked just for scalar width identity. */ |
| int scalar_identity_flag; |
| /* The level of indirection through pointers at which this type occurs. */ |
| int pointer_count; |
| /* Whether, when pointer_count is 1, to allow any character type when |
| pedantic, rather than just the character or void type specified. */ |
| int char_lenient_flag; |
| /* Whether the argument, dereferenced once, is written into and so the |
| argument must not be a pointer to a const-qualified type. */ |
| int writing_in_flag; |
| /* Whether the argument, dereferenced once, is read from and so |
| must not be a NULL pointer. */ |
| int reading_from_flag; |
| /* The kind of specifier that this type is used for. */ |
| enum format_specifier_kind kind; |
| /* The starting character of the specifier. This never includes the |
| initial percent sign. */ |
| const char *format_start; |
| /* The length of the specifier. */ |
| int format_length; |
| /* The actual parameter to check against the wanted type. */ |
| tree param; |
| /* The argument number of that parameter. */ |
| int arg_num; |
| /* The offset location of this argument with respect to the format |
| string location. */ |
| unsigned int offset_loc; |
| /* The next type to check for this format conversion, or NULL if none. */ |
| struct format_wanted_type *next; |
| }; |
| |
| /* Convenience macro for format_length_info meaning unused. */ |
| #define NO_FMT NULL, FMT_LEN_none, STD_C89 |
| |
| static const format_length_info printf_length_specs[] = |
| { |
| { "h", FMT_LEN_h, STD_C89, "hh", FMT_LEN_hh, STD_C99, 0 }, |
| { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C9L, 0 }, |
| { "q", FMT_LEN_ll, STD_EXT, NO_FMT, 0 }, |
| { "L", FMT_LEN_L, STD_C89, NO_FMT, 0 }, |
| { "z", FMT_LEN_z, STD_C99, NO_FMT, 0 }, |
| { "Z", FMT_LEN_z, STD_EXT, NO_FMT, 0 }, |
| { "t", FMT_LEN_t, STD_C99, NO_FMT, 0 }, |
| { "j", FMT_LEN_j, STD_C99, NO_FMT, 0 }, |
| { "H", FMT_LEN_H, STD_EXT, NO_FMT, 0 }, |
| { "D", FMT_LEN_D, STD_EXT, "DD", FMT_LEN_DD, STD_EXT, 0 }, |
| { NO_FMT, NO_FMT, 0 } |
| }; |
| |
| /* Length specifiers valid for asm_fprintf. */ |
| static const format_length_info asm_fprintf_length_specs[] = |
| { |
| { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C89, 0 }, |
| { "w", FMT_LEN_w, STD_C89, NO_FMT, 0 }, |
| { NO_FMT, NO_FMT, 0 } |
| }; |
| |
| /* Length specifiers valid for GCC diagnostics. */ |
| static const format_length_info gcc_diag_length_specs[] = |
| { |
| { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C89, 0 }, |
| { "w", FMT_LEN_w, STD_C89, NO_FMT, 0 }, |
| { NO_FMT, NO_FMT, 0 } |
| }; |
| |
| /* The custom diagnostics all accept the same length specifiers. */ |
| #define gcc_tdiag_length_specs gcc_diag_length_specs |
| #define gcc_cdiag_length_specs gcc_diag_length_specs |
| #define gcc_cxxdiag_length_specs gcc_diag_length_specs |
| #define gcc_dump_printf_length_specs gcc_diag_length_specs |
| |
| /* This differs from printf_length_specs only in that "Z" is not accepted. */ |
| static const format_length_info scanf_length_specs[] = |
| { |
| { "h", FMT_LEN_h, STD_C89, "hh", FMT_LEN_hh, STD_C99, 0 }, |
| { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C9L, 0 }, |
| { "q", FMT_LEN_ll, STD_EXT, NO_FMT, 0 }, |
| { "L", FMT_LEN_L, STD_C89, NO_FMT, 0 }, |
| { "z", FMT_LEN_z, STD_C99, NO_FMT, 0 }, |
| { "t", FMT_LEN_t, STD_C99, NO_FMT, 0 }, |
| { "j", FMT_LEN_j, STD_C99, NO_FMT, 0 }, |
| { "H", FMT_LEN_H, STD_EXT, NO_FMT, 0 }, |
| { "D", FMT_LEN_D, STD_EXT, "DD", FMT_LEN_DD, STD_EXT, 0 }, |
| { NO_FMT, NO_FMT, 0 } |
| }; |
| |
| |
| /* All tables for strfmon use STD_C89 everywhere, since -pedantic warnings |
| make no sense for a format type not part of any C standard version. */ |
| static const format_length_info strfmon_length_specs[] = |
| { |
| /* A GNU extension. */ |
| { "L", FMT_LEN_L, STD_C89, NO_FMT, 0 }, |
| { NO_FMT, NO_FMT, 0 } |
| }; |
| |
| |
| /* For now, the Fortran front-end routines only use l as length modifier. */ |
| static const format_length_info gcc_gfc_length_specs[] = |
| { |
| { "l", FMT_LEN_l, STD_C89, NO_FMT, 0 }, |
| { NO_FMT, NO_FMT, 0 } |
| }; |
| |
| |
| static const format_flag_spec printf_flag_specs[] = |
| { |
| { ' ', 0, 0, 0, N_("' ' flag"), N_("the ' ' printf flag"), STD_C89 }, |
| { '+', 0, 0, 0, N_("'+' flag"), N_("the '+' printf flag"), STD_C89 }, |
| { '#', 0, 0, 0, N_("'#' flag"), N_("the '#' printf flag"), STD_C89 }, |
| { '0', 0, 0, 0, N_("'0' flag"), N_("the '0' printf flag"), STD_C89 }, |
| { '-', 0, 0, 0, N_("'-' flag"), N_("the '-' printf flag"), STD_C89 }, |
| { '\'', 0, 0, 0, N_("''' flag"), N_("the ''' printf flag"), STD_EXT }, |
| { 'I', 0, 0, 0, N_("'I' flag"), N_("the 'I' printf flag"), STD_EXT }, |
| { 'w', 0, 0, 0, N_("field width"), N_("field width in printf format"), STD_C89 }, |
| { 'p', 0, 0, 0, N_("precision"), N_("precision in printf format"), STD_C89 }, |
| { 'L', 0, 0, 0, N_("length modifier"), N_("length modifier in printf format"), STD_C89 }, |
| { 0, 0, 0, 0, NULL, NULL, STD_C89 } |
| }; |
| |
| |
| static const format_flag_pair printf_flag_pairs[] = |
| { |
| { ' ', '+', 1, 0 }, |
| { '0', '-', 1, 0 }, |
| { '0', 'p', 1, 'i' }, |
| { 0, 0, 0, 0 } |
| }; |
| |
| static const format_flag_spec asm_fprintf_flag_specs[] = |
| { |
| { ' ', 0, 0, 0, N_("' ' flag"), N_("the ' ' printf flag"), STD_C89 }, |
| { '+', 0, 0, 0, N_("'+' flag"), N_("the '+' printf flag"), STD_C89 }, |
| { '#', 0, 0, 0, N_("'#' flag"), N_("the '#' printf flag"), STD_C89 }, |
| { '0', 0, 0, 0, N_("'0' flag"), N_("the '0' printf flag"), STD_C89 }, |
| { '-', 0, 0, 0, N_("'-' flag"), N_("the '-' printf flag"), STD_C89 }, |
| { 'w', 0, 0, 0, N_("field width"), N_("field width in printf format"), STD_C89 }, |
| { 'p', 0, 0, 0, N_("precision"), N_("precision in printf format"), STD_C89 }, |
| { 'L', 0, 0, 0, N_("length modifier"), N_("length modifier in printf format"), STD_C89 }, |
| { 0, 0, 0, 0, NULL, NULL, STD_C89 } |
| }; |
| |
| static const format_flag_pair asm_fprintf_flag_pairs[] = |
| { |
| { ' ', '+', 1, 0 }, |
| { '0', '-', 1, 0 }, |
| { '0', 'p', 1, 'i' }, |
| { 0, 0, 0, 0 } |
| }; |
| |
| static const format_flag_pair gcc_diag_flag_pairs[] = |
| { |
| { 0, 0, 0, 0 } |
| }; |
| |
| #define gcc_tdiag_flag_pairs gcc_diag_flag_pairs |
| #define gcc_cdiag_flag_pairs gcc_diag_flag_pairs |
| #define gcc_cxxdiag_flag_pairs gcc_diag_flag_pairs |
| #define gcc_gfc_flag_pairs gcc_diag_flag_pairs |
| #define gcc_dump_printf_flag_pairs gcc_diag_flag_pairs |
| |
| static const format_flag_spec gcc_diag_flag_specs[] = |
| { |
| { '+', 0, 0, 0, N_("'+' flag"), N_("the '+' printf flag"), STD_C89 }, |
| { '#', 0, 0, 0, N_("'#' flag"), N_("the '#' printf flag"), STD_C89 }, |
| { 'q', 0, 0, 1, N_("'q' flag"), N_("the 'q' diagnostic flag"), STD_C89 }, |
| { 'p', 0, 0, 0, N_("precision"), N_("precision in printf format"), STD_C89 }, |
| { 'L', 0, 0, 0, N_("length modifier"), N_("length modifier in printf format"), STD_C89 }, |
| { 0, 0, 0, 0, NULL, NULL, STD_C89 } |
| }; |
| |
| #define gcc_tdiag_flag_specs gcc_diag_flag_specs |
| #define gcc_cdiag_flag_specs gcc_diag_flag_specs |
| #define gcc_cxxdiag_flag_specs gcc_diag_flag_specs |
| #define gcc_gfc_flag_specs gcc_diag_flag_specs |
| #define gcc_dump_printf_flag_specs gcc_diag_flag_specs |
| |
| static const format_flag_spec scanf_flag_specs[] = |
| { |
| { '*', 0, 0, 0, N_("assignment suppression"), N_("the assignment suppression scanf feature"), STD_C89 }, |
| { 'a', 0, 0, 0, N_("'a' flag"), N_("the 'a' scanf flag"), STD_EXT }, |
| { 'm', 0, 0, 0, N_("'m' flag"), N_("the 'm' scanf flag"), STD_EXT }, |
| { 'w', 0, 0, 0, N_("field width"), N_("field width in scanf format"), STD_C89 }, |
| { 'L', 0, 0, 0, N_("length modifier"), N_("length modifier in scanf format"), STD_C89 }, |
| { '\'', 0, 0, 0, N_("''' flag"), N_("the ''' scanf flag"), STD_EXT }, |
| { 'I', 0, 0, 0, N_("'I' flag"), N_("the 'I' scanf flag"), STD_EXT }, |
| { 0, 0, 0, 0, NULL, NULL, STD_C89 } |
| }; |
| |
| |
| static const format_flag_pair scanf_flag_pairs[] = |
| { |
| { '*', 'L', 0, 0 }, |
| { 'a', 'm', 0, 0 }, |
| { 0, 0, 0, 0 } |
| }; |
| |
| |
| static const format_flag_spec strftime_flag_specs[] = |
| { |
| { '_', 0, 0, 0, N_("'_' flag"), N_("the '_' strftime flag"), STD_EXT }, |
| { '-', 0, 0, 0, N_("'-' flag"), N_("the '-' strftime flag"), STD_EXT }, |
| { '0', 0, 0, 0, N_("'0' flag"), N_("the '0' strftime flag"), STD_EXT }, |
| { '^', 0, 0, 0, N_("'^' flag"), N_("the '^' strftime flag"), STD_EXT }, |
| { '#', 0, 0, 0, N_("'#' flag"), N_("the '#' strftime flag"), STD_EXT }, |
| { 'w', 0, 0, 0, N_("field width"), N_("field width in strftime format"), STD_EXT }, |
| { 'E', 0, 0, 0, N_("'E' modifier"), N_("the 'E' strftime modifier"), STD_C99 }, |
| { 'O', 0, 0, 0, N_("'O' modifier"), N_("the 'O' strftime modifier"), STD_C99 }, |
| { 'O', 'o', 0, 0, NULL, N_("the 'O' modifier"), STD_EXT }, |
| { 'O', 'p', 0, 0, NULL, N_("the 'O' modifier"), STD_C2X }, |
| { 0, 0, 0, 0, NULL, NULL, STD_C89 } |
| }; |
| |
| |
| static const format_flag_pair strftime_flag_pairs[] = |
| { |
| { 'E', 'O', 0, 0 }, |
| { '_', '-', 0, 0 }, |
| { '_', '0', 0, 0 }, |
| { '-', '0', 0, 0 }, |
| { '^', '#', 0, 0 }, |
| { 0, 0, 0, 0 } |
| }; |
| |
| |
| static const format_flag_spec strfmon_flag_specs[] = |
| { |
| { '=', 0, 1, 0, N_("fill character"), N_("fill character in strfmon format"), STD_C89 }, |
| { '^', 0, 0, 0, N_("'^' flag"), N_("the '^' strfmon flag"), STD_C89 }, |
| { '+', 0, 0, 0, N_("'+' flag"), N_("the '+' strfmon flag"), STD_C89 }, |
| { '(', 0, 0, 0, N_("'(' flag"), N_("the '(' strfmon flag"), STD_C89 }, |
| { '!', 0, 0, 0, N_("'!' flag"), N_("the '!' strfmon flag"), STD_C89 }, |
| { '-', 0, 0, 0, N_("'-' flag"), N_("the '-' strfmon flag"), STD_C89 }, |
| { 'w', 0, 0, 0, N_("field width"), N_("field width in strfmon format"), STD_C89 }, |
| { '#', 0, 0, 0, N_("left precision"), N_("left precision in strfmon format"), STD_C89 }, |
| { 'p', 0, 0, 0, N_("right precision"), N_("right precision in strfmon format"), STD_C89 }, |
| { 'L', 0, 0, 0, N_("length modifier"), N_("length modifier in strfmon format"), STD_C89 }, |
| { 0, 0, 0, 0, NULL, NULL, STD_C89 } |
| }; |
| |
| static const format_flag_pair strfmon_flag_pairs[] = |
| { |
| { '+', '(', 0, 0 }, |
| { 0, 0, 0, 0 } |
| }; |
| |
| |
| static const format_char_info print_char_table[] = |
| { |
| /* C89 conversion specifiers. */ |
| { "di", 0, STD_C89, { T89_I, T99_SC, T89_S, T89_L, T9L_LL, TEX_LL, T99_SST, T99_PD, T99_IM, BADLEN, BADLEN, BADLEN }, "-wp0 +'I", "i", NULL }, |
| { "oxX", 0, STD_C89, { T89_UI, T99_UC, T89_US, T89_UL, T9L_ULL, TEX_ULL, T99_ST, T99_UPD, T99_UIM, BADLEN, BADLEN, BADLEN }, "-wp0#", "i", NULL }, |
| { "u", 0, STD_C89, { T89_UI, T99_UC, T89_US, T89_UL, T9L_ULL, TEX_ULL, T99_ST, T99_UPD, T99_UIM, BADLEN, BADLEN, BADLEN }, "-wp0'I", "i", NULL }, |
| { "fgG", 0, STD_C89, { T89_D, BADLEN, BADLEN, T99_D, BADLEN, T89_LD, BADLEN, BADLEN, BADLEN, TEX_D32, TEX_D64, TEX_D128 }, "-wp0 +#'I", "", NULL }, |
| { "eE", 0, STD_C89, { T89_D, BADLEN, BADLEN, T99_D, BADLEN, T89_LD, BADLEN, BADLEN, BADLEN, TEX_D32, TEX_D64, TEX_D128 }, "-wp0 +#I", "", NULL }, |
| { "c", 0, STD_C89, { T89_I, BADLEN, BADLEN, T94_WI, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-w", "", NULL }, |
| { "s", 1, STD_C89, { T89_C, BADLEN, BADLEN, T94_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp", "cR", NULL }, |
| { "p", 1, STD_C89, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-w", "c", NULL }, |
| { "n", 1, STD_C89, { T89_I, T99_SC, T89_S, T89_L, T9L_LL, BADLEN, T99_SST, T99_PD, T99_IM, BADLEN, BADLEN, BADLEN }, "", "W", NULL }, |
| /* C99 conversion specifiers. */ |
| { "F", 0, STD_C99, { T99_D, BADLEN, BADLEN, T99_D, BADLEN, T99_LD, BADLEN, BADLEN, BADLEN, TEX_D32, TEX_D64, TEX_D128 }, "-wp0 +#'I", "", NULL }, |
| { "aA", 0, STD_C99, { T99_D, BADLEN, BADLEN, T99_D, BADLEN, T99_LD, BADLEN, BADLEN, BADLEN, TEX_D32, TEX_D64, TEX_D128 }, "-wp0 +#", "", NULL }, |
| /* X/Open conversion specifiers. */ |
| { "C", 0, STD_EXT, { TEX_WI, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-w", "", NULL }, |
| { "S", 1, STD_EXT, { TEX_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp", "R", NULL }, |
| /* GNU conversion specifiers. */ |
| { "m", 0, STD_EXT, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp", "", NULL }, |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info asm_fprintf_char_table[] = |
| { |
| /* C89 conversion specifiers. */ |
| { "di", 0, STD_C89, { T89_I, BADLEN, BADLEN, T89_L, T9L_LL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0 +", "i", NULL }, |
| { "oxX", 0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0#", "i", NULL }, |
| { "u", 0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0", "i", NULL }, |
| { "c", 0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-w", "", NULL }, |
| { "s", 1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp", "cR", NULL }, |
| |
| /* asm_fprintf conversion specifiers. */ |
| { "O", 0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| { "R", 0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| { "I", 0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| { "L", 0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| { "U", 0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| { "r", 0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "", NULL }, |
| { "z", 0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| { "@", 0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| /* GCC-specific format_char_info arrays. */ |
| |
| /* The conversion specifiers implemented within pp_format, and thus supported |
| by all pretty_printer instances within GCC. */ |
| |
| #define PP_FORMAT_CHAR_TABLE \ |
| { "di", 0, STD_C89, { T89_I, BADLEN, BADLEN, T89_L, T9L_LL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, \ |
| { "ox", 0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, \ |
| { "u", 0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, \ |
| { "c", 0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, \ |
| { "s", 1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "pq", "cR", NULL }, \ |
| { "p", 1, STD_C89, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "c", NULL }, \ |
| { "r", 1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "//cR", NULL }, \ |
| { "@", 1, STD_C89, { T_EVENT_PTR, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, \ |
| { "<", 0, STD_C89, NOARGUMENTS, "", "<", NULL }, \ |
| { ">", 0, STD_C89, NOARGUMENTS, "", ">", NULL }, \ |
| { "'" , 0, STD_C89, NOARGUMENTS, "", "", NULL }, \ |
| { "{", 1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "cR", NULL }, \ |
| { "}", 0, STD_C89, NOARGUMENTS, "", "", NULL }, \ |
| { "R", 0, STD_C89, NOARGUMENTS, "", "\\", NULL }, \ |
| { "m", 0, STD_C89, NOARGUMENTS, "q", "", NULL }, \ |
| { "Z", 1, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "", &gcc_diag_char_table[0] } |
| |
| static const format_char_info gcc_diag_char_table[] = |
| { |
| /* The conversion specifiers implemented within pp_format. */ |
| PP_FORMAT_CHAR_TABLE, |
| |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info gcc_tdiag_char_table[] = |
| { |
| /* The conversion specifiers implemented within pp_format. */ |
| PP_FORMAT_CHAR_TABLE, |
| |
| /* Custom conversion specifiers implemented by default_tree_printer. */ |
| |
| /* These will require a "tree" at runtime. */ |
| { "DFTV", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "'", NULL }, |
| { "E", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "", NULL }, |
| { "K", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| /* G requires a "gimple*" argument at runtime. */ |
| { "G", 1, STD_C89, { T89_G, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info gcc_cdiag_char_table[] = |
| { |
| /* The conversion specifiers implemented within pp_format. */ |
| PP_FORMAT_CHAR_TABLE, |
| |
| /* Custom conversion specifiers implemented by c_tree_printer. */ |
| |
| /* These will require a "tree" at runtime. */ |
| { "DFTV", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "'", NULL }, |
| { "E", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "", NULL }, |
| { "K", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| /* G requires a "gimple*" argument at runtime. */ |
| { "G", 1, STD_C89, { T89_G, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| { "v", 0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q#", "", NULL }, |
| |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info gcc_cxxdiag_char_table[] = |
| { |
| /* The conversion specifiers implemented within pp_format. */ |
| PP_FORMAT_CHAR_TABLE, |
| |
| /* Custom conversion specifiers implemented by cp_printer. */ |
| |
| /* These will require a "tree" at runtime. */ |
| { "ADFHISTVX",1,STD_C89,{ T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+#", "'", NULL }, |
| { "E", 1,STD_C89,{ T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+#", "", NULL }, |
| { "K", 1, STD_C89,{ T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| /* G requires a "gimple*" argument at runtime. */ |
| { "G", 1, STD_C89,{ T89_G, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| /* These accept either an 'int' or an 'enum tree_code' (which is handled as an 'int'.) */ |
| { "CLOPQ",0,STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, |
| |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info gcc_gfc_char_table[] = |
| { |
| /* C89 conversion specifiers. */ |
| { "di", 0, STD_C89, { T89_I, BADLEN, BADLEN, T89_L, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, |
| { "u", 0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, |
| { "c", 0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, |
| { "s", 1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "cR", NULL }, |
| |
| /* gfc conversion specifiers. */ |
| |
| { "C", 0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| |
| /* This will require a "locus" at runtime. */ |
| { "L", 0, STD_C89, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "R", NULL }, |
| |
| /* These will require nothing. */ |
| { "<>",0, STD_C89, NOARGUMENTS, "", "", NULL }, |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info gcc_dump_printf_char_table[] = |
| { |
| /* The conversion specifiers implemented within pp_format. */ |
| PP_FORMAT_CHAR_TABLE, |
| |
| /* Custom conversion specifiers implemented by dump_pretty_printer. */ |
| |
| /* E and G require a "gimple *" argument at runtime. */ |
| { "EG", 1, STD_C89, { T89_G, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| /* C requires a "cgraph_node *" argument at runtime. */ |
| { "C", 1, STD_C89, { T_CGRAPH_NODE, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| /* T requires a "tree" at runtime. */ |
| { "T", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| /* %f requires a "double"; it doesn't support modifiers. */ |
| { "f", 0, STD_C89, { T89_D, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, |
| |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info scan_char_table[] = |
| { |
| /* C89 conversion specifiers. */ |
| { "di", 1, STD_C89, { T89_I, T99_SC, T89_S, T89_L, T9L_LL, TEX_LL, T99_SST, T99_PD, T99_IM, BADLEN, BADLEN, BADLEN }, "*w'I", "W", NULL }, |
| { "u", 1, STD_C89, { T89_UI, T99_UC, T89_US, T89_UL, T9L_ULL, TEX_ULL, T99_ST, T99_UPD, T99_UIM, BADLEN, BADLEN, BADLEN }, "*w'I", "W", NULL }, |
| { "oxX", 1, STD_C89, { T89_UI, T99_UC, T89_US, T89_UL, T9L_ULL, TEX_ULL, T99_ST, T99_UPD, T99_UIM, BADLEN, BADLEN, BADLEN }, "*w", "W", NULL }, |
| { "efgEG", 1, STD_C89, { T89_F, BADLEN, BADLEN, T89_D, BADLEN, T89_LD, BADLEN, BADLEN, BADLEN, TEX_D32, TEX_D64, TEX_D128 }, "*w'", "W", NULL }, |
| { "c", 1, STD_C89, { T89_C, BADLEN, BADLEN, T94_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*mw", "cW", NULL }, |
| { "s", 1, STD_C89, { T89_C, BADLEN, BADLEN, T94_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*amw", "cW", NULL }, |
| { "[", 1, STD_C89, { T89_C, BADLEN, BADLEN, T94_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*amw", "cW[", NULL }, |
| { "p", 2, STD_C89, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*w", "W", NULL }, |
| { "n", 1, STD_C89, { T89_I, T99_SC, T89_S, T89_L, T9L_LL, BADLEN, T99_SST, T99_PD, T99_IM, BADLEN, BADLEN, BADLEN }, "", "W", NULL }, |
| /* C99 conversion specifiers. */ |
| { "F", 1, STD_C99, { T99_F, BADLEN, BADLEN, T99_D, BADLEN, T99_LD, BADLEN, BADLEN, BADLEN, TEX_D32, TEX_D64, TEX_D128 }, "*w'", "W", NULL }, |
| { "aA", 1, STD_C99, { T99_F, BADLEN, BADLEN, T99_D, BADLEN, T99_LD, BADLEN, BADLEN, BADLEN, TEX_D32, TEX_D64, TEX_D128 }, "*w'", "W", NULL }, |
| /* X/Open conversion specifiers. */ |
| { "C", 1, STD_EXT, { TEX_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*mw", "W", NULL }, |
| { "S", 1, STD_EXT, { TEX_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*amw", "W", NULL }, |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info time_char_table[] = |
| { |
| /* C89 conversion specifiers. */ |
| { "AZa", 0, STD_C89, NOLENGTHS, "^#", "", NULL }, |
| { "Bb", 0, STD_C89, NOLENGTHS, "O^#", "p", NULL }, |
| { "cx", 0, STD_C89, NOLENGTHS, "E", "3", NULL }, |
| { "HIMSUWdmw", 0, STD_C89, NOLENGTHS, "-_0Ow", "", NULL }, |
| { "j", 0, STD_C89, NOLENGTHS, "-_0Ow", "o", NULL }, |
| { "p", 0, STD_C89, NOLENGTHS, "#", "", NULL }, |
| { "X", 0, STD_C89, NOLENGTHS, "E", "", NULL }, |
| { "y", 0, STD_C89, NOLENGTHS, "EO-_0w", "4", NULL }, |
| { "Y", 0, STD_C89, NOLENGTHS, "-_0EOw", "o", NULL }, |
| { "%", 0, STD_C89, NOLENGTHS, "", "", NULL }, |
| /* C99 conversion specifiers. */ |
| { "C", 0, STD_C99, NOLENGTHS, "-_0EOw", "o", NULL }, |
| { "D", 0, STD_C99, NOLENGTHS, "", "2", NULL }, |
| { "eVu", 0, STD_C99, NOLENGTHS, "-_0Ow", "", NULL }, |
| { "FRTnrt", 0, STD_C99, NOLENGTHS, "", "", NULL }, |
| { "g", 0, STD_C99, NOLENGTHS, "O-_0w", "2o", NULL }, |
| { "G", 0, STD_C99, NOLENGTHS, "-_0Ow", "o", NULL }, |
| { "h", 0, STD_C99, NOLENGTHS, "^#", "", NULL }, |
| { "z", 0, STD_C99, NOLENGTHS, "O", "o", NULL }, |
| /* GNU conversion specifiers. */ |
| { "kls", 0, STD_EXT, NOLENGTHS, "-_0Ow", "", NULL }, |
| { "P", 0, STD_EXT, NOLENGTHS, "", "", NULL }, |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| static const format_char_info monetary_char_table[] = |
| { |
| { "in", 0, STD_C89, { T89_D, BADLEN, BADLEN, BADLEN, BADLEN, T89_LD, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "=^+(!-w#p", "", NULL }, |
| { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } |
| }; |
| |
| /* This must be in the same order as enum format_type. */ |
| static const format_kind_info format_types_orig[] = |
| { |
| { "gnu_printf", printf_length_specs, print_char_table, " +#0-'I", NULL, |
| printf_flag_specs, printf_flag_pairs, |
| FMT_FLAG_ARG_CONVERT|FMT_FLAG_DOLLAR_MULTIPLE|FMT_FLAG_USE_DOLLAR|FMT_FLAG_EMPTY_PREC_OK, |
| 'w', 0, 'p', 0, 'L', 0, |
| &integer_type_node, &integer_type_node |
| }, |
| { "asm_fprintf", asm_fprintf_length_specs, asm_fprintf_char_table, " +#0-", NULL, |
| asm_fprintf_flag_specs, asm_fprintf_flag_pairs, |
| FMT_FLAG_ARG_CONVERT|FMT_FLAG_EMPTY_PREC_OK, |
| 'w', 0, 'p', 0, 'L', 0, |
| NULL, NULL |
| }, |
| { "gcc_diag", gcc_diag_length_specs, gcc_diag_char_table, "q+#", NULL, |
| gcc_diag_flag_specs, gcc_diag_flag_pairs, |
| FMT_FLAG_ARG_CONVERT, |
| 0, 0, 'p', 0, 'L', 0, |
| NULL, &integer_type_node |
| }, |
| { "gcc_tdiag", gcc_tdiag_length_specs, gcc_tdiag_char_table, "q+#", NULL, |
| gcc_tdiag_flag_specs, gcc_tdiag_flag_pairs, |
| FMT_FLAG_ARG_CONVERT, |
| 0, 0, 'p', 0, 'L', 0, |
| NULL, &integer_type_node |
| }, |
| { "gcc_cdiag", gcc_cdiag_length_specs, gcc_cdiag_char_table, "q+#", NULL, |
| gcc_cdiag_flag_specs, gcc_cdiag_flag_pairs, |
| FMT_FLAG_ARG_CONVERT, |
| 0, 0, 'p', 0, 'L', 0, |
| NULL, &integer_type_node |
| }, |
| { "gcc_cxxdiag", gcc_cxxdiag_length_specs, gcc_cxxdiag_char_table, "q+#", NULL, |
| gcc_cxxdiag_flag_specs, gcc_cxxdiag_flag_pairs, |
| FMT_FLAG_ARG_CONVERT, |
| 0, 0, 'p', 0, 'L', 0, |
| NULL, &integer_type_node |
| }, |
| { "gcc_gfc", gcc_gfc_length_specs, gcc_gfc_char_table, "q+#", NULL, |
| gcc_gfc_flag_specs, gcc_gfc_flag_pairs, |
| FMT_FLAG_ARG_CONVERT, |
| 0, 0, 0, 0, 0, 0, |
| NULL, NULL |
| }, |
| { "gcc_dump_printf", gcc_dump_printf_length_specs, |
| gcc_dump_printf_char_table, "q+#", NULL, |
| gcc_dump_printf_flag_specs, gcc_dump_printf_flag_pairs, |
| FMT_FLAG_ARG_CONVERT, |
| 0, 0, 'p', 0, 'L', 0, |
| NULL, &integer_type_node |
| }, |
| { "NSString", NULL, NULL, NULL, NULL, |
| NULL, NULL, |
| FMT_FLAG_ARG_CONVERT|FMT_FLAG_PARSE_ARG_CONVERT_EXTERNAL, 0, 0, 0, 0, 0, 0, |
| NULL, NULL |
| }, |
| { "gnu_scanf", scanf_length_specs, scan_char_table, "*'I", NULL, |
| scanf_flag_specs, scanf_flag_pairs, |
| FMT_FLAG_ARG_CONVERT|FMT_FLAG_SCANF_A_KLUDGE|FMT_FLAG_USE_DOLLAR|FMT_FLAG_ZERO_WIDTH_BAD|FMT_FLAG_DOLLAR_GAP_POINTER_OK, |
| 'w', 0, 0, '*', 'L', 'm', |
| NULL, NULL |
| }, |
| { "gnu_strftime", NULL, time_char_table, "_-0^#", "EO", |
| strftime_flag_specs, strftime_flag_pairs, |
| FMT_FLAG_FANCY_PERCENT_OK, 'w', 0, 0, 0, 0, 0, |
| NULL, NULL |
| }, |
| { "gnu_strfmon", strfmon_length_specs, monetary_char_table, "=^+(!-", NULL, |
| strfmon_flag_specs, strfmon_flag_pairs, |
| FMT_FLAG_ARG_CONVERT, 'w', '#', 'p', 0, 'L', 0, |
| NULL, NULL |
| } |
| }; |
| |
| /* This layer of indirection allows GCC to reassign format_types with |
| new data if necessary, while still allowing the original data to be |
| const. */ |
| static const format_kind_info *format_types = format_types_orig; |
| /* We can modify this one. We also add target-specific format types |
| to the end of the array. */ |
| static format_kind_info *dynamic_format_types; |
| |
| static int n_format_types = ARRAY_SIZE (format_types_orig); |
| |
| /* Structure detailing the results of checking a format function call |
| where the format expression may be a conditional expression with |
| many leaves resulting from nested conditional expressions. */ |
| struct format_check_results |
| { |
| /* Number of leaves of the format argument that could not be checked |
| as they were not string literals. */ |
| int number_non_literal; |
| /* Number of leaves of the format argument that were null pointers or |
| string literals, but had extra format arguments. */ |
| int number_extra_args; |
| location_t extra_arg_loc; |
| /* Number of leaves of the format argument that were null pointers or |
| string literals, but had extra format arguments and used $ operand |
| numbers. */ |
| int number_dollar_extra_args; |
| /* Number of leaves of the format argument that were wide string |
| literals. */ |
| int number_wide; |
| /* Number of leaves of the format argument that are not array of "char". */ |
| int number_non_char; |
| /* Number of leaves of the format argument that were empty strings. */ |
| int number_empty; |
| /* Number of leaves of the format argument that were unterminated |
| strings. */ |
| int number_unterminated; |
| /* Number of leaves of the format argument that were not counted above. */ |
| int number_other; |
| /* Location of the format string. */ |
| location_t format_string_loc; |
| }; |
| |
| struct format_check_context |
| { |
| format_check_results *res; |
| function_format_info *info; |
| tree params; |
| vec<location_t> *arglocs; |
| }; |
| |
| /* Return the format name (as specified in the original table) for the format |
| type indicated by format_num. */ |
| static const char * |
| format_name (int format_num) |
| { |
| if (format_num >= 0 && format_num < n_format_types) |
| return format_types[format_num].name; |
| gcc_unreachable (); |
| } |
| |
| /* Return the format flags (as specified in the original table) for the format |
| type indicated by format_num. */ |
| static int |
| format_flags (int format_num) |
| { |
| if (format_num >= 0 && format_num < n_format_types) |
| return format_types[format_num].flags; |
| gcc_unreachable (); |
| } |
| |
| static void check_format_info (function_format_info *, tree, |
| vec<location_t> *); |
| static void check_format_arg (void *, tree, unsigned HOST_WIDE_INT); |
| static void check_format_info_main (format_check_results *, |
| function_format_info *, const char *, |
| location_t, tree, |
| int, tree, |
| unsigned HOST_WIDE_INT, |
| object_allocator<format_wanted_type> &, |
| vec<location_t> *); |
| |
| static void init_dollar_format_checking (int, tree); |
| static int maybe_read_dollar_number (const char **, int, |
| tree, tree *, const format_kind_info *); |
| static bool avoid_dollar_number (const char *); |
| static void finish_dollar_format_checking (format_check_results *, int); |
| |
| static const format_flag_spec *get_flag_spec (const format_flag_spec *, |
| int, const char *); |
| |
| static void check_format_types (const substring_loc &fmt_loc, |
| format_wanted_type *, |
| const format_kind_info *fki, |
| int offset_to_type_start, |
| char conversion_char, |
| vec<location_t> *arglocs); |
| static void format_type_warning (const substring_loc &fmt_loc, |
| location_t param_loc, |
| format_wanted_type *, tree, |
| tree, |
| const format_kind_info *fki, |
| int offset_to_type_start, |
| char conversion_char); |
| |
| /* Decode a format type from a string, returning the type, or |
| format_type_error if not valid, in which case the caller should |
| print an error message. On success, when IS_RAW is non-null, set |
| *IS_RAW when the format type corresponds to a GCC "raw" diagnostic |
| formatting function and clear it otherwise. */ |
| static format_type |
| decode_format_type (const char *s, bool *is_raw /* = NULL */) |
| { |
| bool is_raw_buf; |
| |
| if (!is_raw) |
| is_raw = &is_raw_buf; |
| |
| *is_raw = false; |
| |
| s = convert_format_name_to_system_name (s); |
| |
| size_t slen = strlen (s); |
| for (int i = 0; i < n_format_types; i++) |
| { |
| /* Check for a match with no underscores. */ |
| if (!strcmp (s, format_types[i].name)) |
| return static_cast<format_type> (i); |
| |
| /* Check for leading and trailing underscores. */ |
| size_t alen = strlen (format_types[i].name); |
| if (slen == alen + 4 && s[0] == '_' && s[1] == '_' |
| && s[slen - 1] == '_' && s[slen - 2] == '_' |
| && !strncmp (s + 2, format_types[i].name, alen)) |
| return static_cast<format_type>(i); |
| |
| /* Check for the "_raw" suffix and no leading underscores. */ |
| if (slen == alen + 4 |
| && !strncmp (s, format_types[i].name, alen) |
| && !strcmp (s + alen, "_raw")) |
| { |
| *is_raw = true; |
| return static_cast<format_type>(i); |
| } |
| |
| /* Check for the "_raw__" suffix and leading underscores. */ |
| if (slen == alen + 8 && s[0] == '_' && s[1] == '_' |
| && !strncmp (s + 2, format_types[i].name, alen) |
| && !strcmp (s + 2 + alen, "_raw__")) |
| { |
| *is_raw = true; |
| return static_cast<format_type>(i); |
| } |
| } |
| |
| return format_type_error; |
| } |
| |
| |
| /* Check the argument list of a call to printf, scanf, etc. |
| ATTRS are the attributes on the function type. There are NARGS argument |
| values in the array ARGARRAY. |
| Also, if -Wsuggest-attribute=format, |
| warn for calls to vprintf or vscanf in functions with no such format |
| attribute themselves. */ |
| |
| void |
| check_function_format (const_tree fntype, tree attrs, int nargs, |
| tree *argarray, vec<location_t> *arglocs) |
| { |
| tree a; |
| |
| tree atname = get_identifier ("format"); |
| |
| /* See if this function has any format attributes. */ |
| for (a = attrs; a; a = TREE_CHAIN (a)) |
| { |
| if (is_attribute_p ("format", get_attribute_name (a))) |
| { |
| /* Yup; check it. */ |
| function_format_info info; |
| decode_format_attr (fntype, atname, TREE_VALUE (a), &info, |
| /*validated=*/true); |
| if (warn_format) |
| { |
| /* FIXME: Rewrite all the internal functions in this file |
| to use the ARGARRAY directly instead of constructing this |
| temporary list. */ |
| tree params = NULL_TREE; |
| int i; |
| for (i = nargs - 1; i >= 0; i--) |
| params = tree_cons (NULL_TREE, argarray[i], params); |
| check_format_info (&info, params, arglocs); |
| } |
| |
| /* Attempt to detect whether the current function might benefit |
| from the format attribute if the called function is decorated |
| with it. Avoid using calls with string literal formats for |
| guidance since those are unlikely to be viable candidates. */ |
| if (warn_suggest_attribute_format |
| && current_function_decl != NULL_TREE |
| && info.first_arg_num == 0 |
| && (format_types[info.format_type].flags |
| & (int) FMT_FLAG_ARG_CONVERT) |
| /* c_strlen will fail for a function parameter but succeed |
| for a literal or constant array. */ |
| && !c_strlen (argarray[info.format_num - 1], 1)) |
| { |
| tree c; |
| for (c = TYPE_ATTRIBUTES (TREE_TYPE (current_function_decl)); |
| c; |
| c = TREE_CHAIN (c)) |
| if (is_attribute_p ("format", TREE_PURPOSE (c)) |
| && (decode_format_type (IDENTIFIER_POINTER |
| (TREE_VALUE (TREE_VALUE (c)))) |
| == info.format_type)) |
| break; |
| if (c == NULL_TREE) |
| { |
| /* Check if the current function has a parameter to which |
| the format attribute could be attached; if not, it |
| can't be a candidate for a format attribute, despite |
| the vprintf-like or vscanf-like call. */ |
| tree args; |
| for (args = DECL_ARGUMENTS (current_function_decl); |
| args != 0; |
| args = DECL_CHAIN (args)) |
| { |
| if (TREE_CODE (TREE_TYPE (args)) == POINTER_TYPE |
| && (TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (args))) |
| == char_type_node)) |
| break; |
| } |
| if (args != 0) |
| warning (OPT_Wsuggest_attribute_format, "function %qD " |
| "might be a candidate for %qs format attribute", |
| current_function_decl, |
| format_types[info.format_type].name); |
| } |
| } |
| } |
| } |
| } |
| |
| |
| /* Variables used by the checking of $ operand number formats. */ |
| static char *dollar_arguments_used = NULL; |
| static char *dollar_arguments_pointer_p = NULL; |
| static int dollar_arguments_alloc = 0; |
| static int dollar_arguments_count; |
| static int dollar_first_arg_num; |
| static int dollar_max_arg_used; |
| static int dollar_format_warned; |
| |
| /* Initialize the checking for a format string that may contain $ |
| parameter number specifications; we will need to keep track of whether |
| each parameter has been used. FIRST_ARG_NUM is the number of the first |
| argument that is a parameter to the format, or 0 for a vprintf-style |
| function; PARAMS is the list of arguments starting at this argument. */ |
| |
| static void |
| init_dollar_format_checking (int first_arg_num, tree params) |
| { |
| tree oparams = params; |
| |
| dollar_first_arg_num = first_arg_num; |
| dollar_arguments_count = 0; |
| dollar_max_arg_used = 0; |
| dollar_format_warned = 0; |
| if (first_arg_num > 0) |
| { |
| while (params) |
| { |
| dollar_arguments_count++; |
| params = TREE_CHAIN (params); |
| } |
| } |
| if (dollar_arguments_alloc < dollar_arguments_count) |
| { |
| free (dollar_arguments_used); |
| free (dollar_arguments_pointer_p); |
| dollar_arguments_alloc = dollar_arguments_count; |
| dollar_arguments_used = XNEWVEC (char, dollar_arguments_alloc); |
| dollar_arguments_pointer_p = XNEWVEC (char, dollar_arguments_alloc); |
| } |
| if (dollar_arguments_alloc) |
| { |
| memset (dollar_arguments_used, 0, dollar_arguments_alloc); |
| if (first_arg_num > 0) |
| { |
| int i = 0; |
| params = oparams; |
| while (params) |
| { |
| dollar_arguments_pointer_p[i] = (TREE_CODE (TREE_TYPE (TREE_VALUE (params))) |
| == POINTER_TYPE); |
| params = TREE_CHAIN (params); |
| i++; |
| } |
| } |
| } |
| } |
| |
| |
| /* Look for a decimal number followed by a $ in *FORMAT. If DOLLAR_NEEDED |
| is set, it is an error if one is not found; otherwise, it is OK. If |
| such a number is found, check whether it is within range and mark that |
| numbered operand as being used for later checking. Returns the operand |
| number if found and within range, zero if no such number was found and |
| this is OK, or -1 on error. PARAMS points to the first operand of the |
| format; PARAM_PTR is made to point to the parameter referred to. If |
| a $ format is found, *FORMAT is updated to point just after it. */ |
| |
| static int |
| maybe_read_dollar_number (const char **format, |
| int dollar_needed, tree params, tree *param_ptr, |
| const format_kind_info *fki) |
| { |
| int argnum; |
| int overflow_flag; |
| const char *fcp = *format; |
| if (!ISDIGIT (*fcp)) |
| { |
| if (dollar_needed) |
| { |
| warning (OPT_Wformat_, "missing $ operand number in format"); |
| return -1; |
| } |
| else |
| return 0; |
| } |
| argnum = 0; |
| overflow_flag = 0; |
| while (ISDIGIT (*fcp)) |
| { |
| HOST_WIDE_INT nargnum |
| = HOST_WIDE_INT_UC (10) * argnum + (*fcp - '0'); |
| if ((int) nargnum != nargnum) |
| overflow_flag = 1; |
| argnum = nargnum; |
| fcp++; |
| } |
| if (*fcp != '$') |
| { |
| if (dollar_needed) |
| { |
| warning (OPT_Wformat_, "missing $ operand number in format"); |
| return -1; |
| } |
| else |
| return 0; |
| } |
| *format = fcp + 1; |
| if (pedantic && !dollar_format_warned) |
| { |
| warning (OPT_Wformat_, "%s does not support %%n$ operand number formats", |
| C_STD_NAME (STD_EXT)); |
| dollar_format_warned = 1; |
| } |
| if (overflow_flag || argnum == 0 |
| || (dollar_first_arg_num && argnum > dollar_arguments_count)) |
| { |
| warning (OPT_Wformat_, "operand number out of range in format"); |
| return -1; |
| } |
| if (argnum > dollar_max_arg_used) |
| dollar_max_arg_used = argnum; |
| /* For vprintf-style functions we may need to allocate more memory to |
| track which arguments are used. */ |
| while (dollar_arguments_alloc < dollar_max_arg_used) |
| { |
| int nalloc; |
| nalloc = 2 * dollar_arguments_alloc + 16; |
| dollar_arguments_used = XRESIZEVEC (char, dollar_arguments_used, |
| nalloc); |
| dollar_arguments_pointer_p = XRESIZEVEC (char, dollar_arguments_pointer_p, |
| nalloc); |
| memset (dollar_arguments_used + dollar_arguments_alloc, 0, |
| nalloc - dollar_arguments_alloc); |
| dollar_arguments_alloc = nalloc; |
| } |
| if (!(fki->flags & (int) FMT_FLAG_DOLLAR_MULTIPLE) |
| && dollar_arguments_used[argnum - 1] == 1) |
| { |
| dollar_arguments_used[argnum - 1] = 2; |
| warning (OPT_Wformat_, "format argument %d used more than once in %s format", |
| argnum, fki->name); |
| } |
| else |
| dollar_arguments_used[argnum - 1] = 1; |
| if (dollar_first_arg_num) |
| { |
| int i; |
| *param_ptr = params; |
| for (i = 1; i < argnum && *param_ptr != 0; i++) |
| *param_ptr = TREE_CHAIN (*param_ptr); |
| |
| /* This case shouldn't be caught here. */ |
| gcc_assert (*param_ptr); |
| } |
| else |
| *param_ptr = 0; |
| return argnum; |
| } |
| |
| /* Ensure that FORMAT does not start with a decimal number followed by |
| a $; give a diagnostic and return true if it does, false otherwise. */ |
| |
| static bool |
| avoid_dollar_number (const char *format) |
| { |
| if (!ISDIGIT (*format)) |
| return false; |
| while (ISDIGIT (*format)) |
| format++; |
| if (*format == '$') |
| { |
| warning (OPT_Wformat_, |
| "%<$%>operand number used after format without operand number"); |
| return true; |
| } |
| return false; |
| } |
| |
| |
| /* Finish the checking for a format string that used $ operand number formats |
| instead of non-$ formats. We check for unused operands before used ones |
| (a serious error, since the implementation of the format function |
| can't know what types to pass to va_arg to find the later arguments). |
| and for unused operands at the end of the format (if we know how many |
| arguments the format had, so not for vprintf). If there were operand |
| numbers out of range on a non-vprintf-style format, we won't have reached |
| here. If POINTER_GAP_OK, unused arguments are OK if all arguments are |
| pointers. */ |
| |
| static void |
| finish_dollar_format_checking (format_check_results *res, int pointer_gap_ok) |
| { |
| int i; |
| bool found_pointer_gap = false; |
| for (i = 0; i < dollar_max_arg_used; i++) |
| { |
| if (!dollar_arguments_used[i]) |
| { |
| if (pointer_gap_ok && (dollar_first_arg_num == 0 |
| || dollar_arguments_pointer_p[i])) |
| found_pointer_gap = true; |
| else |
| warning_at (res->format_string_loc, OPT_Wformat_, |
| "format argument %d unused before used argument %d " |
| "in %<$%>-style format", |
| i + 1, dollar_max_arg_used); |
| } |
| } |
| if (found_pointer_gap |
| || (dollar_first_arg_num |
| && dollar_max_arg_used < dollar_arguments_count)) |
| { |
| res->number_other--; |
| res->number_dollar_extra_args++; |
| } |
| } |
| |
| |
| /* Retrieve the specification for a format flag. SPEC contains the |
| specifications for format flags for the applicable kind of format. |
| FLAG is the flag in question. If PREDICATES is NULL, the basic |
| spec for that flag must be retrieved and must exist. If |
| PREDICATES is not NULL, it is a string listing possible predicates |
| for the spec entry; if an entry predicated on any of these is |
| found, it is returned, otherwise NULL is returned. */ |
| |
| static const format_flag_spec * |
| get_flag_spec (const format_flag_spec *spec, int flag, const char *predicates) |
| { |
| int i; |
| for (i = 0; spec[i].flag_char != 0; i++) |
| { |
| if (spec[i].flag_char != flag) |
| continue; |
| if (predicates != NULL) |
| { |
| if (spec[i].predicate != 0 |
| && strchr (predicates, spec[i].predicate) != 0) |
| return &spec[i]; |
| } |
| else if (spec[i].predicate == 0) |
| return &spec[i]; |
| } |
| gcc_assert (predicates); |
| return NULL; |
| } |
| |
| |
| /* Check the argument list of a call to printf, scanf, etc. |
| INFO points to the function_format_info structure. |
| PARAMS is the list of argument values. */ |
| |
| static void |
| check_format_info (function_format_info *info, tree params, |
| vec<location_t> *arglocs) |
| { |
| format_check_context format_ctx; |
| unsigned HOST_WIDE_INT arg_num; |
| tree format_tree; |
| format_check_results res; |
| /* Skip to format argument. If the argument isn't available, there's |
| no work for us to do; prototype checking will catch the problem. */ |
| for (arg_num = 1; ; ++arg_num) |
| { |
| if (params == 0) |
| return; |
| if (arg_num == info->format_num) |
| break; |
| params = TREE_CHAIN (params); |
| } |
| format_tree = TREE_VALUE (params); |
| params = TREE_CHAIN (params); |
| if (format_tree == 0) |
| return; |
| |
| res.number_non_literal = 0; |
| res.number_extra_args = 0; |
| res.extra_arg_loc = UNKNOWN_LOCATION; |
| res.number_dollar_extra_args = 0; |
| res.number_wide = 0; |
| res.number_non_char = 0; |
| res.number_empty = 0; |
| res.number_unterminated = 0; |
| res.number_other = 0; |
| res.format_string_loc = input_location; |
| |
| format_ctx.res = &res; |
| format_ctx.info = info; |
| format_ctx.params = params; |
| format_ctx.arglocs = arglocs; |
| |
| check_function_arguments_recurse (check_format_arg, &format_ctx, |
| format_tree, arg_num); |
| |
| location_t loc = format_ctx.res->format_string_loc; |
| |
| if (res.number_non_literal > 0) |
| { |
| /* Functions taking a va_list normally pass a non-literal format |
| string. These functions typically are declared with |
| first_arg_num == 0, so avoid warning in those cases. */ |
| if (!(format_types[info->format_type].flags & (int) FMT_FLAG_ARG_CONVERT)) |
| { |
| /* For strftime-like formats, warn for not checking the format |
| string; but there are no arguments to check. */ |
| warning_at (loc, OPT_Wformat_nonliteral, |
| "format not a string literal, format string not checked"); |
| } |
| else if (info->first_arg_num != 0) |
| { |
| /* If there are no arguments for the format at all, we may have |
| printf (foo) which is likely to be a security hole. */ |
| while (arg_num + 1 < info->first_arg_num) |
| { |
| if (params == 0) |
| break; |
| params = TREE_CHAIN (params); |
| ++arg_num; |
| } |
| if (params == 0 && warn_format_security) |
| warning_at (loc, OPT_Wformat_security, |
| "format not a string literal and no format arguments"); |
| else if (params == 0 && warn_format_nonliteral) |
| warning_at (loc, OPT_Wformat_nonliteral, |
| "format not a string literal and no format arguments"); |
| else |
| warning_at (loc, OPT_Wformat_nonliteral, |
| "format not a string literal, argument types not checked"); |
| } |
| } |
| |
| /* If there were extra arguments to the format, normally warn. However, |
| the standard does say extra arguments are ignored, so in the specific |
| case where we have multiple leaves (conditional expressions or |
| ngettext) allow extra arguments if at least one leaf didn't have extra |
| arguments, but was otherwise OK (either non-literal or checked OK). |
| If the format is an empty string, this should be counted similarly to the |
| case of extra format arguments. */ |
| if (res.number_extra_args > 0 && res.number_non_literal == 0 |
| && res.number_other == 0) |
| { |
| if (res.extra_arg_loc == UNKNOWN_LOCATION) |
| res.extra_arg_loc = loc; |
| warning_at (res.extra_arg_loc, OPT_Wformat_extra_args, |
| "too many arguments for format"); |
| } |
| if (res.number_dollar_extra_args > 0 && res.number_non_literal == 0 |
| && res.number_other == 0) |
| warning_at (loc, OPT_Wformat_extra_args, |
| "unused arguments in %<$%>-style format"); |
| if (res.number_empty > 0 && res.number_non_literal == 0 |
| && res.number_other == 0) |
| warning_at (loc, OPT_Wformat_zero_length, "zero-length %s format string", |
| format_types[info->format_type].name); |
| |
| if (res.number_wide > 0) |
| warning_at (loc, OPT_Wformat_, "format is a wide character string"); |
| |
| if (res.number_non_char > 0) |
| warning_at (loc, OPT_Wformat_, |
| "format string is not an array of type %qs", "char"); |
| |
| if (res.number_unterminated > 0) |
| warning_at (loc, OPT_Wformat_, "unterminated format string"); |
| } |
| |
| /* Callback from check_function_arguments_recurse to check a |
| format string. FORMAT_TREE is the format parameter. ARG_NUM |
| is the number of the format argument. CTX points to a |
| format_check_context. */ |
| |
| static void |
| check_format_arg (void *ctx, tree format_tree, |
| unsigned HOST_WIDE_INT arg_num) |
| { |
| format_check_context *format_ctx = (format_check_context *) ctx; |
| format_check_results *res = format_ctx->res; |
| function_format_info *info = format_ctx->info; |
| tree params = format_ctx->params; |
| vec<location_t> *arglocs = format_ctx->arglocs; |
| |
| int format_length; |
| HOST_WIDE_INT offset; |
| const char *format_chars; |
| tree array_size = 0; |
| tree array_init; |
| |
| location_t fmt_param_loc = EXPR_LOC_OR_LOC (format_tree, input_location); |
| |
| /* Pull out a constant value if the front end didn't, and handle location |
| wrappers. */ |
| format_tree = fold_for_warn (format_tree); |
| STRIP_NOPS (format_tree); |
| |
| if (integer_zerop (format_tree)) |
| { |
| /* Skip to first argument to check, so we can see if this format |
| has any arguments (it shouldn't). */ |
| while (arg_num + 1 < info->first_arg_num) |
| { |
| if (params == 0) |
| return; |
| params = TREE_CHAIN (params); |
| ++arg_num; |
| } |
| |
| if (params == 0) |
| res->number_other++; |
| else |
| { |
| if (res->number_extra_args == 0) |
| res->extra_arg_loc = EXPR_LOC_OR_LOC (TREE_VALUE (params), |
| input_location); |
| res->number_extra_args++; |
| } |
| return; |
| } |
| |
| offset = 0; |
| if (TREE_CODE (format_tree) == POINTER_PLUS_EXPR) |
| { |
| tree arg0, arg1; |
| |
| arg0 = TREE_OPERAND (format_tree, 0); |
| arg1 = TREE_OPERAND (format_tree, 1); |
| STRIP_NOPS (arg0); |
| STRIP_NOPS (arg1); |
| if (TREE_CODE (arg1) == INTEGER_CST) |
| format_tree = arg0; |
| else |
| { |
| res->number_non_literal++; |
| return; |
| } |
| /* POINTER_PLUS_EXPR offsets are to be interpreted signed. */ |
| if (!cst_and_fits_in_hwi (arg1)) |
| { |
| res->number_non_literal++; |
| return; |
| } |
| offset = int_cst_value (arg1); |
| } |
| if (TREE_CODE (format_tree) != ADDR_EXPR) |
| { |
| res->number_non_literal++; |
| return; |
| } |
| res->format_string_loc = EXPR_LOC_OR_LOC (format_tree, input_location); |
| format_tree = TREE_OPERAND (format_tree, 0); |
| if (format_types[info->format_type].flags |
| & (int) FMT_FLAG_PARSE_ARG_CONVERT_EXTERNAL) |
| { |
| bool objc_str = (info->format_type == gcc_objc_string_format_type); |
| /* We cannot examine this string here - but we can check that it is |
| a valid type. */ |
| if (TREE_CODE (format_tree) != CONST_DECL |
| || !((objc_str && objc_string_ref_type_p (TREE_TYPE (format_tree))) |
| || (*targetcm.string_object_ref_type_p) |
| ((const_tree) TREE_TYPE (format_tree)))) |
| { |
| res->number_non_literal++; |
| return; |
| } |
| /* Skip to first argument to check. */ |
| while (arg_num + 1 < info->first_arg_num) |
| { |
| if (params == 0) |
| return; |
| params = TREE_CHAIN (params); |
| ++arg_num; |
| } |
| /* So, we have a valid literal string object and one or more params. |
| We need to use an external helper to parse the string into format |
| info. For Objective-C variants we provide the resource within the |
| objc tree, for target variants, via a hook. */ |
| if (objc_str) |
| objc_check_format_arg (format_tree, params); |
| else if (targetcm.check_string_object_format_arg) |
| (*targetcm.check_string_object_format_arg) (format_tree, params); |
| /* Else we can't handle it and retire quietly. */ |
| return; |
| } |
| if (TREE_CODE (format_tree) == ARRAY_REF |
| && tree_fits_shwi_p (TREE_OPERAND (format_tree, 1)) |
| && (offset += tree_to_shwi (TREE_OPERAND (format_tree, 1))) >= 0) |
| format_tree = TREE_OPERAND (format_tree, 0); |
| if (offset < 0) |
| { |
| res->number_non_literal++; |
| return; |
| } |
| if (VAR_P (format_tree) |
| && TREE_CODE (TREE_TYPE (format_tree)) == ARRAY_TYPE |
| && (array_init = decl_constant_value (format_tree)) != format_tree |
| && TREE_CODE (array_init) == STRING_CST) |
| { |
| /* Extract the string constant initializer. Note that this may include |
| a trailing NUL character that is not in the array (e.g. |
| const char a[3] = "foo";). */ |
| array_size = DECL_SIZE_UNIT (format_tree); |
| format_tree = array_init; |
| } |
| if (TREE_CODE (format_tree) != STRING_CST) |
| { |
| res->number_non_literal++; |
| return; |
| } |
| tree underlying_type |
| = TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (format_tree))); |
| if (underlying_type != char_type_node) |
| { |
| if (underlying_type == char16_type_node |
| || underlying_type == char32_type_node |
| || underlying_type == wchar_type_node) |
| res->number_wide++; |
| else |
| res->number_non_char++; |
| return; |
| } |
| format_chars = TREE_STRING_POINTER (format_tree); |
| format_length = TREE_STRING_LENGTH (format_tree); |
| if (array_size != 0) |
| { |
| /* Variable length arrays can't be initialized. */ |
| gcc_assert (TREE_CODE (array_size) == INTEGER_CST); |
| |
| if (tree_fits_shwi_p (array_size)) |
| { |
| HOST_WIDE_INT array_size_value = tree_to_shwi (array_size); |
| if (array_size_value > 0 |
| && array_size_value == (int) array_size_value |
| && format_length > array_size_value) |
| format_length = array_size_value; |
| } |
| } |
| if (offset) |
| { |
| if (offset >= format_length) |
| { |
| res->number_non_literal++; |
| return; |
| } |
| format_chars += offset; |
| format_length -= offset; |
| } |
| if (format_length < 1 || format_chars[--format_length] != 0) |
| { |
| res->number_unterminated++; |
| return; |
| } |
| if (format_length == 0) |
| { |
| res->number_empty++; |
| return; |
| } |
| |
| /* Skip to first argument to check. */ |
| while (arg_num + 1 < info->first_arg_num) |
| { |
| if (params == 0) |
| return; |
| params = TREE_CHAIN (params); |
| ++arg_num; |
| } |
| /* Provisionally increment res->number_other; check_format_info_main |
| will decrement it if it finds there are extra arguments, but this way |
| need not adjust it for every return. */ |
| res->number_other++; |
| object_allocator <format_wanted_type> fwt_pool ("format_wanted_type pool"); |
| check_format_info_main (res, info, format_chars, fmt_param_loc, format_tree, |
| format_length, params, arg_num, fwt_pool, arglocs); |
| } |
| |
| /* Support class for argument_parser and check_format_info_main. |
| Tracks any flag characters that have been applied to the |
| current argument. */ |
| |
| class flag_chars_t |
| { |
| public: |
| flag_chars_t (); |
| bool has_char_p (char ch) const; |
| void add_char (char ch); |
| void validate (const format_kind_info *fki, |
| const format_char_info *fci, |
| const format_flag_spec *flag_specs, |
| const char * const format_chars, |
| tree format_string_cst, |
| location_t format_string_loc, |
| const char * const orig_format_chars, |
| char format_char, |
| bool quoted); |
| int get_alloc_flag (const format_kind_info *fki); |
| int assignment_suppression_p (const format_kind_info *fki); |
| |
| private: |
| char m_flag_chars[256]; |
| }; |
| |
| /* Support struct for argument_parser and check_format_info_main. |
| Encapsulates any length modifier applied to the current argument. */ |
| |
| class length_modifier |
| { |
| public: |
| length_modifier () |
| : chars (NULL), val (FMT_LEN_none), std (STD_C89), |
| scalar_identity_flag (0) |
| { |
| } |
| |
| length_modifier (const char *chars_, |
| enum format_lengths val_, |
| enum format_std_version std_, |
| int scalar_identity_flag_) |
| : chars (chars_), val (val_), std (std_), |
| scalar_identity_flag (scalar_identity_flag_) |
| { |
| } |
| |
| const char *chars; |
| enum format_lengths val; |
| enum format_std_version std; |
| int scalar_identity_flag; |
| }; |
| |
| /* Parsing one argument within a format string. */ |
| |
| class argument_parser |
| { |
| public: |
| argument_parser (function_format_info *info, const char *&format_chars, |
| tree format_string_cst, |
| const char * const orig_format_chars, |
| location_t format_string_loc, flag_chars_t &flag_chars, |
| int &has_operand_number, tree first_fillin_param, |
| object_allocator <format_wanted_type> &fwt_pool_, |
| vec<location_t> *arglocs); |
| |
| bool read_any_dollar (); |
| |
| bool read_format_flags (); |
| |
| bool |
| read_any_format_width (tree ¶ms, |
| unsigned HOST_WIDE_INT &arg_num); |
| |
| void |
| read_any_format_left_precision (); |
| |
| bool |
| read_any_format_precision (tree ¶ms, |
| unsigned HOST_WIDE_INT &arg_num); |
| |
| void handle_alloc_chars (); |
| |
| length_modifier read_any_length_modifier (); |
| |
| void read_any_other_modifier (); |
| |
| const format_char_info *find_format_char_info (char format_char); |
| |
| void |
| validate_flag_pairs (const format_char_info *fci, |
| char format_char); |
| |
| void |
| give_y2k_warnings (const format_char_info *fci, |
| char format_char); |
| |
| void parse_any_scan_set (const format_char_info *fci); |
| |
| bool handle_conversions (const format_char_info *fci, |
| const length_modifier &len_modifier, |
| tree &wanted_type, |
| const char *&wanted_type_name, |
| unsigned HOST_WIDE_INT &arg_num, |
| tree ¶ms, |
| char format_char); |
| |
| bool |
| check_argument_type (const format_char_info *fci, |
| const length_modifier &len_modifier, |
| tree &wanted_type, |
| const char *&wanted_type_name, |
| const bool suppressed, |
| unsigned HOST_WIDE_INT &arg_num, |
| tree ¶ms, |
| const int alloc_flag, |
| const char * const format_start, |
| const char * const type_start, |
| location_t fmt_param_loc, |
| char conversion_char); |
| |
| private: |
| const function_format_info *const info; |
| const format_kind_info * const fki; |
| const format_flag_spec * const flag_specs; |
| const char *start_of_this_format; |
| const char *&format_chars; |
| const tree format_string_cst; |
| const char * const orig_format_chars; |
| const location_t format_string_loc; |
| object_allocator <format_wanted_type> &fwt_pool; |
| flag_chars_t &flag_chars; |
| int main_arg_num; |
| tree main_arg_params; |
| int &has_operand_number; |
| const tree first_fillin_param; |
| format_wanted_type width_wanted_type; |
| format_wanted_type precision_wanted_type; |
| public: |
| format_wanted_type main_wanted_type; |
| private: |
| format_wanted_type *first_wanted_type; |
| format_wanted_type *last_wanted_type; |
| vec<location_t> *arglocs; |
| }; |
| |
| /* flag_chars_t's constructor. */ |
| |
| flag_chars_t::flag_chars_t () |
| { |
| m_flag_chars[0] = 0; |
| } |
| |
| /* Has CH been seen as a flag within the current argument? */ |
| |
| bool |
| flag_chars_t::has_char_p (char ch) const |
| { |
| return strchr (m_flag_chars, ch) != 0; |
| } |
| |
| /* Add CH to the flags seen within the current argument. */ |
| |
| void |
| flag_chars_t::add_char (char ch) |
| { |
| int i = strlen (m_flag_chars); |
| m_flag_chars[i++] = ch; |
| m_flag_chars[i] = 0; |
| } |
| |
| /* Validate the individual flags used, removing any that are invalid. */ |
| |
| void |
| flag_chars_t::validate (const format_kind_info *fki, |
| const format_char_info *fci, |
| const format_flag_spec *flag_specs, |
| const char * const format_chars, |
| tree format_string_cst, |
| location_t format_string_loc, |
| const char * const orig_format_chars, |
| char format_char, |
| bool quoted) |
| { |
| int i; |
| int d = 0; |
| bool quotflag = false; |
| |
| for (i = 0; m_flag_chars[i] != 0; i++) |
| { |
| const format_flag_spec *s = get_flag_spec (flag_specs, |
| m_flag_chars[i], NULL); |
| m_flag_chars[i - d] = m_flag_chars[i]; |
| if (m_flag_chars[i] == fki->length_code_char) |
| continue; |
| |
| /* Remember if a quoting flag is seen. */ |
| quotflag |= s->quoting; |
| |
| if (strchr (fci->flag_chars, m_flag_chars[i]) == 0) |
| { |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "%s used with %<%%%c%> %s format", |
| _(s->name), format_char, fki->name); |
| d++; |
| continue; |
| } |
| if (pedantic) |
| { |
| const format_flag_spec *t; |
| if (ADJ_STD (s->std) > C_STD_VER) |
| warning_at (format_string_loc, OPT_Wformat_, |
| "%s does not support %s", |
| C_STD_NAME (s->std), _(s->long_name)); |
| t = get_flag_spec (flag_specs, m_flag_chars[i], fci->flags2); |
| if (t != NULL && ADJ_STD (t->std) > ADJ_STD (s->std)) |
| { |
| const char *long_name = (t->long_name != NULL |
| ? t->long_name |
| : s->long_name); |
| if (ADJ_STD (t->std) > C_STD_VER) |
| warning_at (format_string_loc, OPT_Wformat_, |
| "%s does not support %s with" |
| " the %<%%%c%> %s format", |
| C_STD_NAME (t->std), _(long_name), |
| format_char, fki->name); |
| } |
| } |
| |
| /* Detect quoting directives used within a quoted sequence, such |
| as GCC's "%<...%qE". */ |
| if (quoted && s->quoting) |
| { |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars - 1, |
| OPT_Wformat_, |
| "%s used within a quoted sequence", |
| _(s->name)); |
| } |
| } |
| m_flag_chars[i - d] = 0; |
| |
| if (!quoted |
| && !quotflag |
| && strchr (fci->flags2, '\'')) |
| { |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "%qc conversion used unquoted", |
| format_char); |
| } |
| } |
| |
| /* Determine if an assignment-allocation has been set, requiring |
| an extra char ** for writing back a dynamically-allocated char *. |
| This is for handling the optional 'm' character in scanf. */ |
| |
| int |
| flag_chars_t::get_alloc_flag (const format_kind_info *fki) |
| { |
| if ((fki->flags & (int) FMT_FLAG_SCANF_A_KLUDGE) |
| && has_char_p ('a')) |
| return 1; |
| if (fki->alloc_char && has_char_p (fki->alloc_char)) |
| return 1; |
| return 0; |
| } |
| |
| /* Determine if an assignment-suppression character was seen. |
| ('*' in scanf, for discarding the converted input). */ |
| |
| int |
| flag_chars_t::assignment_suppression_p (const format_kind_info *fki) |
| { |
| if (fki->suppression_char |
| && has_char_p (fki->suppression_char)) |
| return 1; |
| return 0; |
| } |
| |
| /* Constructor for argument_parser. Initialize for parsing one |
| argument within a format string. */ |
| |
| argument_parser:: |
| argument_parser (function_format_info *info_, const char *&format_chars_, |
| tree format_string_cst_, |
| const char * const orig_format_chars_, |
| location_t format_string_loc_, |
| flag_chars_t &flag_chars_, |
| int &has_operand_number_, |
| tree first_fillin_param_, |
| object_allocator <format_wanted_type> &fwt_pool_, |
| vec<location_t> *arglocs_) |
| : info (info_), |
| fki (&format_types[info->format_type]), |
| flag_specs (fki->flag_specs), |
| start_of_this_format (format_chars_), |
| format_chars (format_chars_), |
| format_string_cst (format_string_cst_), |
| orig_format_chars (orig_format_chars_), |
| format_string_loc (format_string_loc_), |
| fwt_pool (fwt_pool_), |
| flag_chars (flag_chars_), |
| main_arg_num (0), |
| main_arg_params (NULL), |
| has_operand_number (has_operand_number_), |
| first_fillin_param (first_fillin_param_), |
| first_wanted_type (NULL), |
| last_wanted_type (NULL), |
| arglocs (arglocs_) |
| { |
| } |
| |
| /* Handle dollars at the start of format arguments, setting up main_arg_params |
| and main_arg_num. |
| |
| Return true if format parsing is to continue, false otherwise. */ |
| |
| bool |
| argument_parser::read_any_dollar () |
| { |
| if ((fki->flags & (int) FMT_FLAG_USE_DOLLAR) && has_operand_number != 0) |
| { |
| /* Possibly read a $ operand number at the start of the format. |
| If one was previously used, one is required here. If one |
| is not used here, we can't immediately conclude this is a |
| format without them, since it could be printf %m or scanf %*. */ |
| int opnum; |
| opnum = maybe_read_dollar_number (&format_chars, 0, |
| first_fillin_param, |
| &main_arg_params, fki); |
| if (opnum == -1) |
| return false; |
| else if (opnum > 0) |
| { |
| has_operand_number = 1; |
| main_arg_num = opnum + info->first_arg_num - 1; |
| } |
| } |
| else if (fki->flags & FMT_FLAG_USE_DOLLAR) |
| { |
| if (avoid_dollar_number (format_chars)) |
| return false; |
| } |
| return true; |
| } |
| |
| /* Read any format flags, but do not yet validate them beyond removing |
| duplicates, since in general validation depends on the rest of |
| the format. |
| |
| Return true if format parsing is to continue, false otherwise. */ |
| |
| bool |
| argument_parser::read_format_flags () |
| { |
| while (*format_chars != 0 |
| && strchr (fki->flag_chars, *format_chars) != 0) |
| { |
| const format_flag_spec *s = get_flag_spec (flag_specs, |
| *format_chars, NULL); |
| if (flag_chars.has_char_p (*format_chars)) |
| { |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars + 1 - orig_format_chars, |
| OPT_Wformat_, |
| "repeated %s in format", _(s->name)); |
| } |
| else |
| flag_chars.add_char (*format_chars); |
| |
| if (s->skip_next_char) |
| { |
| ++format_chars; |
| if (*format_chars == 0) |
| { |
| warning_at (format_string_loc, OPT_Wformat_, |
| "missing fill character at end of strfmon format"); |
| return false; |
| } |
| } |
| ++format_chars; |
| } |
| |
| return true; |
| } |
| |
| /* Read any format width, possibly * or *m$. |
| |
| Return true if format parsing is to continue, false otherwise. */ |
| |
| bool |
| argument_parser:: |
| read_any_format_width (tree ¶ms, |
| unsigned HOST_WIDE_INT &arg_num) |
| { |
| if (!fki->width_char) |
| return true; |
| |
| if (fki->width_type != NULL && *format_chars == '*') |
| { |
| flag_chars.add_char (fki->width_char); |
| /* "...a field width...may be indicated by an asterisk. |
| In this case, an int argument supplies the field width..." */ |
| ++format_chars; |
| if (has_operand_number != 0) |
| { |
| int opnum; |
| opnum = maybe_read_dollar_number (&format_chars, |
| has_operand_number == 1, |
| first_fillin_param, |
| ¶ms, fki); |
| if (opnum == -1) |
| return false; |
| else if (opnum > 0) |
| { |
| has_operand_number = 1; |
| arg_num = opnum + info->first_arg_num - 1; |
| } |
| else |
| has_operand_number = 0; |
| } |
| else |
| { |
| if (avoid_dollar_number (format_chars)) |
| return false; |
| } |
| if (info->first_arg_num != 0) |
| { |
| tree cur_param; |
| if (params == 0) |
| cur_param = NULL; |
| else |
| { |
| cur_param = TREE_VALUE (params); |
| if (has_operand_number <= 0) |
| { |
| params = TREE_CHAIN (params); |
| ++arg_num; |
| } |
| } |
| width_wanted_type.wanted_type = *fki->width_type; |
| width_wanted_type.wanted_type_name = NULL; |
| width_wanted_type.pointer_count = 0; |
| width_wanted_type.char_lenient_flag = 0; |
| width_wanted_type.scalar_identity_flag = 0; |
| width_wanted_type.writing_in_flag = 0; |
| width_wanted_type.reading_from_flag = 0; |
| width_wanted_type.kind = CF_KIND_FIELD_WIDTH; |
| width_wanted_type.format_start = format_chars - 1; |
| width_wanted_type.format_length = 1; |
| width_wanted_type.param = cur_param; |
| width_wanted_type.arg_num = arg_num; |
| width_wanted_type.offset_loc = |
| format_chars - orig_format_chars; |
| width_wanted_type.next = NULL; |
| if (last_wanted_type != 0) |
| last_wanted_type->next = &width_wanted_type; |
| if (first_wanted_type == 0) |
| first_wanted_type = &width_wanted_type; |
| last_wanted_type = &width_wanted_type; |
| } |
| } |
| else |
| { |
| /* Possibly read a numeric width. If the width is zero, |
| we complain if appropriate. */ |
| int non_zero_width_char = FALSE; |
| int found_width = FALSE; |
| while (ISDIGIT (*format_chars)) |
| { |
| found_width = TRUE; |
| if (*format_chars != '0') |
| non_zero_width_char = TRUE; |
| ++format_chars; |
| } |
| if (found_width && !non_zero_width_char && |
| (fki->flags & (int) FMT_FLAG_ZERO_WIDTH_BAD)) |
| warning_at (format_string_loc, OPT_Wformat_, |
| "zero width in %s format", fki->name); |
| if (found_width) |
| flag_chars.add_char (fki->width_char); |
| } |
| |
| return true; |
| } |
| |
| /* Read any format left precision (must be a number, not *). */ |
| void |
| argument_parser::read_any_format_left_precision () |
| { |
| if (fki->left_precision_char == 0) |
| return; |
| if (*format_chars != '#') |
| return; |
| |
| ++format_chars; |
| flag_chars.add_char (fki->left_precision_char); |
| if (!ISDIGIT (*format_chars)) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "empty left precision in %s format", fki->name); |
| while (ISDIGIT (*format_chars)) |
| ++format_chars; |
| } |
| |
| /* Read any format precision, possibly * or *m$. |
| |
| Return true if format parsing is to continue, false otherwise. */ |
| |
| bool |
| argument_parser:: |
| read_any_format_precision (tree ¶ms, |
| unsigned HOST_WIDE_INT &arg_num) |
| { |
| if (fki->precision_char == 0) |
| return true; |
| if (*format_chars != '.') |
| return true; |
| |
| ++format_chars; |
| flag_chars.add_char (fki->precision_char); |
| if (fki->precision_type != NULL && *format_chars == '*') |
| { |
| /* "...a...precision...may be indicated by an asterisk. |
| In this case, an int argument supplies the...precision." */ |
| ++format_chars; |
| if (has_operand_number != 0) |
| { |
| int opnum; |
| opnum = maybe_read_dollar_number (&format_chars, |
| has_operand_number == 1, |
| first_fillin_param, |
| ¶ms, fki); |
| if (opnum == -1) |
| return false; |
| else if (opnum > 0) |
| { |
| has_operand_number = 1; |
| arg_num = opnum + info->first_arg_num - 1; |
| } |
| else |
| has_operand_number = 0; |
| } |
| else |
| { |
| if (avoid_dollar_number (format_chars)) |
| return false; |
| } |
| if (info->first_arg_num != 0) |
| { |
| tree cur_param; |
| if (params == 0) |
| cur_param = NULL; |
| else |
| { |
| cur_param = TREE_VALUE (params); |
| if (has_operand_number <= 0) |
| { |
| params = TREE_CHAIN (params); |
| ++arg_num; |
| } |
| } |
| precision_wanted_type.wanted_type = *fki->precision_type; |
| precision_wanted_type.wanted_type_name = NULL; |
| precision_wanted_type.pointer_count = 0; |
| precision_wanted_type.char_lenient_flag = 0; |
| precision_wanted_type.scalar_identity_flag = 0; |
| precision_wanted_type.writing_in_flag = 0; |
| precision_wanted_type.reading_from_flag = 0; |
| precision_wanted_type.kind = CF_KIND_FIELD_PRECISION; |
| precision_wanted_type.param = cur_param; |
| precision_wanted_type.format_start = format_chars - 2; |
| precision_wanted_type.format_length = 2; |
| precision_wanted_type.arg_num = arg_num; |
| precision_wanted_type.offset_loc = |
| format_chars - orig_format_chars; |
| precision_wanted_type.next = NULL; |
| if (last_wanted_type != 0) |
| last_wanted_type->next = &precision_wanted_type; |
| if (first_wanted_type == 0) |
| first_wanted_type = &precision_wanted_type; |
| last_wanted_type = &precision_wanted_type; |
| } |
| } |
| else |
| { |
| if (!(fki->flags & (int) FMT_FLAG_EMPTY_PREC_OK) |
| && !ISDIGIT (*format_chars)) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "empty precision in %s format", fki->name); |
| while (ISDIGIT (*format_chars)) |
| ++format_chars; |
| } |
| |
| return true; |
| } |
| |
| /* Parse any assignment-allocation flags, which request an extra |
| char ** for writing back a dynamically-allocated char *. |
| This is for handling the optional 'm' character in scanf, |
| and, before C99, 'a' (for compatibility with a non-standard |
| GNU libc extension). */ |
| |
| void |
| argument_parser::handle_alloc_chars () |
| { |
| if (fki->alloc_char && fki->alloc_char == *format_chars) |
| { |
| flag_chars.add_char (fki->alloc_char); |
| format_chars++; |
| } |
| |
| /* Handle the scanf allocation kludge. */ |
| if (fki->flags & (int) FMT_FLAG_SCANF_A_KLUDGE) |
| { |
| if (*format_chars == 'a' && !flag_isoc99) |
| { |
| if (format_chars[1] == 's' || format_chars[1] == 'S' |
| || format_chars[1] == '[') |
| { |
| /* 'a' is used as a flag. */ |
| flag_chars.add_char ('a'); |
| format_chars++; |
| } |
| } |
| } |
| } |
| |
| /* Look for length modifiers within the current format argument, |
| returning a length_modifier instance describing it (or the |
| default if one is not found). |
| |
| Issue warnings about non-standard modifiers. */ |
| |
| length_modifier |
| argument_parser::read_any_length_modifier () |
| { |
| length_modifier result; |
| |
| const format_length_info *fli = fki->length_char_specs; |
| if (!fli) |
| return result; |
| |
| while (fli->name != 0 |
| && strncmp (fli->name, format_chars, strlen (fli->name))) |
| fli++; |
| if (fli->name != 0) |
| { |
| format_chars += strlen (fli->name); |
| if (fli->double_name != 0 && fli->name[0] == *format_chars) |
| { |
| format_chars++; |
| result = length_modifier (fli->double_name, fli->double_index, |
| fli->double_std, 0); |
| } |
| else |
| { |
| result = length_modifier (fli->name, fli->index, fli->std, |
| fli->scalar_identity_flag); |
| } |
| flag_chars.add_char (fki->length_code_char); |
| } |
| if (pedantic) |
| { |
| /* Warn if the length modifier is non-standard. */ |
| if (ADJ_STD (result.std) > C_STD_VER) |
| warning_at (format_string_loc, OPT_Wformat_, |
| "%s does not support the %qs %s length modifier", |
| C_STD_NAME (result.std), result.chars, |
| fki->name); |
| } |
| |
| return result; |
| } |
| |
| /* Read any other modifier (strftime E/O). */ |
| |
| void |
| argument_parser::read_any_other_modifier () |
| { |
| if (fki->modifier_chars == NULL) |
| return; |
| |
| while (*format_chars != 0 |
| && strchr (fki->modifier_chars, *format_chars) != 0) |
| { |
| if (flag_chars.has_char_p (*format_chars)) |
| { |
| const format_flag_spec *s = get_flag_spec (flag_specs, |
| *format_chars, NULL); |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "repeated %s in format", _(s->name)); |
| } |
| else |
| flag_chars.add_char (*format_chars); |
| ++format_chars; |
| } |
| } |
| |
| /* Return the format_char_info corresponding to FORMAT_CHAR, |
| potentially issuing a warning if the format char is |
| not supported in the C standard version we are checking |
| against. |
| |
| Issue a warning and return NULL if it is not found. |
| |
| Issue warnings about non-standard modifiers. */ |
| |
| const format_char_info * |
| argument_parser::find_format_char_info (char format_char) |
| { |
| const format_char_info *fci = fki->conversion_specs; |
| |
| while (fci->format_chars != 0 |
| && strchr (fci->format_chars, format_char) == 0) |
| ++fci; |
| if (fci->format_chars == 0) |
| { |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "unknown conversion type character" |
| " %qc in format", |
| format_char); |
| return NULL; |
| } |
| |
| if (pedantic) |
| { |
| if (ADJ_STD (fci->std) > C_STD_VER) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "%s does not support the %<%%%c%> %s format", |
| C_STD_NAME (fci->std), format_char, fki->name); |
| } |
| |
| return fci; |
| } |
| |
| /* Validate the pairs of flags used. |
| Issue warnings about incompatible combinations of flags. */ |
| |
| void |
| argument_parser::validate_flag_pairs (const format_char_info *fci, |
| char format_char) |
| { |
| const format_flag_pair * const bad_flag_pairs = fki->bad_flag_pairs; |
| |
| for (int i = 0; bad_flag_pairs[i].flag_char1 != 0; i++) |
| { |
| const format_flag_spec *s, *t; |
| if (!flag_chars.has_char_p (bad_flag_pairs[i].flag_char1)) |
| continue; |
| if (!flag_chars.has_char_p (bad_flag_pairs[i].flag_char2)) |
| continue; |
| if (bad_flag_pairs[i].predicate != 0 |
| && strchr (fci->flags2, bad_flag_pairs[i].predicate) == 0) |
| continue; |
| s = get_flag_spec (flag_specs, bad_flag_pairs[i].flag_char1, NULL); |
| t = get_flag_spec (flag_specs, bad_flag_pairs[i].flag_char2, NULL); |
| if (bad_flag_pairs[i].ignored) |
| { |
| if (bad_flag_pairs[i].predicate != 0) |
| warning_at (format_string_loc, OPT_Wformat_, |
| "%s ignored with %s and %<%%%c%> %s format", |
| _(s->name), _(t->name), format_char, |
| fki->name); |
| else |
| warning_at (format_string_loc, OPT_Wformat_, |
| "%s ignored with %s in %s format", |
| _(s->name), _(t->name), fki->name); |
| } |
| else |
| { |
| if (bad_flag_pairs[i].predicate != 0) |
| warning_at (format_string_loc, OPT_Wformat_, |
| "use of %s and %s together with %<%%%c%> %s format", |
| _(s->name), _(t->name), format_char, |
| fki->name); |
| else |
| warning_at (format_string_loc, OPT_Wformat_, |
| "use of %s and %s together in %s format", |
| _(s->name), _(t->name), fki->name); |
| } |
| } |
| } |
| |
| /* Give Y2K warnings. */ |
| |
| void |
| argument_parser::give_y2k_warnings (const format_char_info *fci, |
| char format_char) |
| { |
| if (!warn_format_y2k) |
| return; |
| |
| int y2k_level = 0; |
| if (strchr (fci->flags2, '4') != 0) |
| if (flag_chars.has_char_p ('E')) |
| y2k_level = 3; |
| else |
| y2k_level = 2; |
| else if (strchr (fci->flags2, '3') != 0) |
| y2k_level = 3; |
| else if (strchr (fci->flags2, '2') != 0) |
| y2k_level = 2; |
| if (y2k_level == 3) |
| warning_at (format_string_loc, OPT_Wformat_y2k, |
| "%<%%%c%> yields only last 2 digits of " |
| "year in some locales", format_char); |
| else if (y2k_level == 2) |
| warning_at (format_string_loc, OPT_Wformat_y2k, |
| "%<%%%c%> yields only last 2 digits of year", |
| format_char); |
| } |
| |
| /* Parse any "scan sets" enclosed in square brackets, e.g. |
| for scanf-style calls. */ |
| |
| void |
| argument_parser::parse_any_scan_set (const format_char_info *fci) |
| { |
| if (strchr (fci->flags2, '[') == NULL) |
| return; |
| |
| /* Skip over scan set, in case it happens to have '%' in it. */ |
| if (*format_chars == '^') |
| ++format_chars; |
| /* Find closing bracket; if one is hit immediately, then |
| it's part of the scan set rather than a terminator. */ |
| if (*format_chars == ']') |
| ++format_chars; |
| while (*format_chars && *format_chars != ']') |
| ++format_chars; |
| if (*format_chars != ']') |
| /* The end of the format string was reached. */ |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "no closing %<]%> for %<%%[%> format"); |
| } |
| |
| /* Return true if this argument is to be continued to be parsed, |
| false to skip to next argument. */ |
| |
| bool |
| argument_parser::handle_conversions (const format_char_info *fci, |
| const length_modifier &len_modifier, |
| tree &wanted_type, |
| const char *&wanted_type_name, |
| unsigned HOST_WIDE_INT &arg_num, |
| tree ¶ms, |
| char format_char) |
| { |
| enum format_std_version wanted_type_std; |
| |
| if (!(fki->flags & (int) FMT_FLAG_ARG_CONVERT)) |
| return true; |
| |
| wanted_type = (fci->types[len_modifier.val].type |
| ? *fci->types[len_modifier.val].type : 0); |
| wanted_type_name = fci->types[len_modifier.val].name; |
| wanted_type_std = fci->types[len_modifier.val].std; |
| if (wanted_type == 0) |
| { |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "use of %qs length modifier with %qc type" |
| " character has either no effect" |
| " or undefined behavior", |
| len_modifier.chars, format_char); |
| /* Heuristic: skip one argument when an invalid length/type |
| combination is encountered. */ |
| arg_num++; |
| if (params != 0) |
| params = TREE_CHAIN (params); |
| return false; |
| } |
| else if (pedantic |
| /* Warn if non-standard, provided it is more non-standard |
| than the length and type characters that may already |
| have been warned for. */ |
| && ADJ_STD (wanted_type_std) > ADJ_STD (len_modifier.std) |
| && ADJ_STD (wanted_type_std) > ADJ_STD (fci->std)) |
| { |
| if (ADJ_STD (wanted_type_std) > C_STD_VER) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "%s does not support the %<%%%s%c%> %s format", |
| C_STD_NAME (wanted_type_std), |
| len_modifier.chars, |
| format_char, fki->name); |
| } |
| |
| return true; |
| } |
| |
| /* Check type of argument against desired type. |
| |
| Return true if format parsing is to continue, false otherwise. */ |
| |
| bool |
| argument_parser:: |
| check_argument_type (const format_char_info *fci, |
| const length_modifier &len_modifier, |
| tree &wanted_type, |
| const char *&wanted_type_name, |
| const bool suppressed, |
| unsigned HOST_WIDE_INT &arg_num, |
| tree ¶ms, |
| const int alloc_flag, |
| const char * const format_start, |
| const char * const type_start, |
| location_t fmt_param_loc, |
| char conversion_char) |
| { |
| if (info->first_arg_num == 0) |
| return true; |
| |
| if ((fci->pointer_count == 0 && wanted_type == void_type_node) |
| || suppressed) |
| { |
| if (main_arg_num != 0) |
| { |
| if (suppressed) |
| warning_at (format_string_loc, OPT_Wformat_, |
| "operand number specified with " |
| "suppressed assignment"); |
| else |
| warning_at (format_string_loc, OPT_Wformat_, |
| "operand number specified for format " |
| "taking no argument"); |
| } |
| } |
| else |
| { |
| format_wanted_type *wanted_type_ptr; |
| |
| if (main_arg_num != 0) |
| { |
| arg_num = main_arg_num; |
| params = main_arg_params; |
| } |
| else |
| { |
| ++arg_num; |
| if (has_operand_number > 0) |
| { |
| warning_at (format_string_loc, OPT_Wformat_, |
| "missing $ operand number in format"); |
| return false; |
| } |
| else |
| has_operand_number = 0; |
| } |
| |
| wanted_type_ptr = &main_wanted_type; |
| while (fci) |
| { |
| tree cur_param; |
| if (params == 0) |
| cur_param = NULL; |
| else |
| { |
| cur_param = TREE_VALUE (params); |
| params = TREE_CHAIN (params); |
| } |
| |
| wanted_type_ptr->wanted_type = wanted_type; |
| wanted_type_ptr->wanted_type_name = wanted_type_name; |
| wanted_type_ptr->pointer_count = fci->pointer_count + alloc_flag; |
| wanted_type_ptr->char_lenient_flag = 0; |
| if (strchr (fci->flags2, 'c') != 0) |
| wanted_type_ptr->char_lenient_flag = 1; |
| wanted_type_ptr->scalar_identity_flag = 0; |
| if (len_modifier.scalar_identity_flag) |
| wanted_type_ptr->scalar_identity_flag = 1; |
| wanted_type_ptr->writing_in_flag = 0; |
| wanted_type_ptr->reading_from_flag = 0; |
| if (alloc_flag) |
| wanted_type_ptr->writing_in_flag = 1; |
| else |
| { |
| if (strchr (fci->flags2, 'W') != 0) |
| wanted_type_ptr->writing_in_flag = 1; |
| if (strchr (fci->flags2, 'R') != 0) |
| wanted_type_ptr->reading_from_flag = 1; |
| } |
| wanted_type_ptr->kind = CF_KIND_FORMAT; |
| wanted_type_ptr->param = cur_param; |
| wanted_type_ptr->arg_num = arg_num; |
| wanted_type_ptr->format_start = format_start; |
| wanted_type_ptr->format_length = format_chars - format_start; |
| wanted_type_ptr->offset_loc = format_chars - orig_format_chars; |
| wanted_type_ptr->next = NULL; |
| if (last_wanted_type != 0) |
| last_wanted_type->next = wanted_type_ptr; |
| if (first_wanted_type == 0) |
| first_wanted_type = wanted_type_ptr; |
| last_wanted_type = wanted_type_ptr; |
| |
| fci = fci->chain; |
| if (fci) |
| { |
| wanted_type_ptr = fwt_pool.allocate (); |
| arg_num++; |
| wanted_type = *fci->types[len_modifier.val].type; |
| wanted_type_name = fci->types[len_modifier.val].name; |
| } |
| } |
| } |
| |
| if (first_wanted_type != 0) |
| { |
| ptrdiff_t offset_to_format_start = (start_of_this_format - 1) - orig_format_chars; |
| ptrdiff_t offset_to_format_end = (format_chars - 1) - orig_format_chars; |
| /* By default, use the end of the range for the caret location. */ |
| substring_loc fmt_loc (fmt_param_loc, TREE_TYPE (format_string_cst), |
| offset_to_format_end, |
| offset_to_format_start, offset_to_format_end); |
| ptrdiff_t offset_to_type_start = type_start - orig_format_chars; |
| check_format_types (fmt_loc, first_wanted_type, fki, |
| offset_to_type_start, |
| conversion_char, arglocs); |
| } |
| |
| return true; |
| } |
| |
| /* Describes "paired tokens" within the format string that are |
| expected to be balanced. */ |
| |
| class baltoks_t |
| { |
| public: |
| baltoks_t (): singlequote (), doublequote () { } |
| |
| typedef auto_vec<const char *> balanced_tokens_t; |
| /* Vectors of pointers to opening brackets ('['), curly brackets ('{'), |
| quoting directives (like GCC "%<"), parentheses, and angle brackets |
| ('<'). Used to detect unbalanced tokens. */ |
| balanced_tokens_t brackets; |
| balanced_tokens_t curly; |
| balanced_tokens_t quotdirs; |
| balanced_tokens_t parens; |
| balanced_tokens_t pointy; |
| /* Pointer to the last opening quote. */ |
| const char *singlequote; |
| const char *doublequote; |
| }; |
| |
| /* Describes a keyword, operator, or other name. */ |
| |
| struct token_t |
| { |
| const char *name; /* Keyword/operator name. */ |
| unsigned char len; /* Its length. */ |
| const char *alt; /* Alternate spelling. */ |
| }; |
| |
| /* Helper for initializing global token_t arrays below. */ |
| #define NAME(name) { name, sizeof name - 1, NULL } |
| |
| /* C/C++ operators that are expected to be quoted within the format |
| string. */ |
| |
| static const token_t c_opers[] = |
| { |
| NAME ("!="), NAME ("%="), NAME ("&&"), NAME ("&="), NAME ("*="), |
| NAME ("++"), NAME ("+="), NAME ("--"), NAME ("-="), NAME ("->"), |
| NAME ("/="), NAME ("<<"), NAME ("<<="), NAME ("<="), NAME ("=="), |
| NAME (">="), NAME (">>="), NAME (">>"), NAME ("?:"), NAME ("^="), |
| NAME ("|="), NAME ("||") |
| }; |
| |
| static const token_t cxx_opers[] = |
| { |
| NAME ("->*"), NAME (".*"), NAME ("::"), NAME ("<=>") |
| }; |
| |
| /* Common C/C++ keywords that are expected to be quoted within the format |
| string. Keywords like auto, inline, or volatile are exccluded because |
| they are sometimes used in common terms like /auto variables/, /inline |
| function/, or /volatile access/ where they should not be quoted. */ |
| |
| static const token_t c_keywords[] = |
| { |
| #undef NAME |
| #define NAME(name, alt) { name, sizeof name - 1, alt } |
| |
| NAME ("alignas", NULL), |
| NAME ("alignof", NULL), |
| NAME ("asm", NULL), |
| NAME ("bool", NULL), |
| NAME ("char", NULL), |
| NAME ("const %", NULL), |
| NAME ("const-qualified", "%<const%>-qualified"), |
| NAME ("float", NULL), |
| NAME ("ifunc", NULL), |
| NAME ("int", NULL), |
| NAME ("long double", NULL), |
| NAME ("long int", NULL), |
| NAME ("long long", NULL), |
| NAME ("malloc", NULL), |
| NAME ("noclone", NULL), |
| NAME ("noinline", NULL), |
| NAME ("nonnull", NULL), |
| NAME ("noreturn", NULL), |
| NAME ("nothrow", NULL), |
| NAME ("offsetof", NULL), |
| NAME ("readonly", "read-only"), |
| NAME ("readwrite", "read-write"), |
| NAME ("restrict %", NULL), |
| NAME ("restrict-qualified", "%<restrict%>-qualified"), |
| NAME ("short int", NULL), |
| NAME ("signed char", NULL), |
| NAME ("signed int", NULL), |
| NAME ("signed long", NULL), |
| NAME ("signed short", NULL), |
| NAME ("sizeof", NULL), |
| NAME ("typeof", NULL), |
| NAME ("unsigned char", NULL), |
| NAME ("unsigned int", NULL), |
| NAME ("unsigned long", NULL), |
| NAME ("unsigned short", NULL), |
| NAME ("volatile %", NULL), |
| NAME ("volatile-qualified", "%<volatile%>-qualified"), |
| NAME ("weakref", NULL), |
| }; |
| |
| static const token_t cxx_keywords[] = |
| { |
| /* C++ only keywords and operators. */ |
| NAME ("catch", NULL), |
| NAME ("constexpr if", NULL), |
| NAME ("constexpr", NULL), |
| NAME ("constinit", NULL), |
| NAME ("consteval", NULL), |
| NAME ("decltype", NULL), |
| NAME ("nullptr", NULL), |
| NAME ("operator delete", NULL), |
| NAME ("operator new", NULL), |
| NAME ("typeid", NULL), |
| NAME ("typeinfo", NULL) |
| }; |
| |
| /* Blacklisted words such as misspellings that should be avoided in favor |
| of the specified alternatives. */ |
| static const struct |
| { |
| const char *name; /* Bad word. */ |
| unsigned char len; /* Its length. */ |
| const char *alt; /* Preferred alternative. */ |
| } badwords[] = |
| { |
| NAME ("arg", "argument"), |
| NAME ("bitfield", "bit-field"), |
| NAME ("builtin function", "built-in function"), |
| NAME ("can not", "cannot"), |
| NAME ("commandline option", "command-line option"), |
| NAME ("commandline", "command line"), |
| NAME ("command line option", "command-line option"), |
| NAME ("decl", "declaration"), |
| NAME ("enumeral", "enumerated"), |
| NAME ("floating point", "floating-point"), |
| NAME ("nonstatic", "non-static"), |
| NAME ("non-zero", "nonzero"), |
| NAME ("reg", "register"), |
| NAME ("stmt", "statement"), |
| }; |
| |
| /* Common contractions that should be avoided in favor of the specified |
| alternatives. */ |
| |
| static const struct |
| { |
| const char *name; /* Contraction. */ |
| unsigned char len; /* Its length. */ |
| const char *alt; /* Preferred alternative. */ |
| } contrs[] = |
| { |
| NAME ("can't", "cannot"), |
| NAME ("didn't", "did not"), |
| /* These are commonly abused. Avoid diagnosing them for now. |
| NAME ("isn't", "is not"), |
| NAME ("don't", "is not"), |
| */ |
| NAME ("mustn't", "must not"), |
| NAME ("needn't", "need not"), |
| NAME ("should't", "should not"), |
| NAME ("that's", "that is"), |
| NAME ("there's", "there is"), |
| NAME ("they're", "they are"), |
| NAME ("what's", "what is"), |
| NAME ("won't", "will not") |
| }; |
| |
| /* Check for unquoted TOKENS. FORMAT_STRING_LOC is the location of |
| the format string, FORMAT_STRING_CST the format string itself (as |
| a tree), ORIG_FORMAT_CHARS and FORMAT_CHARS are pointers to |
| the beginning of the format string and the character currently |
| being processed, and BALTOKS describes paired "tokens" within |
| the format string that are expected to be balanced. |
| Returns a pointer to the last processed character or null when |
| nothing was done. */ |
| |
| static const char* |
| check_tokens (const token_t *tokens, unsigned ntoks, |
| location_t format_string_loc, tree format_string_cst, |
| const char *orig_format_chars, const char *format_chars, |
| baltoks_t &baltoks) |
| { |
| /* For brevity. */ |
| const int opt = OPT_Wformat_diag; |
| /* Zero-based starting position of a problem sequence. */ |
| int fmtchrpos = format_chars - orig_format_chars; |
| |
| /* For identifier-like "words," set to the word length. */ |
| unsigned wlen = 0; |
| /* Set for an operator, clear for an identifier/word. */ |
| bool is_oper = false; |
| bool underscore = false; |
| |
| if (format_chars[0] == '_' || ISALPHA (format_chars[0])) |
| { |
| while (format_chars[wlen] == '_' || ISALNUM (format_chars[wlen])) |
| { |
| underscore |= format_chars[wlen] == '_'; |
| ++wlen; |
| } |
| } |
| else |
| is_oper = true; |
| |
| for (unsigned i = 0; i != ntoks; ++i) |
| { |
| unsigned toklen = tokens[i].len; |
| |
| if (toklen < wlen |
| || strncmp (format_chars, tokens[i].name, toklen)) |
| continue; |
| |
| if (toklen == 2 |
| && format_chars - orig_format_chars > 0 |
| && (TOUPPER (format_chars[-1]) == 'C' |
| || TOUPPER (format_chars[-1]) == 'G')) |
| return format_chars + toklen - 1; /* Reference to C++ or G++. */ |
| |
| if (ISPUNCT (format_chars[toklen - 1])) |
| { |
| if (format_chars[toklen - 1] == format_chars[toklen]) |
| return NULL; /* Operator followed by another punctuator. */ |
| } |
| else if (ISALNUM (format_chars[toklen])) |
| return NULL; /* Keyword prefix for a longer word. */ |
| |
| if (toklen == 2 |
| && format_chars[0] == '-' |
| && format_chars[1] == '-' |
| && ISALNUM (format_chars[2])) |
| return NULL; /* Probably option like --help. */ |
| |
| /* Allow this ugly warning for the time being. */ |
| if (toklen == 2 |
| && format_chars - orig_format_chars > 6 |
| && !strncmp (format_chars - 7, " count >= width of ", 19)) |
| return format_chars + 10; |
| |
| /* The token is a type if it ends in an alphabetic character. */ |
| bool is_type = (ISALPHA (tokens[i].name[toklen - 1]) |
| && strchr (tokens[i].name, ' ')); |
| |
| /* Backtrack to the last alphabetic character (for tokens whose |
| names end in '%'). */ |
| if (!is_oper) |
| while (!ISALPHA (tokens[i].name[toklen - 1])) |
| --toklen; |
| |
| if (format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + toklen, opt, |
| (is_type |
| ? G_("unquoted type name %<%.*s%> in format") |
| : (is_oper |
| ? G_("unquoted operator %<%.*s%> in format") |
| : G_("unquoted keyword %<%.*s%> in format"))), |
| toklen, format_chars) |
| && tokens[i].alt) |
| inform (format_string_loc, "use %qs instead", tokens[i].alt); |
| |
| return format_chars + toklen - 1; |
| } |
| |
| /* Diagnose unquoted __attribute__. Consider any parenthesized |
| argument to the attribute to avoid redundant warnings for |
| the double parentheses that might follow. */ |
| if (!strncmp (format_chars, "__attribute", sizeof "__attribute" - 1)) |
| { |
| unsigned nchars = sizeof "__attribute" - 1; |
| while ('_' == format_chars[nchars]) |
| ++nchars; |
| |
| for (int i = nchars; format_chars[i]; ++i) |
| if (' ' != format_chars[i]) |
| { |
| nchars = i; |
| break; |
| } |
| |
| if (format_chars[nchars] == '(') |
| { |
| baltoks.parens.safe_push (format_chars + nchars); |
| |
| ++nchars; |
| bool close = false; |
| if (format_chars[nchars] == '(') |
| { |
| baltoks.parens.safe_push (format_chars + nchars); |
| close = true; |
| ++nchars; |
| } |
| for (int i = nchars; format_chars[i]; ++i) |
| if (')' == format_chars[i]) |
| { |
| if (baltoks.parens.length () > 0) |
| baltoks.parens.pop (); |
| nchars = i + 1; |
| break; |
| } |
| |
| if (close && format_chars[nchars] == ')') |
| { |
| if (baltoks.parens.length () > 0) |
| baltoks.parens.pop (); |
| ++nchars; |
| } |
| } |
| |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted attribute in format"); |
| return format_chars + nchars - 1; |
| } |
| |
| /* Diagnose unquoted built-ins. */ |
| if (format_chars[0] == '_' |
| && format_chars[1] == '_' |
| && (!strncmp (format_chars + 2, "atomic", sizeof "atomic" - 1) |
| || !strncmp (format_chars + 2, "builtin", sizeof "builtin" - 1) |
| || !strncmp (format_chars + 2, "sync", sizeof "sync" - 1))) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + wlen, opt, |
| "unquoted name of built-in function %<%.*s%> " |
| "in format", |
| wlen, format_chars); |
| return format_chars + wlen - 1; |
| } |
| |
| /* Diagnose unquoted substrings of alphanumeric characters containing |
| underscores. They most likely refer to identifiers and should be |
| quoted. */ |
| if (underscore) |
| format_warning_substr (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| format_chars + wlen - orig_format_chars, |
| opt, |
| "unquoted identifier or keyword %<%.*s%> in format", |
| wlen, format_chars); |
| else |
| { |
| /* Diagnose some common misspellings. */ |
| for (unsigned i = 0; i != sizeof badwords / sizeof *badwords; ++i) |
| { |
| unsigned badwlen = strspn (badwords[i].name, " -"); |
| if (wlen >= badwlen |
| && (wlen <= badwords[i].len |
| || (wlen == badwords[i].len + 1U |
| && TOUPPER (format_chars[wlen - 1]) == 'S')) |
| && !strncasecmp (format_chars, badwords[i].name, badwords[i].len)) |
| { |
| /* Handle singular as well as plural forms of all bad words |
| even though the latter don't necessarily make sense for |
| all of the former (like "can nots"). */ |
| badwlen = badwords[i].len; |
| const char *plural = ""; |
| if (TOUPPER (format_chars[badwlen]) == 'S') |
| { |
| ++badwlen; |
| plural = "s"; |
| } |
| |
| /* As an exception, don't warn about "decl-specifier*" since |
| it's a C++ grammar production. */ |
| if (badwords[i].name[0] == 'd' |
| && strncmp (format_chars, "decl-specifier", |
| strlen ("decl-specifier")) == 0) |
| continue; |
| |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + badwords[i].len, |
| opt, |
| "misspelled term %<%.*s%> in format; " |
| "use %<%s%s%> instead", |
| badwlen, format_chars, |
| badwords[i].alt, plural); |
| |
| return format_chars + badwords[i].len - 1; |
| } |
| } |
| |
| /* Skip C++/G++. */ |
| if (!strncasecmp (format_chars, "c++", 3) |
| || !strncasecmp (format_chars, "g++", 3)) |
| return format_chars + 2; |
| } |
| |
| return wlen ? format_chars + wlen - 1 : NULL; |
| } |
| |
| /* Check plain text in a format string of a GCC diagnostic function |
| for common quoting, punctuation, and spelling mistakes, and issue |
| -Wformat-diag warnings if they are found. FORMAT_STRING_LOC is |
| the location of the format string, FORMAT_STRING_CST the format |
| string itself (as a tree), ORIG_FORMAT_CHARS and FORMAT_CHARS are |
| pointers to the beginning of the format string and the character |
| currently being processed, and BALTOKS describes paired "tokens" |
| within the format string that are expected to be balanced. |
| Returns a pointer to the last processed character. */ |
| |
| static const char* |
| check_plain (location_t format_string_loc, tree format_string_cst, |
| const char *orig_format_chars, const char *format_chars, |
| baltoks_t &baltoks) |
| { |
| /* For brevity. */ |
| const int opt = OPT_Wformat_diag; |
| /* Zero-based starting position of a problem sequence. */ |
| int fmtchrpos = format_chars - orig_format_chars; |
| |
| if (*format_chars == '%') |
| { |
| /* Diagnose %<%s%> and suggest using %qs instead. */ |
| if (!strncmp (format_chars, "%<%s%>", 6)) |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + 6, opt, |
| "quoted %qs directive in format; " |
| "use %qs instead", "%s", "%qs"); |
| else if (format_chars - orig_format_chars > 2 |
| && !strncasecmp (format_chars - 3, "can%'t", 6)) |
| format_warning_substr (format_string_loc, |
| format_string_cst, |
| fmtchrpos - 3, fmtchrpos + 3, opt, |
| "contraction %<%.*s%> in format; " |
| "use %qs instead", |
| 6, format_chars - 3, "cannot"); |
| |
| return format_chars; |
| } |
| |
| if (baltoks.quotdirs.length ()) |
| { |
| /* Skip over all plain text within a quoting directive until |
| the next directive. */ |
| while (*format_chars && '%' != *format_chars) |
| ++format_chars; |
| |
| return format_chars; |
| } |
| |
| /* The length of the problem sequence. */ |
| int nchars = 0; |
| |
| /* Diagnose any whitespace characters other than <space> but only |
| leading, trailing, and two or more consecutive <space>s. Do |
| this before diagnosing control characters because whitespace |
| is a subset of controls. */ |
| const char *other_than_space = NULL; |
| while (ISSPACE (format_chars[nchars])) |
| { |
| if (format_chars[nchars] != ' ' && !other_than_space) |
| other_than_space = format_chars + nchars; |
| ++nchars; |
| } |
| |
| if (nchars) |
| { |
| /* This is the most common problem: go the extra mile to describe |
| the problem in as much helpful detail as possible. */ |
| if (other_than_space) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted whitespace character %qc in format", |
| *other_than_space); |
| return format_chars + nchars - 1; |
| } |
| |
| if (fmtchrpos == 0) |
| /* Accept strings of leading spaces with no warning. */ |
| return format_chars + nchars - 1; |
| |
| if (!format_chars[nchars]) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "spurious trailing space in format"); |
| return format_chars + nchars - 1; |
| } |
| |
| if (nchars > 1) |
| { |
| if (nchars == 2 |
| && orig_format_chars < format_chars |
| && format_chars[-1] == '.' |
| && format_chars[0] == ' ' |
| && format_chars[1] == ' ') |
| { |
| /* A period followed by two spaces. */ |
| if (ISUPPER (*orig_format_chars)) |
| { |
| /* If the part before the period is a capitalized |
| sentence check to make sure that what follows |
| is also capitalized. */ |
| if (ISLOWER (format_chars[2])) |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "inconsistent capitalization in " |
| "format"); |
| } |
| } |
| else |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted sequence of %i consecutive " |
| "space characters in format", nchars); |
| return format_chars + nchars - 1; |
| } |
| |
| format_chars += nchars; |
| nchars = 0; |
| } |
| |
| fmtchrpos = format_chars - orig_format_chars; |
| |
| /* Diagnose any unquoted control characters other than the terminating |
| NUL. */ |
| while (format_chars[nchars] && ISCNTRL (format_chars[nchars])) |
| ++nchars; |
| |
| if (nchars > 1) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted control characters in format"); |
| return format_chars + nchars - 1; |
| } |
| if (nchars) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted control character %qc in format", |
| *format_chars); |
| return format_chars + nchars - 1; |
| } |
| |
| if (ISPUNCT (format_chars[0])) |
| { |
| size_t nelts = sizeof c_opers / sizeof *c_opers; |
| if (const char *ret = check_tokens (c_opers, nelts, |
| format_string_loc, format_string_cst, |
| orig_format_chars, format_chars, |
| baltoks)) |
| return ret; |
| |
| nelts = c_dialect_cxx () ? sizeof cxx_opers / sizeof *cxx_opers : 0; |
| if (const char *ret = check_tokens (cxx_opers, nelts, |
| format_string_loc, format_string_cst, |
| orig_format_chars, format_chars, |
| baltoks)) |
| return ret; |
| } |
| |
| if (ISALPHA (format_chars[0])) |
| { |
| size_t nelts = sizeof c_keywords / sizeof *c_keywords; |
| if (const char *ret = check_tokens (c_keywords, nelts, |
| format_string_loc, format_string_cst, |
| orig_format_chars, format_chars, |
| baltoks)) |
| return ret; |
| |
| nelts = c_dialect_cxx () ? sizeof cxx_keywords / sizeof *cxx_keywords : 0; |
| if (const char *ret = check_tokens (cxx_keywords, nelts, |
| format_string_loc, format_string_cst, |
| orig_format_chars, format_chars, |
| baltoks)) |
| return ret; |
| } |
| |
| nchars = 0; |
| |
| /* Diagnose unquoted options. */ |
| if ((format_chars == orig_format_chars |
| || format_chars[-1] == ' ') |
| && format_chars[0] == '-' |
| && ((format_chars[1] == '-' |
| && ISALPHA (format_chars[2])) |
| || ISALPHA (format_chars[1]))) |
| { |
| nchars = 1; |
| while (ISALNUM (format_chars[nchars]) |
| || '_' == format_chars[nchars] |
| || '-' == format_chars[nchars] |
| || '+' == format_chars[nchars]) |
| ++nchars; |
| |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted option name %<%.*s%> in format", |
| nchars, format_chars); |
| return format_chars + nchars - 1; |
| } |
| |
| /* Diagnose leading, trailing, and two or more consecutive punctuation |
| characters. */ |
| const char *unbalanced = NULL; |
| while ('%' != format_chars[nchars] |
| && ISPUNCT (format_chars[nchars]) |
| && !unbalanced) |
| { |
| switch (format_chars[nchars]) |
| { |
| case '[': |
| baltoks.brackets.safe_push (format_chars + nchars); |
| break; |
| case '{': |
| baltoks.curly.safe_push (format_chars + nchars); |
| break; |
| case '(': |
| baltoks.parens.safe_push (format_chars + nchars); |
| break; |
| case '<': |
| baltoks.pointy.safe_push (format_chars + nchars); |
| break; |
| |
| case ']': |
| if (baltoks.brackets.length () > 0) |
| baltoks.brackets.pop (); |
| else |
| unbalanced = format_chars + nchars; |
| break; |
| case '}': |
| if (baltoks.curly.length () > 0) |
| baltoks.curly.pop (); |
| else |
| unbalanced = format_chars + nchars; |
| break; |
| case ')': |
| if (baltoks.parens.length () > 0) |
| baltoks.parens.pop (); |
| else |
| unbalanced = format_chars + nchars; |
| break; |
| case '>': |
| if (baltoks.pointy.length () > 0) |
| baltoks.pointy.pop (); |
| else |
| unbalanced = format_chars + nchars; |
| break; |
| } |
| |
| ++nchars; |
| } |
| |
| if (unbalanced) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unbalanced punctuation character %qc in format", |
| *unbalanced); |
| return format_chars + nchars - 1; |
| } |
| |
| if (nchars) |
| { |
| /* Consider any identifier that follows the pound ('#') sign |
| a preprocessing directive. */ |
| if (nchars == 1 |
| && format_chars[0] == '#' |
| && ISALPHA (format_chars[1])) |
| { |
| while (ISALNUM (format_chars[nchars]) |
| || format_chars[nchars] == '_') |
| ++nchars; |
| |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted preprocessing directive %<%.*s%> " |
| "in format", nchars, format_chars); |
| return format_chars + nchars - 1; |
| } |
| |
| /* Diagnose a bare single quote. */ |
| if (nchars == 1 |
| && format_chars[0] == '\'' |
| && format_chars - orig_format_chars |
| && ISALPHA (format_chars[-1]) |
| && ISALPHA (format_chars[1])) |
| { |
| /* Diagnose a subset of contractions that are best avoided. */ |
| for (unsigned i = 0; i != sizeof contrs / sizeof *contrs; ++i) |
| { |
| const char *apos = strchr (contrs[i].name, '\''); |
| gcc_assert (apos != NULL); |
| int off = apos - contrs[i].name; |
| |
| if (format_chars - orig_format_chars >= off |
| && !strncmp (format_chars - off, |
| contrs[i].name, contrs[i].len)) |
| { |
| format_warning_substr (format_string_loc, |
| format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "contraction %<%.*s%> in format; " |
| "use %qs instead", |
| contrs[i].len, contrs[i].name, |
| contrs[i].alt); |
| return format_chars + nchars - 1; |
| } |
| } |
| |
| if (format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "bare apostrophe %<'%> in format")) |
| inform (format_string_loc, |
| "if avoiding the apostrophe is not feasible, enclose " |
| "it in a pair of %qs and %qs directives instead", |
| "%<", "%>"); |
| return format_chars + nchars - 1; |
| } |
| |
| /* Diagnose a backtick (grave accent). */ |
| if (nchars == 1 |
| && format_chars[0] == '`') |
| { |
| if (format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "grave accent %<`%> in format")) |
| inform (format_string_loc, |
| "use the apostrophe directive %qs instead", "%'"); |
| return format_chars + nchars - 1; |
| } |
| |
| /* Diagnose a punctuation character after a space. */ |
| if (nchars == 1 |
| && format_chars - orig_format_chars |
| && format_chars[-1] == ' ' |
| && strspn (format_chars, "!?:;.,") == 1) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos - 1, fmtchrpos, opt, |
| "space followed by punctuation character " |
| "%<%c%>", format_chars[0]); |
| return format_chars; |
| } |
| |
| if (nchars == 1) |
| { |
| if (!strncmp (format_chars, "\"%s\"", 4)) |
| { |
| if (format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + 4, opt, |
| "quoted %qs directive in format", |
| "%s")) |
| inform (format_string_loc, "if using %qs is not feasible, " |
| "use %qs instead", "%qs", "\"%-s\""); |
| } |
| |
| if (format_chars[0] == '"') |
| { |
| baltoks.doublequote = baltoks.doublequote ? NULL : format_chars; |
| return format_chars + nchars - 1; |
| } |
| if (format_chars[0] == '\'') |
| { |
| baltoks.singlequote = baltoks.singlequote ? NULL : format_chars; |
| return format_chars + nchars - 1; |
| } |
| } |
| |
| if (fmtchrpos == 0) |
| { |
| if (nchars == 1 |
| && format_chars[0] == '(') |
| ; /* Text beginning in an open parenthesis. */ |
| else if (nchars == 3 |
| && !strncmp (format_chars, "...", 3) |
| && format_chars[3]) |
| ; /* Text beginning in an ellipsis. */ |
| else |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "spurious leading punctuation sequence " |
| "%<%.*s%> in format", |
| nchars, format_chars); |
| return format_chars + nchars - 1; |
| } |
| } |
| else if (!format_chars[nchars]) |
| { |
| if (nchars == 1 |
| && (format_chars[nchars - 1] == ':' |
| || format_chars[nchars - 1] == ')')) |
| ; /* Text ending in a colon or a closing parenthesis. */ |
| else if (nchars == 1 |
| && ((ISUPPER (*orig_format_chars) |
| && format_chars[nchars - 1] == '.') |
| || strspn (format_chars + nchars - 1, "?])") == 1)) |
| ; /* Capitalized sentence terminated by a single period, |
| or text ending in a question mark, closing bracket, |
| or parenthesis. */ |
| else if (nchars == 2 |
| && format_chars[0] == '?' |
| && format_chars[1] == ')') |
| ; /* A question mark after a closing parenthetical note. */ |
| else if (nchars == 2 |
| && format_chars[0] == ')' |
| && (format_chars[1] == '?' |
| || format_chars[1] == ';' |
| || format_chars[1] == ':' |
| || (ISUPPER (*orig_format_chars) |
| && format_chars[1] == '.'))) |
| ; /* Closing parenthetical note followed by a question mark, |
| semicolon, or colon at the end of the string, or by |
| a period at the end of a capitalized sentence. */ |
| else if (nchars == 3 |
| && format_chars - orig_format_chars > 0 |
| && !strncmp (format_chars, "...", 3)) |
| ; /* Text ending in the ellipsis. */ |
| else |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "spurious trailing punctuation sequence " |
| "%<%.*s%> in format", |
| nchars, format_chars); |
| |
| return format_chars + nchars - 1; |
| } |
| else if (nchars == 2 |
| && format_chars[0] == ')' |
| && (format_chars[1] == ':' |
| || format_chars[1] == ';' |
| || format_chars[1] == ',') |
| && format_chars[2] == ' ') |
| ; /* Closing parenthetical note followed by a colon, semicolon |
| or a comma followed by a space in the middle of the string. */ |
| else if (nchars > 1) |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted sequence of %i consecutive " |
| "punctuation characters %q.*s in format", |
| nchars, nchars, format_chars); |
| return format_chars + nchars - 1; |
| } |
| |
| nchars = 0; |
| |
| /* Finally, diagnose any unquoted non-graph, non-punctuation characters |
| other than the terminating NUL. */ |
| while (format_chars[nchars] |
| && '%' != format_chars[nchars] |
| && !ISPUNCT (format_chars[nchars]) |
| && !ISGRAPH (format_chars[nchars])) |
| ++nchars; |
| |
| if (nchars > 1) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted non-graph characters in format"); |
| return format_chars + nchars - 1; |
| } |
| if (nchars) |
| { |
| format_warning_substr (format_string_loc, format_string_cst, |
| fmtchrpos, fmtchrpos + nchars, opt, |
| "unquoted non-graph character %qc in format", |
| *format_chars); |
| return format_chars + nchars - 1; |
| } |
| |
| return format_chars; |
| } |
| |
| /* Diagnose unbalanced tokens described by BALTOKS in format string |
| ORIG_FORMAT_CHARS and the corresponding FORMAT_STRING_CST. */ |
| |
| static void |
| maybe_diag_unbalanced_tokens (location_t format_string_loc, |
| const char *orig_format_chars, |
| tree format_string_cst, |
| baltoks_t &baltoks) |
| { |
| const char *unbalanced = NULL; |
| |
| if (baltoks.brackets.length ()) |
| unbalanced = baltoks.brackets.pop (); |
| else if (baltoks.curly.length ()) |
| unbalanced = baltoks.curly.pop (); |
| else if (baltoks.parens.length ()) |
| unbalanced = baltoks.parens.pop (); |
| else if (baltoks.pointy.length ()) |
| unbalanced = baltoks.pointy.pop (); |
| |
| if (unbalanced) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| unbalanced - orig_format_chars + 1, |
| OPT_Wformat_diag, |
| "unbalanced punctuation character %<%c%> in format", |
| *unbalanced); |
| |
| if (baltoks.quotdirs.length ()) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| baltoks.quotdirs.pop () - orig_format_chars, |
| OPT_Wformat_, |
| "unterminated quoting directive"); |
| |
| const char *quote |
| = baltoks.singlequote ? baltoks.singlequote : baltoks.doublequote; |
| |
| if (quote) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| quote - orig_format_chars + 1, |
| OPT_Wformat_diag, |
| "unterminated quote character %<%c%> in format", |
| *quote); |
| } |
| |
| /* Do the main part of checking a call to a format function. FORMAT_CHARS |
| is the NUL-terminated format string (which at this point may contain |
| internal NUL characters); FORMAT_LENGTH is its length (excluding the |
| terminating NUL character). ARG_NUM is one less than the number of |
| the first format argument to check; PARAMS points to that format |
| argument in the list of arguments. */ |
| |
| static void |
| check_format_info_main (format_check_results *res, |
| function_format_info *info, const char *format_chars, |
| location_t fmt_param_loc, tree format_string_cst, |
| int format_length, tree params, |
| unsigned HOST_WIDE_INT arg_num, |
| object_allocator <format_wanted_type> &fwt_pool, |
| vec<location_t> *arglocs) |
| { |
| const char * const orig_format_chars = format_chars; |
| const tree first_fillin_param = params; |
| |
| const format_kind_info * const fki = &format_types[info->format_type]; |
| const format_flag_spec * const flag_specs = fki->flag_specs; |
| const location_t format_string_loc = res->format_string_loc; |
| |
| /* -1 if no conversions taking an operand have been found; 0 if one has |
| and it didn't use $; 1 if $ formats are in use. */ |
| int has_operand_number = -1; |
| |
| /* Vectors of pointers to opening quoting directives (like GCC "%<"), |
| opening braces, brackets, and parentheses. Used to detect unbalanced |
| tokens. */ |
| baltoks_t baltoks; |
| |
| /* Pointers to the most recent color directives (like GCC's "%r or %R"). |
| A starting color directive much be terminated before the end of |
| the format string. A terminating directive makes no sense without |
| a prior starting directive. */ |
| const char *color_begin = NULL; |
| const char *color_end = NULL; |
| |
| init_dollar_format_checking (info->first_arg_num, first_fillin_param); |
| |
| /* In GCC diagnostic functions check plain directives (substrings within |
| the format string that don't start with %) for quoting and punctuations |
| problems. */ |
| bool ck_plain = (!info->is_raw |
| && (info->format_type == gcc_diag_format_type |
| || info->format_type == gcc_tdiag_format_type |
| || info->format_type == gcc_cdiag_format_type |
| || info->format_type == gcc_cxxdiag_format_type)); |
| |
| while (*format_chars != 0) |
| { |
| if (ck_plain) |
| format_chars = check_plain (format_string_loc, |
| format_string_cst, |
| orig_format_chars, format_chars, |
| baltoks); |
| |
| if (*format_chars == 0 || *format_chars++ != '%') |
| continue; |
| |
| if (*format_chars == 0) |
| { |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "spurious trailing %<%%%> in format"); |
| continue; |
| } |
| if (*format_chars == '%') |
| { |
| ++format_chars; |
| continue; |
| } |
| |
| /* ARGUMENT_PARSER ctor takes FORMAT_CHARS by reference and calls |
| to ARG_PARSER members may modify the variable. */ |
| flag_chars_t flag_chars; |
| argument_parser arg_parser (info, format_chars, format_string_cst, |
| orig_format_chars, format_string_loc, |
| flag_chars, has_operand_number, |
| first_fillin_param, fwt_pool, arglocs); |
| |
| if (!arg_parser.read_any_dollar ()) |
| return; |
| |
| if (!arg_parser.read_format_flags ()) |
| return; |
| |
| /* Read any format width, possibly * or *m$. */ |
| if (!arg_parser.read_any_format_width (params, arg_num)) |
| return; |
| |
| /* Read any format left precision (must be a number, not *). */ |
| arg_parser.read_any_format_left_precision (); |
| |
| /* Read any format precision, possibly * or *m$. */ |
| if (!arg_parser.read_any_format_precision (params, arg_num)) |
| return; |
| |
| const char *format_start = format_chars; |
| |
| arg_parser.handle_alloc_chars (); |
| |
| /* The rest of the conversion specification is the length modifier |
| (if any), and the conversion specifier, so this is where the |
| type information starts. If we need to issue a suggestion |
| about a type mismatch, then we should preserve everything up |
| to here. */ |
| const char *type_start = format_chars; |
| |
| /* Read any length modifier, if this kind of format has them. */ |
| const length_modifier len_modifier |
| = arg_parser.read_any_length_modifier (); |
| |
| /* Read any modifier (strftime E/O). */ |
| arg_parser.read_any_other_modifier (); |
| |
| char format_char = *format_chars; |
| if (format_char == 0 |
| || (!(fki->flags & (int) FMT_FLAG_FANCY_PERCENT_OK) |
| && format_char == '%')) |
| { |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "conversion lacks type at end of format"); |
| continue; |
| } |
| format_chars++; |
| |
| const format_char_info * const fci |
| = arg_parser.find_format_char_info (format_char); |
| if (!fci) |
| continue; |
| |
| flag_chars.validate (fki, fci, flag_specs, format_chars, |
| format_string_cst, |
| format_string_loc, orig_format_chars, format_char, |
| baltoks.quotdirs.length () > 0); |
| |
| const int alloc_flag = flag_chars.get_alloc_flag (fki); |
| const bool suppressed = flag_chars.assignment_suppression_p (fki); |
| |
| /* Diagnose nested or unmatched quoting directives such as GCC's |
| "%<...%<" and "%>...%>". */ |
| bool quot_begin_p = strchr (fci->flags2, '<'); |
| bool quot_end_p = strchr (fci->flags2, '>'); |
| |
| if (quot_begin_p && !quot_end_p) |
| { |
| if (baltoks.quotdirs.length ()) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "nested quoting directive"); |
| baltoks.quotdirs.safe_push (format_chars); |
| } |
| else if (!quot_begin_p && quot_end_p) |
| { |
| if (baltoks.quotdirs.length ()) |
| baltoks.quotdirs.pop (); |
| else |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "unmatched quoting directive"); |
| } |
| |
| bool color_begin_p = strchr (fci->flags2, '/'); |
| if (color_begin_p) |
| { |
| color_begin = format_chars; |
| color_end = NULL; |
| } |
| else if (strchr (fci->flags2, '\\')) |
| { |
| if (color_end) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "%qc directive redundant after prior " |
| "occurence of the same", format_char); |
| else if (!color_begin) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "unmatched color reset directive"); |
| color_end = format_chars; |
| } |
| |
| /* Diagnose directives that shouldn't appear in a quoted sequence. |
| (They are denoted by a double quote in FLAGS2.) */ |
| if (baltoks.quotdirs.length ()) |
| { |
| if (strchr (fci->flags2, '"')) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars - orig_format_chars, |
| OPT_Wformat_, |
| "%qc conversion used within a quoted " |
| "sequence", |
| format_char); |
| } |
| |
| /* Validate the pairs of flags used. */ |
| arg_parser.validate_flag_pairs (fci, format_char); |
| |
| arg_parser.give_y2k_warnings (fci, format_char); |
| |
| arg_parser.parse_any_scan_set (fci); |
| |
| tree wanted_type = NULL; |
| const char *wanted_type_name = NULL; |
| |
| if (!arg_parser.handle_conversions (fci, len_modifier, |
| wanted_type, wanted_type_name, |
| arg_num, |
| params, |
| format_char)) |
| continue; |
| |
| arg_parser.main_wanted_type.next = NULL; |
| |
| /* Finally. . .check type of argument against desired type! */ |
| if (!arg_parser.check_argument_type (fci, len_modifier, |
| wanted_type, wanted_type_name, |
| suppressed, |
| arg_num, params, |
| alloc_flag, |
| format_start, type_start, |
| fmt_param_loc, |
| format_char)) |
| return; |
| } |
| |
| if (format_chars - orig_format_chars != format_length) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| format_chars + 1 - orig_format_chars, |
| OPT_Wformat_contains_nul, |
| "embedded %<\\0%> in format"); |
| if (info->first_arg_num != 0 && params != 0 |
| && has_operand_number <= 0) |
| { |
| res->number_other--; |
| res->number_extra_args++; |
| } |
| if (has_operand_number > 0) |
| finish_dollar_format_checking (res, fki->flags & (int) FMT_FLAG_DOLLAR_GAP_POINTER_OK); |
| |
| maybe_diag_unbalanced_tokens (format_string_loc, orig_format_chars, |
| format_string_cst, baltoks); |
| |
| if (color_begin && !color_end) |
| format_warning_at_char (format_string_loc, format_string_cst, |
| color_begin - orig_format_chars, |
| OPT_Wformat_, "unterminated color directive"); |
| } |
| |
| /* Check the argument types from a single format conversion (possibly |
| including width and precision arguments). |
| |
| FMT_LOC is the location of the format conversion. |
| |
| TYPES is a singly-linked list expressing the parts of the format |
| conversion that expect argument types, and the arguments they |
| correspond to. |
| |
| OFFSET_TO_TYPE_START is the offset within the execution-charset encoded |
| format string to where type information begins for the conversion |
| (the length modifier and conversion specifier). |
| |
| CONVERSION_CHAR is the user-provided conversion specifier. |
| |
| For example, given: |
| |
| sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5); |
| |
| then FMT_LOC covers this range: |
| |
| sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5); |
| ^^^^^^^^^ |
| |
| and TYPES in this case is a three-entry singly-linked list consisting of: |
| (1) the check for the field width here: |
| sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5); |
| ^ ^^^^ |
| against arg3, and |
| (2) the check for the field precision here: |
| sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5); |
| ^^ ^^^^ |
| against arg4, and |
| (3) the check for the length modifier and conversion char here: |
| sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5); |
| ^^^ ^^^^ |
| against arg5. |
| |
| OFFSET_TO_TYPE_START is 13, the offset to the "lld" within the |
| STRING_CST: |
| |
| 0000000000111111111122 |
| 0123456789012345678901 |
| sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5); |
| ^ ^ |
| | ` CONVERSION_CHAR: 'd' |
| type starts here. */ |
| |
| static void |
| check_format_types (const substring_loc &fmt_loc, |
| format_wanted_type *types, const format_kind_info *fki, |
| int offset_to_type_start, |
| char conversion_char, |
| vec<location_t> *arglocs) |
| { |
| for (; types != 0; types = types->next) |
| { |
| tree cur_param; |
| tree cur_type; |
| tree orig_cur_type; |
| tree wanted_type; |
| int arg_num; |
| int i; |
| int char_type_flag; |
| |
| wanted_type = types->wanted_type; |
| arg_num = types->arg_num; |
| |
| /* The following should not occur here. */ |
| gcc_assert (wanted_type); |
| gcc_assert (wanted_type != void_type_node || types->pointer_count); |
| |
| if (types->pointer_count == 0) |
| wanted_type = lang_hooks.types.type_promotes_to (wanted_type); |
| |
| wanted_type = TYPE_MAIN_VARIANT (wanted_type); |
| |
| cur_param = types->param; |
| if (!cur_param) |
| { |
| format_type_warning (fmt_loc, UNKNOWN_LOCATION, types, wanted_type, |
| NULL, fki, offset_to_type_start, |
| conversion_char); |
| continue; |
| } |
| |
| cur_type = TREE_TYPE (cur_param); |
| if (cur_type == error_mark_node) |
| continue; |
| orig_cur_type = cur_type; |
| char_type_flag = 0; |
| |
| location_t param_loc = UNKNOWN_LOCATION; |
| if (EXPR_HAS_LOCATION (cur_param)) |
| param_loc = EXPR_LOCATION (cur_param); |
| else if (arglocs) |
| { |
| /* arg_num is 1-based. */ |
| gcc_assert (types->arg_num > 0); |
| param_loc = (*arglocs)[types->arg_num - 1]; |
| } |
| |
| STRIP_NOPS (cur_param); |
| |
| /* Check the types of any additional pointer arguments |
| that precede the "real" argument. */ |
| for (i = 0; i < types->pointer_count; ++i) |
| { |
| if (TREE_CODE (cur_type) == POINTER_TYPE) |
| { |
| cur_type = TREE_TYPE (cur_type); |
| if (cur_type == error_mark_node) |
| break; |
| |
| /* Check for writing through a NULL pointer. */ |
| if (types->writing_in_flag |
| && i == 0 |
| && cur_param != 0 |
| && integer_zerop (cur_param)) |
| warning (OPT_Wformat_, "writing through null pointer " |
| "(argument %d)", arg_num); |
| |
| /* Check for reading through a NULL pointer. Ignore |
| printf-family of functions as they are checked for |
| null arguments by the middle-end. */ |
| if (fki->conversion_specs != print_char_table |
| && types->reading_from_flag |
| && i == 0 |
| && cur_param != 0 |
| && integer_zerop (cur_param)) |
| warning (OPT_Wformat_, "reading through null pointer " |
| "(argument %d)", arg_num); |
| |
| if (cur_param != 0 && TREE_CODE (cur_param) == ADDR_EXPR) |
| cur_param = TREE_OPERAND (cur_param, 0); |
| else |
| cur_param = 0; |
| |
| /* See if this is an attempt to write into a const type with |
| scanf or with printf "%n". Note: the writing in happens |
| at the first indirection only, if for example |
| void * const * is passed to scanf %p; passing |
| const void ** is simply passing an incompatible type. */ |
| if (types->writing_in_flag |
| && i == 0 |
| && (TYPE_READONLY (cur_type) |
| || (cur_param != 0 |
| && (CONSTANT_CLASS_P (cur_param) |
| || (DECL_P (cur_param) |
| && TREE_READONLY (cur_param)))))) |
| warning (OPT_Wformat_, "writing into constant object " |
| "(argument %d)", arg_num); |
| |
| /* If there are extra type qualifiers beyond the first |
| indirection, then this makes the types technically |
| incompatible. */ |
| if (i > 0 |
| && pedantic |
| && (TYPE_READONLY (cur_type) |
| || TYPE_VOLATILE (cur_type) |
| || TYPE_ATOMIC (cur_type) |
| || TYPE_RESTRICT (cur_type))) |
| warning (OPT_Wformat_, "extra type qualifiers in format " |
| "argument (argument %d)", |
| arg_num); |
| |
| } |
| else |
| { |
| format_type_warning (fmt_loc, param_loc, |
| types, wanted_type, orig_cur_type, fki, |
| offset_to_type_start, conversion_char); |
| break; |
| } |
| } |
| |
| if (i < types->pointer_count) |
| continue; |
| |
| cur_type = TYPE_MAIN_VARIANT (cur_type); |
| |
| /* Check whether the argument type is a character type. This leniency |
| only applies to certain formats, flagged with 'c'. */ |
| if (types->char_lenient_flag) |
| char_type_flag = (cur_type == char_type_node |
| || cur_type == signed_char_type_node |
| || cur_type == unsigned_char_type_node); |
| |
| /* Check the type of the "real" argument, if there's a type we want. */ |
| if (lang_hooks.types_compatible_p (wanted_type, cur_type)) |
| continue; |
| /* If we want 'void *', allow any pointer type. |
| (Anything else would already have got a warning.) |
| With -Wpedantic, only allow pointers to void and to character |
| types. */ |
| if (wanted_type == void_type_node |
| && (!pedantic || (i == 1 && char_type_flag))) |
| continue; |
| /* Don't warn about differences merely in signedness, unless |
| -Wpedantic. With -Wpedantic, warn if the type is a pointer |
| target and not a character type, and for character types at |
| a second level of indirection. */ |
| if (TREE_CODE (wanted_type) == INTEGER_TYPE |
| && TREE_CODE (cur_type) == INTEGER_TYPE |
| && ((!pedantic && !warn_format_signedness) |
| || (i == 0 && !warn_format_signedness) |
| || (i == 1 && char_type_flag)) |
| && (TYPE_UNSIGNED (wanted_type) |
| ? wanted_type == c_common_unsigned_type (cur_type) |
| : wanted_type == c_common_signed_type (cur_type))) |
| continue; |
| /* Don't warn about differences merely in signedness if we know |
| that the current type is integer-promoted and its original type |
| was unsigned such as that it is in the range of WANTED_TYPE. */ |
| if (TREE_CODE (wanted_type) == INTEGER_TYPE |
| && TREE_CODE (cur_type) == INTEGER_TYPE |
| && warn_format_signedness |
| && TYPE_UNSIGNED (wanted_type) |
| && cur_param != NULL_TREE |
| && TREE_CODE (cur_param) == NOP_EXPR) |
| { |
| tree t = TREE_TYPE (TREE_OPERAND (cur_param, 0)); |
| if (TYPE_UNSIGNED (t) |
| && cur_type == lang_hooks.types.type_promotes_to (t)) |
| continue; |
| } |
| /* Likewise, "signed char", "unsigned char" and "char" are |
| equivalent but the above test won't consider them equivalent. */ |
| if (wanted_type == char_type_node |
| && (!pedantic || i < 2) |
| && char_type_flag) |
| continue; |
| if (types->scalar_identity_flag |
| && (TREE_CODE (cur_type) == TREE_CODE (wanted_type) |
| || (INTEGRAL_TYPE_P (cur_type) |
| && INTEGRAL_TYPE_P (wanted_type))) |
| && TYPE_PRECISION (cur_type) == TYPE_PRECISION (wanted_type)) |
| continue; |
| /* Now we have a type mismatch. */ |
| format_type_warning (fmt_loc, param_loc, types, |
| wanted_type, orig_cur_type, fki, |
| offset_to_type_start, conversion_char); |
| } |
| } |
| |
| /* Given type TYPE, attempt to dereference the type N times |
| (e.g. from ("int ***", 2) to "int *") |
| |
| Return the derefenced type, with any qualifiers |
| such as "const" stripped from the result, or |
| NULL if unsuccessful (e.g. TYPE is not a pointer type). */ |
| |
| static tree |
| deref_n_times (tree type, int n) |
| { |
| gcc_assert (type); |
| |
| for (int i = n; i > 0; i--) |
| { |
| if (TREE_CODE (type) != POINTER_TYPE) |
| return NULL_TREE; |
| type = TREE_TYPE (type); |
| } |
| /* Strip off any "const" etc. */ |
| return build_qualified_type (type, 0); |
| } |
| |
| /* Lookup the format code for FORMAT_LEN within FLI, |
| returning the string code for expressing it, or NULL |
| if it is not found. */ |
| |
| static const char * |
| get_modifier_for_format_len (const format_length_info *fli, |
| enum format_lengths format_len) |
| { |
| for (; fli->name; fli++) |
| { |
| if (fli->index == format_len) |
| return fli->name; |
| if (fli->double_index == format_len) |
| return fli->double_name; |
| } |
| return NULL; |
| } |
| |
| #if CHECKING_P |
| |
| namespace selftest { |
| |
| static void |
| test_get_modifier_for_format_len () |
| { |
| ASSERT_STREQ ("h", |
| get_modifier_for_format_len (printf_length_specs, FMT_LEN_h)); |
| ASSERT_STREQ ("hh", |
| get_modifier_for_format_len (printf_length_specs, FMT_LEN_hh)); |
| ASSERT_STREQ ("L", |
| get_modifier_for_format_len (printf_length_specs, FMT_LEN_L)); |
| ASSERT_EQ (NULL, |
| get_modifier_for_format_len (printf_length_specs, FMT_LEN_none)); |
| } |
| |
| } // namespace selftest |
| |
| #endif /* CHECKING_P */ |
| |
| /* Determine if SPEC_TYPE and ARG_TYPE are sufficiently similar for a |
| format_type_detail using SPEC_TYPE to be offered as a suggestion for |
| Wformat type errors where the argument has type ARG_TYPE. */ |
| |
| static bool |
| matching_type_p (tree spec_type, tree arg_type) |
| { |
| gcc_assert (spec_type); |
| gcc_assert (arg_type); |
| |
| /* If any of the types requires structural equality, we can't compare |
| their canonical types. */ |
| if (TYPE_STRUCTURAL_EQUALITY_P (spec_type) |
| || TYPE_STRUCTURAL_EQUALITY_P (arg_type)) |
| return false; |
| |
| spec_type = TYPE_CANONICAL (spec_type); |
| arg_type = TYPE_CANONICAL (arg_type); |
| |
| if (TREE_CODE (spec_type) == INTEGER_TYPE |
| && TREE_CODE (arg_type) == INTEGER_TYPE |
| && (TYPE_UNSIGNED (spec_type) |
| ? spec_type == c_common_unsigned_type (arg_type) |
| : spec_type == c_common_signed_type (arg_type))) |
| return true; |
| |
| return spec_type == arg_type; |
| } |
| |
| /* Subroutine of get_format_for_type. |
| |
| Generate a string containing the length modifier and conversion specifier |
| that should be used to format arguments of type ARG_TYPE within FKI |
| (effectively the inverse of the checking code). |
| |
| If CONVERSION_CHAR is not zero (the first pass), the resulting suggestion |
| is required to use it, for correcting bogus length modifiers. |
| If CONVERSION_CHAR is zero (the second pass), then allow any suggestion |
| that matches ARG_TYPE. |
| |
| If successful, returns a non-NULL string which should be freed |
| by the caller. |
| Otherwise, returns NULL. */ |
| |
| static char * |
| get_format_for_type_1 (const format_kind_info *fki, tree arg_type, |
| char conversion_char) |
| { |
| gcc_assert (arg_type); |
| |
| const format_char_info *spec; |
| for (spec = &fki->conversion_specs[0]; |
| spec->format_chars; |
| spec++) |
| { |
| if (conversion_char) |
| if (!strchr (spec->format_chars, conversion_char)) |
| continue; |
| |
| tree effective_arg_type = deref_n_times (arg_type, |
| spec->pointer_count); |
| if (!effective_arg_type) |
| continue; |
| for (int i = 0; i < FMT_LEN_MAX; i++) |
| { |
| const format_type_detail *ftd = &spec->types[i]; |
| if (!ftd->type || *ftd->type == NULL_TREE) |
| continue; |
| if (matching_type_p (*ftd->type, effective_arg_type)) |
| { |
| const char *len_modifier |
| = get_modifier_for_format_len (fki->length_char_specs, |
| (enum format_lengths)i); |
| if (!len_modifier) |
| len_modifier = ""; |
| |
| if (conversion_char) |
| /* We found a match, using the given conversion char - the |
| length modifier was incorrect (or absent). |
| Provide a suggestion using the conversion char with the |
| correct length modifier for the type. */ |
| return xasprintf ("%s%c", len_modifier, conversion_char); |
| else |
| /* 2nd pass: no match was possible using the user-provided |
| conversion char, but we do have a match without using it. |
| Provide a suggestion using the first conversion char |
| listed for the given type. */ |
| return xasprintf ("%s%c", len_modifier, spec->format_chars[0]); |
| } |
| } |
| } |
| |
| return NULL; |
| } |
| |
| /* Generate a string containing the length modifier and conversion specifier |
| that should be used to format arguments of type ARG_TYPE within FKI |
| (effectively the inverse of the checking code). |
| |
| If successful, returns a non-NULL string which should be freed |
| by the caller. |
| Otherwise, returns NULL. */ |
| |
| static char * |
| get_format_for_type (const format_kind_info *fki, tree arg_type, |
| char conversion_char) |
| { |
| gcc_assert (arg_type); |
| gcc_assert (conversion_char); |
| |
| /* First pass: look for a format_char_info containing CONVERSION_CHAR |
| If we find one, then presumably the length modifier was incorrect |
| (or absent). */ |
| char *result = get_format_for_type_1 (fki, arg_type, conversion_char); |
| if (result) |
| return result; |
| |
| /* Second pass: we didn't find a match for CONVERSION_CHAR, so try |
| matching just on the type. */ |
| return get_format_for_type_1 (fki, arg_type, '\0'); |
| } |
| |
| /* Attempt to get a string for use as a replacement fix-it hint for the |
| source range in FMT_LOC. |
| |
| Preserve all of the text within the range of FMT_LOC up to |
| OFFSET_TO_TYPE_START, replacing the rest with an appropriate |
| length modifier and conversion specifier for ARG_TYPE, attempting |
| to keep the user-provided CONVERSION_CHAR if possible. |
| |
| For example, given a long vs long long mismatch for arg5 here: |
| |
| 000000000111111111122222222223333333333| |
| 123456789012345678901234567890123456789` column numbers |
| 0000000000111111111122| |
| 0123456789012345678901` string offsets |
| V~~~~~~~~ : range of FMT_LOC, from cols 23-31 |
| sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5); |
| ^ ^ |
| | ` CONVERSION_CHAR: 'd' |
| type starts here |
| |
| where OFFSET_TO_TYPE_START is 13 (the offset to the "lld" within the |
| STRING_CST), where the user provided: |
| %-+*.*lld |
| the result (assuming "long" argument 5) should be: |
| %-+*.*ld |
| |
| If successful, returns a non-NULL string which should be freed |
| by the caller. |
| Otherwise, returns NULL. */ |
| |
| static char * |
| get_corrected_substring (const substring_loc &fmt_loc, |
| format_wanted_type *type, tree arg_type, |
| const format_kind_info *fki, |
| int offset_to_type_start, char conversion_char) |
| { |
| /* Attempt to provide hints for argument types, but not for field widths |
| and precisions. */ |
| if (!arg_type) |
| return NULL; |
| if (type->kind != CF_KIND_FORMAT) |
| return NULL; |
| |
| /* Locate the current code within the source range, rejecting |
| any awkward cases where the format string occupies more than |
| one line. |
| Lookup the place where the type starts (including any length |
| modifiers), getting it as the caret location. */ |
| substring_loc type_loc (fmt_loc); |
| type_loc.set_caret_index (offset_to_type_start); |
| |
| location_t fmt_substring_loc; |
| const char *err = type_loc.get_location (&fmt_substring_loc); |
| if (err) |
| return NULL; |
| |
| source_range fmt_substring_range |
| = get_range_from_loc (line_table, fmt_substring_loc); |
| |
| expanded_location caret |
| = expand_location_to_spelling_point (fmt_substring_loc); |
| expanded_location start |
| = expand_location_to_spelling_point (fmt_substring_range.m_start); |
| expanded_location finish |
| = expand_location_to_spelling_point (fmt_substring_range.m_finish); |
| if (caret.file != start.file) |
| return NULL; |
| if (start.file != finish.file) |
| return NULL; |
| if (caret.line != start.line) |
| return NULL; |
| if (start.line != finish.line) |
| return NULL; |
| if (start.column > caret.column) |
| return NULL; |
| if (start.column > finish.column) |
| return NULL; |
| if (caret.column > finish.column) |
| return NULL; |
| |
| char_span line = location_get_source_line (start.file, start.line); |
| if (!line) |
| return NULL; |
| |
| /* If we got this far, then we have the line containing the |
| existing conversion specification. |
| |
| Generate a trimmed copy, containing the prefix part of the conversion |
| specification, up to the (but not including) the length modifier. |
| In the above example, this would be "%-+*.*". */ |
| int length_up_to_type = caret.column - start.column; |
| char_span prefix_span = line.subspan (start.column - 1, length_up_to_type); |
| char *prefix = prefix_span.xstrdup (); |
| |
| /* Now attempt to generate a suggestion for the rest of the specification |
| (length modifier and conversion char), based on ARG_TYPE and |
| CONVERSION_CHAR. |
| In the above example, this would be "ld". */ |
| char *format_for_type = get_format_for_type (fki, arg_type, conversion_char); |
| if (!format_for_type) |
| { |
| free (prefix); |
| return NULL; |
| } |
| |
| /* Success. Generate the resulting suggestion for the whole range of |
| FMT_LOC by concatenating the two strings. |
| In the above example, this would be "%-+*.*ld". */ |
| char *result = concat (prefix, format_for_type, NULL); |
| free (format_for_type); |
| free (prefix); |
| return result; |
| } |
| |
| /* Helper class for adding zero or more trailing '*' to types. |
| |
| The format type and name exclude any '*' for pointers, so those |
| must be formatted manually. For all the types we currently have, |
| this is adequate, but formats taking pointers to functions or |
| arrays would require the full type to be built up in order to |
| print it with %T. */ |
| |
| class indirection_suffix |
| { |
| public: |
| indirection_suffix (int pointer_count) : m_pointer_count (pointer_count) {} |
| |
| /* Determine the size of the buffer (including NUL-terminator). */ |
| |
| size_t get_buffer_size () const |
| { |
| return m_pointer_count + 2; |
| } |
| |
| /* Write the '*' to DST and add a NUL-terminator. */ |
| |
| void fill_buffer (char *dst) const |
| { |
| if (m_pointer_count == 0) |
| dst[0] = 0; |
| else if (c_dialect_cxx ()) |
| { |
| memset (dst, '*', m_pointer_count); |
| dst[m_pointer_count] = 0; |
| } |
| else |
| { |
| dst[0] = ' '; |
| memset (dst + 1, '*', m_pointer_count); |
| dst[m_pointer_count + 1] = 0; |
| } |
| } |
| |
| private: |
| int m_pointer_count; |
| }; |
| |
| /* Subclass of range_label for labelling the range in the format string |
| with the type in question, adding trailing '*' for pointer_count. */ |
| |
| class range_label_for_format_type_mismatch |
| : public range_label_for_type_mismatch |
| { |
| public: |
| range_label_for_format_type_mismatch (tree labelled_type, tree other_type, |
| int pointer_count) |
| : range_label_for_type_mismatch (labelled_type, other_type), |
| m_pointer_count (pointer_count) |
| { |
| } |
| |
| label_text get_text (unsigned range_idx) const FINAL OVERRIDE |
| { |
| label_text text = range_label_for_type_mismatch::get_text (range_idx); |
| if (text.m_buffer == NULL) |
| return text; |
| |
| indirection_suffix suffix (m_pointer_count); |
| char *p = (char *) alloca (suffix.get_buffer_size ()); |
| suffix.fill_buffer (p); |
| |
| char *result = concat (text.m_buffer, p, NULL); |
| text.maybe_free (); |
| return label_text::take (result); |
| } |
| |
| private: |
| int m_pointer_count; |
| }; |
| |
| /* Give a warning about a format argument of different type from that expected. |
| The range of the diagnostic is taken from WHOLE_FMT_LOC; the caret location |
| is based on the location of the char at TYPE->offset_loc. |
| PARAM_LOC is the location of the relevant argument, or UNKNOWN_LOCATION |
| if this is unavailable. |
| WANTED_TYPE is the type the argument should have, |
| possibly stripped of pointer dereferences. The description (such as "field |
| precision"), the placement in the format string, a possibly more |
| friendly name of WANTED_TYPE, and the number of pointer dereferences |
| are taken from TYPE. ARG_TYPE is the type of the actual argument, |
| or NULL if it is missing. |
| |
| OFFSET_TO_TYPE_START is the offset within the execution-charset encoded |
| format string to where type information begins for the conversion |
| (the length modifier and conversion specifier). |
| CONVERSION_CHAR is the user-provided conversion specifier. |
| |
| For example, given a type mismatch for argument 5 here: |
| |
| 00000000011111111112222222222333333333344444444445555555555| |
| 12345678901234567890123456789012345678901234567890123456789` column numbers |
| 0000000000111111111122| |
| 0123456789012345678901` offsets within STRING_CST |
| V~~~~~~~~ : range of WHOLE_FMT_LOC, from cols 23-31 |
| sprintf (d, "before %-+*.*lld after", int_expr, int_expr, long_expr); |
| ^ ^ ^~~~~~~~~ |
| | ` CONVERSION_CHAR: 'd' PARAM_LOC |
| type starts here |
| |
| OFFSET_TO_TYPE_START is 13, the offset to the "lld" within the |
| STRING_CST. */ |
| |
| static void |
| format_type_warning (const substring_loc &whole_fmt_loc, |
| location_t param_loc, |
| format_wanted_type *type, |
| tree wanted_type, tree arg_type, |
| const format_kind_info *fki, |
| int offset_to_type_start, |
| char conversion_char) |
| { |
| enum format_specifier_kind kind = type->kind; |
| const char *wanted_type_name = type->wanted_type_name; |
| const char *format_start = type->format_start; |
| int format_length = type->format_length; |
| int pointer_count = type->pointer_count; |
| int arg_num = type->arg_num; |
| |
| /* If ARG_TYPE is a typedef with a misleading name (for example, |
| size_t but not the standard size_t expected by printf %zu), avoid |
| printing the typedef name. */ |
| if (wanted_type_name |
| && arg_type |
| && TYPE_NAME (arg_type) |
| && TREE_CODE (TYPE_NAME (arg_type)) == TYPE_DECL |
| && DECL_NAME (TYPE_NAME (arg_type)) |
| && !strcmp (wanted_type_name, |
| lang_hooks.decl_printable_name (TYPE_NAME (arg_type), 2))) |
| arg_type = TYPE_MAIN_VARIANT (arg_type); |
| |
| indirection_suffix suffix (pointer_count); |
| char *p = (char *) alloca (suffix.get_buffer_size ()); |
| suffix.fill_buffer (p); |
| |
| /* WHOLE_FMT_LOC has the caret at the end of the range. |
| Set the caret to be at the offset from TYPE. Subtract one |
| from the offset for the same reason as in format_warning_at_char. */ |
| substring_loc fmt_loc (whole_fmt_loc); |
| fmt_loc.set_caret_index (type->offset_loc - 1); |
| |
| range_label_for_format_type_mismatch fmt_label (wanted_type, arg_type, |
| pointer_count); |
| range_label_for_type_mismatch param_label (arg_type, wanted_type); |
| |
| /* Get a string for use as a replacement fix-it hint for the range in |
| fmt_loc, or NULL. */ |
| char *corrected_substring |
| = get_corrected_substring (fmt_loc, type, arg_type, fki, |
| offset_to_type_start, conversion_char); |
| format_string_diagnostic_t diag (fmt_loc, &fmt_label, param_loc, ¶m_label, |
| corrected_substring); |
| if (wanted_type_name) |
| { |
| if (arg_type) |
| diag.emit_warning |
| (OPT_Wformat_, |
| "%s %<%s%.*s%> expects argument of type %<%s%s%>, " |
| "but argument %d has type %qT", |
| gettext (kind_descriptions[kind]), |
| (kind == CF_KIND_FORMAT ? "%" : ""), |
| format_length, format_start, |
| wanted_type_name, p, arg_num, arg_type); |
| else |
| diag.emit_warning |
| (OPT_Wformat_, |
| "%s %<%s%.*s%> expects a matching %<%s%s%> argument", |
| gettext (kind_descriptions[kind]), |
| (kind == CF_KIND_FORMAT ? "%" : ""), |
| format_length, format_start, wanted_type_name, p); |
| } |
| else |
| { |
| if (arg_type) |
| diag.emit_warning |
| (OPT_Wformat_, |
| "%s %<%s%.*s%> expects argument of type %<%T%s%>, " |
| "but argument %d has type %qT", |
| gettext (kind_descriptions[kind]), |
| (kind == CF_KIND_FORMAT ? "%" : ""), |
| format_length, format_start, |
| wanted_type, p, arg_num, arg_type); |
| else |
| diag.emit_warning |
| (OPT_Wformat_, |
| "%s %<%s%.*s%> expects a matching %<%T%s%> argument", |
| gettext (kind_descriptions[kind]), |
| (kind == CF_KIND_FORMAT ? "%" : ""), |
| format_length, format_start, wanted_type, p); |
| } |
| |
| free (corrected_substring); |
| } |
| |
| |
| /* Given a format_char_info array FCI, and a character C, this function |
| returns the index into the conversion_specs where that specifier's |
| data is located. The character must exist. */ |
| static unsigned int |
| find_char_info_specifier_index (const format_char_info *fci, int c) |
| { |
| unsigned i; |
| |
| for (i = 0; fci->format_chars; i++, fci++) |
| if (strchr (fci->format_chars, c)) |
| return i; |
| |
| /* We shouldn't be looking for a non-existent specifier. */ |
| gcc_unreachable (); |
| } |
| |
| /* Given a format_length_info array FLI, and a character C, this |
| function returns the index into the conversion_specs where that |
| modifier's data is located. The character must exist. */ |
| static unsigned int |
| find_length_info_modifier_index (const format_length_info *fli, int c) |
| { |
| unsigned i; |
| |
| for (i = 0; fli->name; i++, fli++) |
| if (strchr (fli->name, c)) |
| return i; |
| |
| /* We shouldn't be looking for a non-existent modifier. */ |
| gcc_unreachable (); |
| } |
| |
| /* Determine the type of HOST_WIDE_INT in the code being compiled for |
| use in GCC's __asm_fprintf__ custom format attribute. You must |
| have set dynamic_format_types before calling this function. */ |
| static void |
| init_dynamic_asm_fprintf_info (void) |
| { |
| static tree hwi; |
| |
| if (!hwi) |
| { |
| format_length_info *new_asm_fprintf_length_specs; |
| unsigned int i; |
| |
| /* Find the underlying type for HOST_WIDE_INT. For the %w |
| length modifier to work, one must have issued: "typedef |
| HOST_WIDE_INT __gcc_host_wide_int__;" in one's source code |
| prior to using that modifier. */ |
| hwi = maybe_get_identifier ("__gcc_host_wide_int__"); |
| if (!hwi) |
| { |
| error ("%<__gcc_host_wide_int__%> is not defined as a type"); |
| return; |
| } |
| hwi = identifier_global_value (hwi); |
| if (!hwi || TREE_CODE (hwi) != TYPE_DECL) |
| { |
| error ("%<__gcc_host_wide_int__%> is not defined as a type"); |
| return; |
| } |
| hwi = DECL_ORIGINAL_TYPE (hwi); |
| gcc_assert (hwi); |
| if (hwi != long_integer_type_node && hwi != long_long_integer_type_node) |
| { |
| error ("%<__gcc_host_wide_int__%> is not defined as %<long%>" |
| " or %<long long%>"); |
| return; |
| } |
| |
| /* Create a new (writable) copy of asm_fprintf_length_specs. */ |
| new_asm_fprintf_length_specs = (format_length_info *) |
| xmemdup (asm_fprintf_length_specs, |
| sizeof (asm_fprintf_length_specs), |
| sizeof (asm_fprintf_length_specs)); |
| |
| /* HOST_WIDE_INT must be one of 'long' or 'long long'. */ |
| i = find_length_info_modifier_index (new_asm_fprintf_length_specs, 'w'); |
| if (hwi == long_integer_type_node) |
| new_asm_fprintf_length_specs[i].index = FMT_LEN_l; |
| else if (hwi == long_long_integer_type_node) |
| new_asm_fprintf_length_specs[i].index = FMT_LEN_ll; |
| else |
| gcc_unreachable (); |
| |
| /* Assign the new data for use. */ |
| dynamic_format_types[asm_fprintf_format_type].length_char_specs = |
| new_asm_fprintf_length_specs; |
| } |
| } |
| |
| /* Determine the type of a "locus" in the code being compiled for use |
| in GCC's __gcc_gfc__ custom format attribute. You must have set |
| dynamic_format_types before calling this function. */ |
| static void |
| init_dynamic_gfc_info (void) |
| { |
| if (!locus) |
| { |
| static format_char_info *gfc_fci; |
| |
| /* For the GCC __gcc_gfc__ custom format specifier to work, one |
| must have declared 'locus' prior to using this attribute. If |
| we haven't seen this declarations then you shouldn't use the |
| specifier requiring that type. */ |
| if ((locus = maybe_get_identifier ("locus"))) |
| { |
| locus = identifier_global_value (locus); |
| if (locus) |
| { |
| if (TREE_CODE (locus) != TYPE_DECL |
| || TREE_TYPE (locus) == error_mark_node) |
| { |
| error ("%<locus%> is not defined as a type"); |
| locus = 0; |
| } |
| else |
| locus = TREE_TYPE (locus); |
| } |
| } |
| |
| /* Assign the new data for use. */ |
| |
| /* Handle the __gcc_gfc__ format specifics. */ |
| if (!gfc_fci) |
| dynamic_format_types[gcc_gfc_format_type].conversion_specs = |
| gfc_fci = (format_char_info *) |
| xmemdup (gcc_gfc_char_table, |
| sizeof (gcc_gfc_char_table), |
| sizeof (gcc_gfc_char_table)); |
| if (locus) |
| { |
| const unsigned i = find_char_info_specifier_index (gfc_fci, 'L'); |
| gfc_fci[i].types[0].type = &locus; |
| gfc_fci[i].pointer_count = 1; |
| } |
| } |
| } |
| |
| /* Lookup the type named NAME and return a NAME type if found. |
| Otherwise, return void_type_node if NAME has not been used yet, |
| or NULL_TREE if NAME is not a type (issuing an error). */ |
| |
| static tree |
| get_named_type (const char *name) |
| { |
| if (tree result = maybe_get_identifier (name)) |
| { |
| result = identifier_global_tag (result); |
| if (result) |
| { |
| if (TYPE_P (result)) |
| ; |
| else if (TREE_CODE (result) == TYPE_DECL) |
| result = TREE_TYPE (result); |
| else |
| { |
| error ("%qs is not defined as a type", name); |
| result = NULL_TREE; |
| } |
| } |
| return result; |
| } |
| else |
| return void_type_node; |
| } |
| |
| /* Determine the types of "tree" and "location_t" in the code being |
| compiled for use in GCC's diagnostic custom format attributes. You |
| must have set dynamic_format_types before calling this function. */ |
| static void |
| init_dynamic_diag_info (void) |
| { |
| /* For the GCC-diagnostics custom format specifiers to work, one |
| must have declared 'tree' and 'location_t' prior to using those |
| attributes. If we haven't seen these declarations then |
| the specifiers requiring these types shouldn't be used. |
| However we don't force a hard ICE because we may see only one |
| or the other type. */ |
| if (tree loc = maybe_get_identifier ("location_t")) |
| { |
| loc = identifier_global_value (loc); |
| if (loc && TREE_CODE (loc) != TYPE_DECL) |
| error ("%<location_t%> is not defined as a type"); |
| } |
| |
| /* Initialize the global tree node type local to this file. */ |
| if (!local_tree_type_node |
| || local_tree_type_node == void_type_node) |
| { |
| /* We need to grab the underlying 'union tree_node' so peek into |
| an extra type level. */ |
| if ((local_tree_type_node = maybe_get_identifier ("tree"))) |
| { |
| local_tree_type_node |
| = identifier_global_value (local_tree_type_node); |
| if (local_tree_type_node) |
| { |
| if (TREE_CODE (local_tree_type_node) != TYPE_DECL) |
| { |
| error ("%<tree%> is not defined as a type"); |
| local_tree_type_node = NULL_TREE; |
| } |
| else if (TREE_CODE (TREE_TYPE (local_tree_type_node)) |
| != POINTER_TYPE) |
| { |
| error ("%<tree%> is not defined as a pointer type"); |
| local_tree_type_node = NULL_TREE; |
| } |
| else |
| local_tree_type_node |
| = TREE_TYPE (TREE_TYPE (local_tree_type_node)); |
| } |
| } |
| else |
| local_tree_type_node = void_type_node; |
| } |
| |
| /* Similar to the above but for gimple*. */ |
| if (!local_gimple_ptr_node |
| || local_gimple_ptr_node == void_type_node) |
| local_gimple_ptr_node = get_named_type ("gimple"); |
| |
| /* Similar to the above but for cgraph_node*. */ |
| if (!local_cgraph_node_ptr_node |
| || local_cgraph_node_ptr_node == void_type_node) |
| local_cgraph_node_ptr_node = get_named_type ("cgraph_node"); |
| |
| /* Similar to the above but for diagnostic_event_id_t*. */ |
| if (!local_event_ptr_node |
| || local_event_ptr_node == void_type_node) |
| local_event_ptr_node = get_named_type ("diagnostic_event_id_t"); |
| |
| static tree hwi; |
| |
| if (!hwi) |
| { |
| static format_length_info *diag_ls; |
| unsigned int i; |
| |
| /* Find the underlying type for HOST_WIDE_INT. For the 'w' |
| length modifier to work, one must have issued: "typedef |
| HOST_WIDE_INT __gcc_host_wide_int__;" in one's source code |
| prior to using that modifier. */ |
| if ((hwi = maybe_get_identifier ("__gcc_host_wide_int__"))) |
| { |
| hwi = identifier_global_value (hwi); |
| if (hwi) |
| { |
| if (TREE_CODE (hwi) != TYPE_DECL) |
| { |
| error ("%<__gcc_host_wide_int__%> is not defined as a type"); |
| hwi = 0; |
| } |
| else |
| { |
| hwi = DECL_ORIGINAL_TYPE (hwi); |
| gcc_assert (hwi); |
| if (hwi != long_integer_type_node |
| && hwi != long_long_integer_type_node) |
| { |
| error ("%<__gcc_host_wide_int__%> is not defined" |
| " as %<long%> or %<long long%>"); |
| hwi = 0; |
| } |
| } |
| } |
| } |
| |
| /* Assign the new data for use. */ |
| |
| /* All the GCC diag formats use the same length specs. */ |
| if (!diag_ls) |
| dynamic_format_types[gcc_diag_format_type].length_char_specs = |
| dynamic_format_types[gcc_tdiag_format_type].length_char_specs = |
| dynamic_format_types[gcc_cdiag_format_type].length_char_specs = |
| dynamic_format_types[gcc_cxxdiag_format_type].length_char_specs = |
| dynamic_format_types[gcc_dump_printf_format_type].length_char_specs = |
| diag_ls = (format_length_info *) |
| xmemdup (gcc_diag_length_specs, |
| sizeof (gcc_diag_length_specs), |
| sizeof (gcc_diag_length_specs)); |
| if (hwi) |
| { |
| /* HOST_WIDE_INT must be one of 'long' or 'long long'. */ |
| i = find_length_info_modifier_index (diag_ls, 'w'); |
| if (hwi == long_integer_type_node) |
| diag_ls[i].index = FMT_LEN_l; |
| else if (hwi == long_long_integer_type_node) |
| diag_ls[i].index = FMT_LEN_ll; |
| else |
| gcc_unreachable (); |
| } |
| } |
| |
| /* It's safe to "re-initialize these to the same values. */ |
| dynamic_format_types[gcc_diag_format_type].conversion_specs = |
| gcc_diag_char_table; |
| dynamic_format_types[gcc_tdiag_format_type].conversion_specs = |
| gcc_tdiag_char_table; |
| dynamic_format_types[gcc_cdiag_format_type].conversion_specs = |
| gcc_cdiag_char_table; |
| dynamic_format_types[gcc_cxxdiag_format_type].conversion_specs = |
| gcc_cxxdiag_char_table; |
| dynamic_format_types[gcc_dump_printf_format_type].conversion_specs = |
| gcc_dump_printf_char_table; |
| } |
| |
| #ifdef TARGET_FORMAT_TYPES |
| extern const format_kind_info TARGET_FORMAT_TYPES[]; |
| #endif |
| |
| #ifdef TARGET_OVERRIDES_FORMAT_ATTRIBUTES |
| extern const target_ovr_attr TARGET_OVERRIDES_FORMAT_ATTRIBUTES[]; |
| #endif |
| #ifdef TARGET_OVERRIDES_FORMAT_INIT |
| extern void TARGET_OVERRIDES_FORMAT_INIT (void); |
| #endif |
| |
| /* Attributes such as "printf" are equivalent to those such as |
| "gnu_printf" unless this is overridden by a target. */ |
| static const target_ovr_attr gnu_target_overrides_format_attributes[] = |
| { |
| { "gnu_printf", "printf" }, |
| { "gnu_scanf", "scanf" }, |
| { "gnu_strftime", "strftime" }, |
| { "gnu_strfmon", "strfmon" }, |
| { NULL, NULL } |
| }; |
| |
| /* Translate to unified attribute name. This is used in decode_format_type and |
| decode_format_attr. In attr_name the user specified argument is passed. It |
| returns the unified format name from TARGET_OVERRIDES_FORMAT_ATTRIBUTES |
| or the attr_name passed to this function, if there is no matching entry. */ |
| static const char * |
| convert_format_name_to_system_name (const char *attr_name) |
| { |
| int i; |
| |
| if (attr_name == NULL || *attr_name == 0 |
| || strncmp (attr_name, "gcc_", 4) == 0) |
| return attr_name; |
| #ifdef TARGET_OVERRIDES_FORMAT_INIT |
| TARGET_OVERRIDES_FORMAT_INIT (); |
| #endif |
| |
| #ifdef TARGET_OVERRIDES_FORMAT_ATTRIBUTES |
| /* Check if format attribute is overridden by target. */ |
| if (TARGET_OVERRIDES_FORMAT_ATTRIBUTES != NULL |
| && TARGET_OVERRIDES_FORMAT_ATTRIBUTES_COUNT > 0) |
| { |
| for (i = 0; i < TARGET_OVERRIDES_FORMAT_ATTRIBUTES_COUNT; ++i) |
| { |
| if (cmp_attribs (TARGET_OVERRIDES_FORMAT_ATTRIBUTES[i].named_attr_src, |
| attr_name)) |
| return attr_name; |
| if (cmp_attribs (TARGET_OVERRIDES_FORMAT_ATTRIBUTES[i].named_attr_dst, |
| attr_name)) |
| return TARGET_OVERRIDES_FORMAT_ATTRIBUTES[i].named_attr_src; |
| } |
| } |
| #endif |
| /* Otherwise default to gnu format. */ |
| for (i = 0; |
| gnu_target_overrides_format_attributes[i].named_attr_src != NULL; |
| ++i) |
| { |
| if (cmp_attribs (gnu_target_overrides_format_attributes[i].named_attr_src, |
| attr_name)) |
| return attr_name; |
| if (cmp_attribs (gnu_target_overrides_format_attributes[i].named_attr_dst, |
| attr_name)) |
| return gnu_target_overrides_format_attributes[i].named_attr_src; |
| } |
| |
| return attr_name; |
| } |
| |
| /* Handle a "format" attribute; arguments as in |
| struct attribute_spec.handler. */ |
| tree |
| handle_format_attribute (tree *node, tree atname, tree args, |
| int flags, bool *no_add_attrs) |
| { |
| const_tree type = *node; |
| function_format_info info; |
| |
| #ifdef TARGET_FORMAT_TYPES |
| /* If the target provides additional format types, we need to |
| add them to FORMAT_TYPES at first use. */ |
| if (TARGET_FORMAT_TYPES != NULL && !dynamic_format_types) |
| { |
| dynamic_format_types = XNEWVEC (format_kind_info, |
| n_format_types + TARGET_N_FORMAT_TYPES); |
| memcpy (dynamic_format_types, format_types_orig, |
| sizeof (format_types_orig)); |
| memcpy (&dynamic_format_types[n_format_types], TARGET_FORMAT_TYPES, |
| TARGET_N_FORMAT_TYPES * sizeof (dynamic_format_types[0])); |
| |
| format_types = dynamic_format_types; |
| /* Provide a reference for the first potential external type. */ |
| first_target_format_type = n_format_types; |
| n_format_types += TARGET_N_FORMAT_TYPES; |
| } |
| #endif |
| |
| /* Canonicalize name of format function. */ |
| if (TREE_CODE (TREE_VALUE (args)) == IDENTIFIER_NODE) |
| TREE_VALUE (args) = canonicalize_attr_name (TREE_VALUE (args)); |
| |
| if (!decode_format_attr (type, atname, args, &info, /* validated_p = */false)) |
| { |
| *no_add_attrs = true; |
| return NULL_TREE; |
| } |
| |
| if (prototype_p (type)) |
| { |
| if (!check_format_string (type, info.format_num, flags, |
| no_add_attrs, info.format_type)) |
| return NULL_TREE; |
| |
| if (info.first_arg_num != 0) |
| { |
| unsigned HOST_WIDE_INT arg_num = 1; |
| function_args_iterator iter; |
| tree arg_type; |
| |
| /* Verify that first_arg_num points to the last arg, |
| the ... */ |
| FOREACH_FUNCTION_ARGS (type, arg_type, iter) |
| arg_num++; |
| |
| if (arg_num != info.first_arg_num) |
| { |
| if (!(flags & (int) ATTR_FLAG_BUILT_IN)) |
| error ("argument to be formatted is not %<...%>"); |
| *no_add_attrs = true; |
| return NULL_TREE; |
| } |
| } |
| } |
| |
| /* Check if this is a strftime variant. Just for this variant |
| FMT_FLAG_ARG_CONVERT is not set. */ |
| if ((format_types[info.format_type].flags & (int) FMT_FLAG_ARG_CONVERT) == 0 |
| && info.first_arg_num != 0) |
| { |
| error ("strftime formats cannot format arguments"); |
| *no_add_attrs = true; |
| return NULL_TREE; |
| } |
| |
| /* If this is a custom GCC-internal format type, we have to |
| initialize certain bits at runtime. */ |
| if (info.format_type == asm_fprintf_format_type |
| || info.format_type == gcc_gfc_format_type |
| || info.format_type == gcc_diag_format_type |
| || info.format_type == gcc_tdiag_format_type |
| || info.format_type == gcc_cdiag_format_type |
| || info.format_type == gcc_cxxdiag_format_type |
| || info.format_type == gcc_dump_printf_format_type) |
| { |
| /* Our first time through, we have to make sure that our |
| format_type data is allocated dynamically and is modifiable. */ |
| if (!dynamic_format_types) |
| format_types = dynamic_format_types = (format_kind_info *) |
| xmemdup (format_types_orig, sizeof (format_types_orig), |
| sizeof (format_types_orig)); |
| |
| /* If this is format __asm_fprintf__, we have to initialize |
| GCC's notion of HOST_WIDE_INT for checking %wd. */ |
| if (info.format_type == asm_fprintf_format_type) |
| init_dynamic_asm_fprintf_info (); |
| /* If this is format __gcc_gfc__, we have to initialize GCC's |
| notion of 'locus' at runtime for %L. */ |
| else if (info.format_type == gcc_gfc_format_type) |
| init_dynamic_gfc_info (); |
| /* If this is one of the diagnostic attributes, then we have to |
| initialize 'location_t' and 'tree' at runtime. */ |
| else if (info.format_type == gcc_diag_format_type |
| || info.format_type == gcc_tdiag_format_type |
| || info.format_type == gcc_cdiag_format_type |
| || info.format_type == gcc_cxxdiag_format_type |
| || info.format_type == gcc_dump_printf_format_type) |
| init_dynamic_diag_info (); |
| else |
| gcc_unreachable (); |
| } |
| |
| return NULL_TREE; |
| } |
| |
| #if CHECKING_P |
| |
| namespace selftest { |
| |
| /* Selftests of location handling. */ |
| |
| /* Get the format_kind_info with the given name. */ |
| |
| static const format_kind_info * |
| get_info (const char *name) |
| { |
| int idx = decode_format_type (name); |
| const format_kind_info *fki = &format_types[idx]; |
| ASSERT_STREQ (fki->name, name); |
| return fki; |
| } |
| |
| /* Verify that get_format_for_type (FKI, TYPE, CONVERSION_CHAR) |
| is EXPECTED_FORMAT. */ |
| |
| static void |
| assert_format_for_type_streq (const location &loc, const format_kind_info *fki, |
| const char *expected_format, tree type, |
| char conversion_char) |
| { |
| gcc_assert (fki); |
| gcc_assert (expected_format); |
| gcc_assert (type); |
| |
| char *actual_format = get_format_for_type (fki, type, conversion_char); |
| ASSERT_STREQ_AT (loc, expected_format, actual_format); |
| free (actual_format); |
| } |
| |
| /* Selftests for get_format_for_type. */ |
| |
| #define ASSERT_FORMAT_FOR_TYPE_STREQ(EXPECTED_FORMAT, TYPE, CONVERSION_CHAR) \ |
| assert_format_for_type_streq (SELFTEST_LOCATION, (fki), (EXPECTED_FORMAT), \ |
| (TYPE), (CONVERSION_CHAR)) |
| |
| /* Selftest for get_format_for_type for "printf"-style functions. */ |
| |
| static void |
| test_get_format_for_type_printf () |
| { |
| const format_kind_info *fki = get_info ("gnu_printf"); |
| ASSERT_NE (fki, NULL); |
| |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("f", double_type_node, 'i'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("Lf", long_double_type_node, 'i'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("f", double_type_node, 'o'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("Lf", long_double_type_node, 'o'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("f", double_type_node, 'x'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("Lf", long_double_type_node, 'x'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("f", double_type_node, 'X'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("Lf", long_double_type_node, 'X'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("d", integer_type_node, 'd'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("i", integer_type_node, 'i'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("o", integer_type_node, 'o'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("x", integer_type_node, 'x'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("X", integer_type_node, 'X'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("d", unsigned_type_node, 'd'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("i", unsigned_type_node, 'i'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("o", unsigned_type_node, 'o'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("x", unsigned_type_node, 'x'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("X", unsigned_type_node, 'X'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("ld", long_integer_type_node, 'd'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("li", long_integer_type_node, 'i'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("lx", long_integer_type_node, 'x'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("lo", long_unsigned_type_node, 'o'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("lx", long_unsigned_type_node, 'x'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("lld", long_long_integer_type_node, 'd'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("lli", long_long_integer_type_node, 'i'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("llo", long_long_unsigned_type_node, 'o'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("llx", long_long_unsigned_type_node, 'x'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("s", build_pointer_type (char_type_node), 'i'); |
| } |
| |
| /* Selftest for get_format_for_type for "scanf"-style functions. */ |
| |
| static void |
| test_get_format_for_type_scanf () |
| { |
| const format_kind_info *fki = get_info ("gnu_scanf"); |
| ASSERT_NE (fki, NULL); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("d", build_pointer_type (integer_type_node), 'd'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("u", build_pointer_type (unsigned_type_node), 'u'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("ld", |
| build_pointer_type (long_integer_type_node), 'd'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("lu", |
| build_pointer_type (long_unsigned_type_node), 'u'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ |
| ("lld", build_pointer_type (long_long_integer_type_node), 'd'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ |
| ("llu", build_pointer_type (long_long_unsigned_type_node), 'u'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("e", build_pointer_type (float_type_node), 'e'); |
| ASSERT_FORMAT_FOR_TYPE_STREQ ("le", build_pointer_type (double_type_node), 'e'); |
| } |
| |
| #undef ASSERT_FORMAT_FOR_TYPE_STREQ |
| |
| /* Exercise the type-printing label code, to give some coverage |
| under "make selftest-valgrind" (in particular, to ensure that |
| the label-printing machinery doesn't leak). */ |
| |
| static void |
| test_type_mismatch_range_labels () |
| { |
| /* Create a tempfile and write some text to it. |
| ....................0000000001 11111111 12 22222222 |
| ....................1234567890 12345678 90 12345678. */ |
| const char *content = " printf (\"msg: %i\\n\", msg);\n"; |
| temp_source_file tmp (SELFTEST_LOCATION, ".c", content); |
| line_table_test ltt; |
| |
| linemap_add (line_table, LC_ENTER, false, tmp.get_filename (), 1); |
| |
| location_t c17 = linemap_position_for_column (line_table, 17); |
| ASSERT_EQ (LOCATION_COLUMN (c17), 17); |
| location_t c18 = linemap_position_for_column (line_table, 18); |
| location_t c24 = linemap_position_for_column (line_table, 24); |
| location_t c26 = linemap_position_for_column (line_table, 26); |
| |
| /* Don't attempt to run the tests if column data might be unavailable. */ |
| if (c26 > LINE_MAP_MAX_LOCATION_WITH_COLS) |
| return; |
| |
| location_t fmt = make_location (c18, c17, c18); |
| ASSERT_EQ (LOCATION_COLUMN (fmt), 18); |
| |
| location_t param = make_location (c24, c24, c26); |
| ASSERT_EQ (LOCATION_COLUMN (param), 24); |
| |
| range_label_for_format_type_mismatch fmt_label (char_type_node, |
| integer_type_node, 1); |
| range_label_for_type_mismatch param_label (integer_type_node, |
| char_type_node); |
| gcc_rich_location richloc (fmt, &fmt_label); |
| richloc.add_range (param, SHOW_RANGE_WITHOUT_CARET, ¶m_label); |
| |
| test_diagnostic_context dc; |
| diagnostic_show_locus (&dc, &richloc, DK_ERROR); |
| if (c_dialect_cxx ()) |
| /* "char*", without a space. */ |
| ASSERT_STREQ (" printf (\"msg: %i\\n\", msg);\n" |
| " ~^ ~~~\n" |
| " | |\n" |
| " char* int\n", |
| pp_formatted_text (dc.printer)); |
| else |
| /* "char *", with a space. */ |
| ASSERT_STREQ (" printf (\"msg: %i\\n\", msg);\n" |
| " ~^ ~~~\n" |
| " | |\n" |
| " | int\n" |
| " char *\n", |
| pp_formatted_text (dc.printer)); |
| } |
| |
| /* Run all of the selftests within this file. */ |
| |
| void |
| c_format_c_tests () |
| { |
| test_get_modifier_for_format_len (); |
| test_get_format_for_type_printf (); |
| test_get_format_for_type_scanf (); |
| test_type_mismatch_range_labels (); |
| } |
| |
| } // namespace selftest |
| |
| #endif /* CHECKING_P */ |
| |
| #include "gt-c-family-c-format.h" |