/* Check calls to formatted I/O functions (-Wformat).
   Copyright (C) 1992-2024 Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */

#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "tm.h"
#include "c-target.h"
#include "c-common.h"
#include "alloc-pool.h"
#include "stringpool.h"
#include "c-objc.h"
#include "intl.h"
#include "langhooks.h"
#include "c-format.h"
#include "diagnostic.h"
#include "substring-locations.h"
#include "selftest.h"
#include "selftest-diagnostic.h"
#include "builtins.h"
#include "attribs.h"
#include "c-family/c-type-mismatch.h"
#include "tree-pretty-print-markup.h"

/* Handle attributes associated with format checking.  */

/* The enumerators below must stay in the same order as format_types,
   with the exception of format_type_error.  Target-specific format
   types have no matching enumerator.  */
enum format_type { printf_format_type, asm_fprintf_format_type,
                   gcc_diag_format_type, gcc_tdiag_format_type,
                   gcc_cdiag_format_type,
                   gcc_cxxdiag_format_type, gcc_gfc_format_type,
                   gcc_dump_printf_format_type,
                   gcc_objc_string_format_type,
                   format_type_error = -1};

/* The decoded operands of a "format" attribute.  */
struct function_format_info
{
  enum format_type format_type; /* type of format (printf, scanf, etc.) */
  /* IS_RAW only matters for GCC diagnostic format functions.  It is set
     for "raw" formatting functions such as pp_printf, which are not
     meant to produce complete diagnostics according to GCC guidelines,
     and clear for functions such as error and warning, whose format
     string is checked for proper quoting and spelling.  */
  bool is_raw;
  unsigned HOST_WIDE_INT format_num; /* number of format argument */
  unsigned HOST_WIDE_INT first_arg_num; /* number of first arg (zero for varargs) */
};

/* Initialized in init_dynamic_diag_info.  */
static GTY(()) tree local_tree_type_node;
static GTY(()) tree local_event_ptr_node;
static GTY(()) tree local_pp_element_ptr_node;
static GTY(()) tree local_gimple_ptr_node;
static GTY(()) tree local_cgraph_node_ptr_node;
static GTY(()) tree locus;

static bool decode_format_attr (const_tree, tree, tree, function_format_info *,
                                bool);
static format_type decode_format_type (const char *, bool * = NULL);

static bool check_format_string (const_tree argument,
                                 unsigned HOST_WIDE_INT format_num,
                                 int flags, bool *no_add_attrs,
                                 int expected_format_type);
static bool validate_constant (const_tree fn, const_tree atname, tree &expr,
                               int argno, unsigned HOST_WIDE_INT *value,
                               int flags, bool validated_p);
static const char *convert_format_name_to_system_name (const char *attr_name);

static int first_target_format_type;
static const char *format_name (int format_num);
static int format_flags (int format_num);

/* Issue a warning in the manner of format_warning_va, locating it at
   the single character at offset (CHAR_IDX - 1) of the string constant
   FORMAT_STRING_CST, which lives at FMT_STRING_LOC.  Returns whatever
   emit_warning_va reports.  */

ATTRIBUTE_GCC_DIAG (5,6)
static bool
format_warning_at_char (location_t fmt_string_loc, tree format_string_cst,
                        int char_idx, int opt, const char *gmsgid, ...)
{
  /* Callers pass "format_chars - orig_format_chars" after format_chars
     has already been advanced, so CHAR_IDX is one character beyond the
     place the warning belongs.  Step back by one.  */
  const int idx = char_idx - 1;

  tree cst_type = TREE_TYPE (format_string_cst);
  substring_loc where (fmt_string_loc, cst_type, idx, idx, idx);
  format_string_diagnostic_t diag (where, NULL, UNKNOWN_LOCATION, NULL,
                                   NULL);

  va_list args;
  va_start (args, gmsgid);
  const bool emitted = diag.emit_warning_va (opt, gmsgid, &args);
  va_end (args);

  return emitted;
}

/* Issue a warning in the manner of format_warning_va, locating it at
   the substring running from offset POS1 to offset (POS2 - 1) of the
   string constant FORMAT_STRING_CST, which lives at FMT_STRING_LOC.
   Returns whatever emit_warning_va reports.  */

ATTRIBUTE_GCC_DIAG (6,7)
static bool
format_warning_substr (location_t fmt_string_loc, tree format_string_cst,
                       int pos1, int pos2, int opt,
                       const char *gmsgid, ...)
{
  /* The location ends on the character just before POS2.  */
  const int last = pos2 - 1;

  tree cst_type = TREE_TYPE (format_string_cst);
  substring_loc where (fmt_string_loc, cst_type, pos1, pos1, last);
  format_string_diagnostic_t diag (where, NULL, UNKNOWN_LOCATION, NULL,
                                   NULL);

  va_list args;
  va_start (args, gmsgid);
  const bool emitted = diag.emit_warning_va (opt, gmsgid, &args);
  va_end (args);

  return emitted;
}

/* Check that we have a pointer to a string suitable for use as a format.
   The default is to check for a char type.
   For objective-c dialects, this is extended to include references to string
   objects validated by objc_string_ref_type_p ().
   Targets may also provide a string object type that can be used within c and
   c++ and shared with their respective objective-c dialects.  In this case the
   reference to a format string is checked for validity via a hook.

   The function returns true if strref points to any string type valid for the
   language dialect and target.
*/

bool
valid_format_string_type_p (tree strref)
{
  /* Anything that is not a pointer type is rejected outright.  */
  if (strref == NULL || TREE_CODE (strref) != POINTER_TYPE)
    return false;

  /* Plain character pointers are always acceptable.  */
  if (TYPE_MAIN_VARIANT (TREE_TYPE (strref)) == char_type_node)
    return true;

  /* Otherwise ask the Objective-C front end, and then the target.  */
  if (objc_string_ref_type_p (strref))
    return true;

  return (*targetcm.string_object_ref_type_p) ((const_tree) strref);
}

/* Handler for the "format_arg" attribute; the arguments are those of
   struct attribute_spec.handler.  Always returns NULL_TREE; on any
   validation failure *NO_ADD_ATTRS is set.  */
tree
handle_format_arg_attribute (tree *node, tree atname,
                             tree args, int flags, bool *no_add_attrs)
{
  tree fntype = *node;
  unsigned HOST_WIDE_INT format_num = 0;

  /* validate_constant takes the operand by reference and changes it in
     place, so bind directly to the TREE_VALUE slot of ARGS.  */
  tree &format_num_expr = TREE_VALUE (args);
  if (!validate_constant (fntype, atname, format_num_expr, 0, &format_num,
                          0, false))
    {
      *no_add_attrs = true;
      return NULL_TREE;
    }

  /* With a prototype the named parameter can be inspected.  Any string
     reference valid for the language and target is accepted here; we
     cannot be more specific, hence the -1.  */
  if (prototype_p (fntype)
      && !check_format_string (fntype, format_num, flags, no_add_attrs, -1))
    return NULL_TREE;

  /* The function itself must also return a string type.  */
  if (valid_format_string_type_p (TREE_TYPE (fntype)))
    return NULL_TREE;

  if (!(flags & (int) ATTR_FLAG_BUILT_IN))
    error ("function does not return string type");
  *no_add_attrs = true;
  return NULL_TREE;
}

/* Verify that the FORMAT_NUM argument is actually a string reference
   suitable for the language dialect and target (in case the format
   attribute is in error).  When we know the specific reference type
   expected, this is also checked.
*/ static bool check_format_string (const_tree fntype, unsigned HOST_WIDE_INT format_num, int flags, bool *no_add_attrs, int expected_format_type) { unsigned HOST_WIDE_INT i; bool is_objc_sref, is_target_sref, is_char_ref; tree ref; int fmt_flags; function_args_iterator iter; i = 1; FOREACH_FUNCTION_ARGS (fntype, ref, iter) { if (i == format_num) break; i++; } if (!ref || !valid_format_string_type_p (ref)) { if (!(flags & (int) ATTR_FLAG_BUILT_IN)) error ("format string argument is not a string type"); *no_add_attrs = true; return false; } /* We only know that we want a suitable string reference. */ if (expected_format_type < 0) return true; /* Now check that the arg matches the expected type. */ is_char_ref = (TYPE_MAIN_VARIANT (TREE_TYPE (ref)) == char_type_node); fmt_flags = format_flags (expected_format_type); is_objc_sref = is_target_sref = false; if (!is_char_ref) is_objc_sref = objc_string_ref_type_p (ref); if (!(fmt_flags & FMT_FLAG_PARSE_ARG_CONVERT_EXTERNAL)) { if (is_char_ref) return true; /* OK, we expected a char and found one. */ else { /* We expected a char but found an extended string type. */ if (is_objc_sref) error ("found a %qs reference but the format argument should" " be a string", format_name (gcc_objc_string_format_type)); else error ("found a %qT but the format argument should be a string", ref); *no_add_attrs = true; return false; } } /* We expect a string object type as the format arg. */ if (is_char_ref) { error ("format argument should be a %qs reference but" " a string was found", format_name (expected_format_type)); *no_add_attrs = true; return false; } /* We will assert that objective-c will support either its own string type or the target-supplied variant. */ if (!is_objc_sref) is_target_sref = (*targetcm.string_object_ref_type_p) ((const_tree) ref); if (expected_format_type == (int) gcc_objc_string_format_type && (is_objc_sref || is_target_sref)) return true; /* We will allow a target string ref to match only itself. 
*/ if (first_target_format_type && expected_format_type >= first_target_format_type && is_target_sref) return true; else { error ("format argument should be a %qs reference", format_name (expected_format_type)); *no_add_attrs = true; return false; } } /* Under the control of FLAGS, verify EXPR is a valid constant that refers to a positional argument ARGNO having a string type (char* or, for targets like Darwin, a pointer to struct CFString) to a function FN declared with attribute ATNAME. If valid, store the constant's integer value in *VALUE and return true. If VALIDATED_P is true assert the validation is successful. N.B. This function modifies EXPR. */ static bool validate_constant (const_tree fn, const_tree atname, tree &expr, int argno, unsigned HOST_WIDE_INT *value, int flags, bool validated_p) { /* Require the referenced argument to have a string type. For targets like Darwin, also accept pointers to struct CFString. */ if (tree val = positional_argument (fn, atname, expr, STRING_CST, argno, flags)) { *value = TREE_INT_CST_LOW (val); return true; } gcc_assert (!validated_p); return false; } /* Decode the arguments to a "format" attribute into a function_format_info structure. It is already known that the list is of the right length. If VALIDATED_P is true, then these attributes have already been validated and must not be erroneous; if false, it will give an error message. FN is either a function declaration or function type. Returns true if the attributes are successfully decoded, false otherwise. */ static bool decode_format_attr (const_tree fn, tree atname, tree args, function_format_info *info, bool validated_p) { tree format_type_id = TREE_VALUE (args); /* Note that TREE_VALUE (args) is changed in place below. Ditto for the value of the next element on the list. 
*/ tree *format_num_expr = &TREE_VALUE (TREE_CHAIN (args)); tree *first_arg_num_expr = &TREE_VALUE (TREE_CHAIN (TREE_CHAIN (args))); if (TREE_CODE (format_type_id) != IDENTIFIER_NODE) { gcc_assert (!validated_p); error ("unrecognized format specifier"); return false; } else { const char *p = IDENTIFIER_POINTER (format_type_id); info->format_type = decode_format_type (p, &info->is_raw); if (!c_dialect_objc () && info->format_type == gcc_objc_string_format_type) { gcc_assert (!validated_p); warning (OPT_Wformat_, "%qE is only allowed in Objective-C dialects", format_type_id); info->format_type = format_type_error; return false; } if (info->format_type == format_type_error) { gcc_assert (!validated_p); warning (OPT_Wformat_, "%qE is an unrecognized format function type", format_type_id); return false; } } if (!validate_constant (fn, atname, *format_num_expr, 2, &info->format_num, 0, validated_p)) return false; if (!validate_constant (fn, atname, *first_arg_num_expr, 3, &info->first_arg_num, (POSARG_ZERO | POSARG_ELLIPSIS), validated_p)) return false; if (info->first_arg_num != 0 && info->first_arg_num <= info->format_num) { gcc_assert (!validated_p); error ("format string argument follows the arguments to be formatted"); return false; } return true; } /* Check a call to a format function against a parameter list. */ /* The C standard version C++ is treated as equivalent to or inheriting from, for the purpose of format features supported. */ #define CPLUSPLUS_STD_VER (cxx_dialect < cxx11 ? STD_C94 : STD_C99) /* The C standard version we are checking formats against when pedantic. */ #define C_STD_VER ((int) (c_dialect_cxx () \ ? CPLUSPLUS_STD_VER \ : (flag_isoc23 \ ? STD_C23 \ : (flag_isoc99 \ ? STD_C99 \ : (flag_isoc94 ? STD_C94 : STD_C89))))) /* The name to give to the standard version we are warning about when pedantic. FEATURE_VER is the version in which the feature warned out appeared, which is higher than C_STD_VER. 
*/
#define C_STD_NAME(FEATURE_VER) (c_dialect_cxx ()               \
                                 ? (cxx_dialect < cxx11 ? "ISO C++98" \
                                    : "ISO C++11")              \
                                 : ((FEATURE_VER) == STD_EXT    \
                                    ? "ISO C"                   \
                                    : ((FEATURE_VER) == STD_C23 \
                                       ? "ISO C17"              \
                                       : "ISO C90")))
/* Adjust a C standard version, which may be STD_C9L, to account for
   -Wno-long-long.  Returns other standard versions unchanged.  */
#define ADJ_STD(VER)            ((int) ((VER) == STD_C9L                      \
                                       ? (warn_long_long ? STD_C99 : STD_C89) \
                                       : (VER)))

/* Enum describing the kind of specifiers present in the format and
   requiring an argument.  */
enum format_specifier_kind {
  CF_KIND_FORMAT,
  CF_KIND_FIELD_WIDTH,
  CF_KIND_FIELD_PRECISION
};

/* Translatable descriptions, listed in the same order as the
   enumerators of format_specifier_kind.
   NOTE(review): presumably indexed by that enum -- confirm at the use
   sites, which are outside this part of the file.  */
static const char *kind_descriptions[] = {
  N_("format"),
  N_("field width specifier"),
  N_("field precision specifier")
};

/* Structure describing details of a type expected in format checking,
   and the type to check against it.  */
struct format_wanted_type
{
  /* The type wanted.  */
  tree wanted_type;
  /* The name of this type to use in diagnostics.  */
  const char *wanted_type_name;
  /* Should be type checked just for scalar width identity.  */
  int scalar_identity_flag;
  /* The level of indirection through pointers at which this type occurs.  */
  int pointer_count;
  /* Whether, when pointer_count is 1, to allow any character type when
     pedantic, rather than just the character or void type specified.  */
  int char_lenient_flag;
  /* Whether the argument, dereferenced once, is written into and so the
     argument must not be a pointer to a const-qualified type.  */
  int writing_in_flag;
  /* Whether the argument, dereferenced once, is read from and so
     must not be a NULL pointer.  */
  int reading_from_flag;
  /* The kind of specifier that this type is used for.  */
  enum format_specifier_kind kind;
  /* The starting character of the specifier.  This never includes the
     initial percent sign.  */
  const char *format_start;
  /* The length of the specifier.  */
  int format_length;
  /* The actual parameter to check against the wanted type.  */
  tree param;
  /* The argument number of that parameter.  */
  int arg_num;
  /* The offset location of this argument with respect to the format
     string location.  */
  unsigned int offset_loc;
  /* The next type to check for this format conversion, or NULL if none.  */
  struct format_wanted_type *next;
};

/* Convenience macro for format_length_info meaning unused.  It expands
   to three initializers: a null name, FMT_LEN_none and STD_C89.  */
#define NO_FMT NULL, FMT_LEN_none, STD_C89

/* Length specifiers valid for printf.  Each entry names a modifier
   and, where one exists, its doubled form ("hh", "ll", "DD"), each
   with its FMT_LEN_* code and the STD_* version it is tagged with;
   NO_FMT fills the slot when there is no doubled form.  The list is
   terminated by an entry made only of NO_FMT.  */
static const format_length_info printf_length_specs[] =
{
  { "h", FMT_LEN_h, STD_C89, "hh", FMT_LEN_hh, STD_C99, 0 },
  { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C9L, 0 },
  { "q", FMT_LEN_ll, STD_EXT, NO_FMT, 0 },
  { "L", FMT_LEN_L, STD_C89, NO_FMT, 0 },
  { "z", FMT_LEN_z, STD_C99, NO_FMT, 0 },
  { "Z", FMT_LEN_z, STD_EXT, NO_FMT, 0 },
  { "t", FMT_LEN_t, STD_C99, NO_FMT, 0 },
  { "j", FMT_LEN_j, STD_C99, NO_FMT, 0 },
  { "H", FMT_LEN_H, STD_C23, NO_FMT, 0 },
  { "D", FMT_LEN_D, STD_C23, "DD", FMT_LEN_DD, STD_C23, 0 },
  { "w8", FMT_LEN_w8, STD_C23, NO_FMT, 0 },
  { "w16", FMT_LEN_w16, STD_C23, NO_FMT, 0 },
  { "w32", FMT_LEN_w32, STD_C23, NO_FMT, 0 },
  { "w64", FMT_LEN_w64, STD_C23, NO_FMT, 0 },
  { "wf8", FMT_LEN_wf8, STD_C23, NO_FMT, 0 },
  { "wf16", FMT_LEN_wf16, STD_C23, NO_FMT, 0 },
  { "wf32", FMT_LEN_wf32, STD_C23, NO_FMT, 0 },
  { "wf64", FMT_LEN_wf64, STD_C23, NO_FMT, 0 },
  { NO_FMT, NO_FMT, 0 }
};

/* Length specifiers valid for asm_fprintf.  */
static const format_length_info asm_fprintf_length_specs[] =
{
  { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C89, 0 },
  { "w", FMT_LEN_w, STD_C89, NO_FMT, 0 },
  { NO_FMT, NO_FMT, 0 }
};

/* Length specifiers valid for GCC diagnostics.  */
static const format_length_info gcc_diag_length_specs[] =
{
  { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C89, 0 },
  { "w", FMT_LEN_w, STD_C89, NO_FMT, 0 },
  { "z", FMT_LEN_z, STD_C99, NO_FMT, 0 },
  { "t", FMT_LEN_t, STD_C99, NO_FMT, 0 },
  { NO_FMT, NO_FMT, 0 }
};

/* The custom diagnostics all accept the same length specifiers.
*/
#define gcc_tdiag_length_specs gcc_diag_length_specs
#define gcc_cdiag_length_specs gcc_diag_length_specs
#define gcc_cxxdiag_length_specs gcc_diag_length_specs
#define gcc_dump_printf_length_specs gcc_diag_length_specs

/* This differs from printf_length_specs only in that "Z" is not
   accepted.  */
static const format_length_info scanf_length_specs[] =
{
  { "h", FMT_LEN_h, STD_C89, "hh", FMT_LEN_hh, STD_C99, 0 },
  { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C9L, 0 },
  { "q", FMT_LEN_ll, STD_EXT, NO_FMT, 0 },
  { "L", FMT_LEN_L, STD_C89, NO_FMT, 0 },
  { "z", FMT_LEN_z, STD_C99, NO_FMT, 0 },
  { "t", FMT_LEN_t, STD_C99, NO_FMT, 0 },
  { "j", FMT_LEN_j, STD_C99, NO_FMT, 0 },
  { "H", FMT_LEN_H, STD_C23, NO_FMT, 0 },
  { "D", FMT_LEN_D, STD_C23, "DD", FMT_LEN_DD, STD_C23, 0 },
  { "w8", FMT_LEN_w8, STD_C23, NO_FMT, 0 },
  { "w16", FMT_LEN_w16, STD_C23, NO_FMT, 0 },
  { "w32", FMT_LEN_w32, STD_C23, NO_FMT, 0 },
  { "w64", FMT_LEN_w64, STD_C23, NO_FMT, 0 },
  { "wf8", FMT_LEN_wf8, STD_C23, NO_FMT, 0 },
  { "wf16", FMT_LEN_wf16, STD_C23, NO_FMT, 0 },
  { "wf32", FMT_LEN_wf32, STD_C23, NO_FMT, 0 },
  { "wf64", FMT_LEN_wf64, STD_C23, NO_FMT, 0 },
  { NO_FMT, NO_FMT, 0 }
};

/* All tables for strfmon use STD_C89 everywhere, since -pedantic warnings
   make no sense for a format type not part of any C standard version.  */
static const format_length_info strfmon_length_specs[] =
{
  /* A GNU extension.  */
  { "L", FMT_LEN_L, STD_C89, NO_FMT, 0 },
  { NO_FMT, NO_FMT, 0 }
};

/* Length modifiers used by the fortran/error.cc routines.
*/
static const format_length_info gcc_gfc_length_specs[] =
{
  { "l", FMT_LEN_l, STD_C89, "ll", FMT_LEN_ll, STD_C89, 0 },
  { "w", FMT_LEN_w, STD_C89, NO_FMT, 0 },
  { NO_FMT, NO_FMT, 0 }
};

/* Flag entries for printf formats.  Besides the literal flag
   characters, the pseudo-flags 'w', 'p' and 'L' stand for the field
   width, the precision and the length modifier, as their descriptions
   say.  The list ends with an all-zero entry.  */
static const format_flag_spec printf_flag_specs[] =
{
  { ' ',  0, 0, 0, N_("' ' flag"),        N_("the ' ' printf flag"),              STD_C89 },
  { '+',  0, 0, 0, N_("'+' flag"),        N_("the '+' printf flag"),              STD_C89 },
  { '#',  0, 0, 0, N_("'#' flag"),        N_("the '#' printf flag"),              STD_C89 },
  { '0',  0, 0, 0, N_("'0' flag"),        N_("the '0' printf flag"),              STD_C89 },
  { '-',  0, 0, 0, N_("'-' flag"),        N_("the '-' printf flag"),              STD_C89 },
  { '\'', 0, 0, 0, N_("''' flag"),        N_("the ''' printf flag"),              STD_EXT },
  { 'I',  0, 0, 0, N_("'I' flag"),        N_("the 'I' printf flag"),              STD_EXT },
  { 'w',  0, 0, 0, N_("field width"),     N_("field width in printf format"),     STD_C89 },
  { 'p',  0, 0, 0, N_("precision"),       N_("precision in printf format"),       STD_C89 },
  { 'L',  0, 0, 0, N_("length modifier"), N_("length modifier in printf format"), STD_C89 },
  { 0, 0, 0, 0, NULL, NULL, STD_C89 }
};

/* Pairs of printf flag characters, ending with an all-zero entry.
   NOTE(review): the meaning of the third and fourth members is given
   by format_flag_pair in c-format.h -- confirm there.  */
static const format_flag_pair printf_flag_pairs[] =
{
  { ' ', '+', 1, 0   },
  { '0', '-', 1, 0   },
  { '0', 'p', 1, 'i' },
  { 0, 0, 0, 0 }
};

/* Flag entries for asm_fprintf formats; the same as the printf list
   above minus the ''' and 'I' entries.  */
static const format_flag_spec asm_fprintf_flag_specs[] =
{
  { ' ',  0, 0, 0, N_("' ' flag"),        N_("the ' ' printf flag"),              STD_C89 },
  { '+',  0, 0, 0, N_("'+' flag"),        N_("the '+' printf flag"),              STD_C89 },
  { '#',  0, 0, 0, N_("'#' flag"),        N_("the '#' printf flag"),              STD_C89 },
  { '0',  0, 0, 0, N_("'0' flag"),        N_("the '0' printf flag"),              STD_C89 },
  { '-',  0, 0, 0, N_("'-' flag"),        N_("the '-' printf flag"),              STD_C89 },
  { 'w',  0, 0, 0, N_("field width"),     N_("field width in printf format"),     STD_C89 },
  { 'p',  0, 0, 0, N_("precision"),       N_("precision in printf format"),       STD_C89 },
  { 'L',  0, 0, 0, N_("length modifier"), N_("length modifier in printf format"), STD_C89 },
  { 0, 0, 0, 0, NULL, NULL, STD_C89 }
};

/* Flag pairs for asm_fprintf; identical in content to
   printf_flag_pairs.  */
static const format_flag_pair asm_fprintf_flag_pairs[] =
{
  { ' ', '+', 1, 0   },
  { '0', '-', 1, 0   },
  { '0', 'p', 1, 'i' },
  { 0, 0, 0, 0 }
};

/* The GCC diagnostic formats list no flag pairs: the table holds only
   the terminating entry, and the other GCC-internal formats alias it.  */
static const format_flag_pair gcc_diag_flag_pairs[] =
{
  { 0, 0, 0, 0 }
};

#define gcc_tdiag_flag_pairs gcc_diag_flag_pairs
#define gcc_cdiag_flag_pairs gcc_diag_flag_pairs
#define gcc_cxxdiag_flag_pairs gcc_diag_flag_pairs
#define gcc_gfc_flag_pairs gcc_diag_flag_pairs
#define gcc_dump_printf_flag_pairs gcc_diag_flag_pairs

/* Flag entries for the GCC diagnostic formats; the other GCC-internal
   formats alias this table through the macros that follow it.  */
static const format_flag_spec gcc_diag_flag_specs[] =
{
  { '+',  0, 0, 0, N_("'+' flag"),        N_("the '+' printf flag"),              STD_C89 },
  { '#',  0, 0, 0, N_("'#' flag"),        N_("the '#' printf flag"),              STD_C89 },
  { 'q',  0, 0, 1, N_("'q' flag"),        N_("the 'q' diagnostic flag"),          STD_C89 },
  { 'p',  0, 0, 0, N_("precision"),       N_("precision in printf format"),       STD_C89 },
  { 'L',  0, 0, 0, N_("length modifier"), N_("length modifier in printf format"), STD_C89 },
  { 0, 0, 0, 0, NULL, NULL, STD_C89 }
};

#define gcc_tdiag_flag_specs gcc_diag_flag_specs
#define gcc_cdiag_flag_specs gcc_diag_flag_specs
#define gcc_cxxdiag_flag_specs gcc_diag_flag_specs
#define gcc_gfc_flag_specs gcc_diag_flag_specs
#define gcc_dump_printf_flag_specs gcc_diag_flag_specs

/* Flag entries for scanf formats; '*' is assignment suppression, and
   'w' and 'L' stand for the field width and the length modifier.  */
static const format_flag_spec scanf_flag_specs[] =
{
  { '*',  0, 0, 0, N_("assignment suppression"), N_("the assignment suppression scanf feature"), STD_C89 },
  { 'a',  0, 0, 0, N_("'a' flag"),               N_("the 'a' scanf flag"),                       STD_EXT },
  { 'm',  0, 0, 0, N_("'m' flag"),               N_("the 'm' scanf flag"),                       STD_EXT },
  { 'w',  0, 0, 0, N_("field width"),            N_("field width in scanf format"),              STD_C89 },
  { 'L',  0, 0, 0, N_("length modifier"),        N_("length modifier in scanf format"),          STD_C89 },
  { '\'', 0, 0, 0, N_("''' flag"),               N_("the ''' scanf flag"),                       STD_EXT },
  { 'I',  0, 0, 0, N_("'I' flag"),               N_("the 'I' scanf flag"),                       STD_EXT },
  { 0, 0, 0, 0, NULL, NULL, STD_C89 }
};

/* Pairs of scanf flag characters, ending with an all-zero entry.  */
static const format_flag_pair scanf_flag_pairs[] =
{
  { '*', 'L', 0, 0 },
  { 'a', 'm', 0, 0 },
  { 0, 0, 0, 0 }
};

/* Flag and modifier entries for strftime formats.  The two entries
   whose second member is nonzero ('o' and 'p') have no short name and
   share the description "the 'O' modifier".  */
static const format_flag_spec strftime_flag_specs[] =
{
  { '_', 0,   0, 0, N_("'_' flag"),     N_("the '_' strftime flag"),          STD_EXT },
  { '-', 0,   0, 0, N_("'-' flag"),     N_("the '-' strftime flag"),          STD_EXT },
  { '0', 0,   0, 0, N_("'0' flag"),     N_("the '0' strftime flag"),          STD_EXT },
  { '^', 0,   0, 0, N_("'^' flag"),     N_("the '^' strftime flag"),          STD_EXT },
  { '#', 0,   0, 0, N_("'#' flag"),     N_("the '#' strftime flag"),          STD_EXT },
  { 'w', 0,   0, 0, N_("field width"),  N_("field width in strftime format"), STD_EXT },
  { 'E', 0,   0, 0, N_("'E' modifier"), N_("the 'E' strftime modifier"),      STD_C99 },
  { 'O', 0,   0, 0, N_("'O' modifier"), N_("the 'O' strftime modifier"),      STD_C99 },
  { 'O', 'o', 0, 0, NULL,               N_("the 'O' modifier"),               STD_EXT },
  { 'O', 'p', 0, 0, NULL,               N_("the 'O' modifier"),               STD_C23 },
  { 0, 0, 0, 0, NULL, NULL, STD_C89 }
};

/* Pairs of strftime flag characters, ending with an all-zero entry.  */
static const format_flag_pair strftime_flag_pairs[] =
{
  { 'E', 'O', 0, 0 },
  { '_', '-', 0, 0 },
  { '_', '0', 0, 0 },
  { '-', '0', 0, 0 },
  { '^', '#', 0, 0 },
  { 0, 0, 0, 0 }
};

/* Flag entries for strfmon formats.  '=' is the fill character entry
   and the only one whose third member is 1; '#' and 'p' stand for the
   left and right precision.  */
static const format_flag_spec strfmon_flag_specs[] =
{
  { '=',  0, 1, 0, N_("fill character"),  N_("fill character in strfmon format"),  STD_C89 },
  { '^',  0, 0, 0, N_("'^' flag"),        N_("the '^' strfmon flag"),              STD_C89 },
  { '+',  0, 0, 0, N_("'+' flag"),        N_("the '+' strfmon flag"),              STD_C89 },
  { '(',  0, 0, 0, N_("'(' flag"),        N_("the '(' strfmon flag"),              STD_C89 },
  { '!',  0, 0, 0, N_("'!' flag"),        N_("the '!' strfmon flag"),              STD_C89 },
  { '-',  0, 0, 0, N_("'-' flag"),        N_("the '-' strfmon flag"),              STD_C89 },
  { 'w',  0, 0, 0, N_("field width"),     N_("field width in strfmon format"),     STD_C89 },
  { '#',  0, 0, 0, N_("left precision"),  N_("left precision in strfmon format"),  STD_C89 },
  { 'p',  0, 0, 0, N_("right precision"), N_("right precision in strfmon format"), STD_C89 },
  { 'L',  0, 0, 0, N_("length modifier"), N_("length modifier in strfmon format"), STD_C89 },
  { 0, 0, 0, 0, NULL, NULL, STD_C89 }
};

/* Pairs of strfmon flag characters, ending with an all-zero entry.  */
static const format_flag_pair strfmon_flag_pairs[] =
{
  { '+', '(', 0, 0 },
  { 0, 0, 0, 0 }
};

/* Conversion specifiers for printf formats.  Each entry starts with
   the conversion characters it covers and carries a brace-enclosed
   list of twenty per-length-modifier slots, where BADLEN marks a slot
   with no valid type.  The list ends with an entry whose characters
   are NULL.
   NOTE(review): the remaining members are declared with
   format_char_info in c-format.h -- confirm their meaning there.  */
static const format_char_info print_char_table[] =
{
  /* C89 conversion specifiers.  */
  { "di",  0, STD_C89, { T89_I, T99_SC, T89_S, T89_L, T9L_LL, TEX_LL, T99_SST, T99_PD, T99_IM, BADLEN, BADLEN, BADLEN, T23_I8, T23_I16, T23_I32, T23_I64, T23_IF8, T23_IF16, T23_IF32, T23_IF64 }, "-wp0 +'I", "i", NULL },
  { "oxX", 0, STD_C89, { T89_UI, T99_UC, T89_US, T89_UL, T9L_ULL, TEX_ULL, T99_ST, T99_UPD, T99_UIM, BADLEN, BADLEN, BADLEN, T23_U8, T23_U16, T23_U32, T23_U64, T23_UF8, T23_UF16, T23_UF32, T23_UF64 }, "-wp0#", "i", NULL },
  { "u",   0, STD_C89, { T89_UI, T99_UC, T89_US, T89_UL, T9L_ULL, TEX_ULL, T99_ST, T99_UPD, T99_UIM, BADLEN, BADLEN, BADLEN, T23_U8, T23_U16, T23_U32, T23_U64, T23_UF8, T23_UF16, T23_UF32, T23_UF64 }, "-wp0'I", "i", NULL },
  { "fgG", 0, STD_C89, { T89_D, BADLEN, BADLEN, T99_D, BADLEN, T89_LD, BADLEN, BADLEN, BADLEN, T23_D32, T23_D64, T23_D128, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0 +#'I", "", NULL },
  { "eE",  0, STD_C89, { T89_D, BADLEN, BADLEN, T99_D, BADLEN, T89_LD, BADLEN, BADLEN, BADLEN, T23_D32, T23_D64, T23_D128, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0 +#I", "", NULL },
  { "c",   0, STD_C89, { T89_I, BADLEN, BADLEN, T94_WI, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-w", "", NULL },
  { "s",   1, STD_C89, { T89_C, BADLEN, BADLEN, T94_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp", "cR", NULL },
  { "p",   1, STD_C89, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-w", "c", NULL },
  { "n",   1, STD_C89, { T89_I, T99_SC, T89_S, T89_L, T9L_LL, BADLEN, T99_SST, T99_PD, T99_IM, BADLEN, BADLEN, BADLEN, T23_I8, T23_I16, T23_I32, T23_I64, T23_IF8, T23_IF16, T23_IF32, T23_IF64 }, "", "W", NULL },
  /* C99 conversion specifiers.  */
  { "F",   0, STD_C99, { T99_D, BADLEN, BADLEN, T99_D, BADLEN, T99_LD, BADLEN, BADLEN, BADLEN, T23_D32, T23_D64, T23_D128, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0 +#'I", "", NULL },
  { "aA",  0, STD_C99, { T99_D, BADLEN, BADLEN, T99_D, BADLEN, T99_LD, BADLEN, BADLEN, BADLEN, T23_D32, T23_D64, T23_D128, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0 +#", "", NULL },
  /* C23 conversion specifiers.  */
  { "bB",  0, STD_C23, { T23_UI, T23_UC, T23_US, T23_UL, T23_ULL, TEX_ULL, T23_ST, T23_UPD, T23_UIM, BADLEN, BADLEN, BADLEN, T23_U8, T23_U16, T23_U32, T23_U64, T23_UF8, T23_UF16, T23_UF32, T23_UF64 }, "-wp0#", "i", NULL },
  /* X/Open conversion specifiers.  */
  { "C",   0, STD_EXT, { TEX_WI, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-w", "", NULL },
  { "S",   1, STD_EXT, { TEX_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp", "R", NULL },
  /* GNU conversion specifiers.  */
  { "m",   0, STD_EXT, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp", "", NULL },
  { NULL,  0, STD_C89, NOLENGTHS, NULL, NULL, NULL }
};

/* Conversion specifiers for asm_fprintf formats.  The explicit
   per-length lists here spell out twelve slots, and entries that use
   NOARGUMENTS carry no per-length list of their own.  */
static const format_char_info asm_fprintf_char_table[] =
{
  /* C89 conversion specifiers.  */
  { "di",  0, STD_C89, { T89_I, BADLEN, BADLEN, T89_L, T9L_LL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0 +", "i", NULL },
  { "oxX", 0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0#", "i", NULL },
  { "u",   0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp0", "i", NULL },
  { "c",   0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-w", "", NULL },
  { "s",   1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "-wp", "cR", NULL },

  /* asm_fprintf conversion specifiers.  */
  { "O",   0, STD_C89, NOARGUMENTS, "",      "",   NULL },
  { "R",   0, STD_C89, NOARGUMENTS, "",      "",   NULL },
  { "I",   0, STD_C89, NOARGUMENTS, "",      "",   NULL },
  { "L",   0, STD_C89, NOARGUMENTS, "",      "",   NULL },
  { "U",   0, STD_C89, NOARGUMENTS, "",      "",   NULL },
  { "r",   0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "", NULL },
  { "z",   0, STD_C89, NOARGUMENTS, "",      "",   NULL },
  { "@",   0, STD_C89, NOARGUMENTS, "",      "",   NULL },
  { NULL,  0, STD_C89, NOLENGTHS, NULL, NULL, NULL }
};

/* GCC-specific format_char_info arrays.  */

/* The conversion specifiers implemented within pp_format, and thus supported
   by all pretty_printer instances within GCC.
*/

/* Note that the last entry of the macro, "Z", is the only one whose
   final member is not NULL: it points at &gcc_diag_char_table[0].  The
   macro expands to a comma-separated run of initializers with no
   trailing comma, so each user writes the comma after it.  */
#define PP_FORMAT_CHAR_TABLE \
  { "di",  0, STD_C89, { T89_I, BADLEN, BADLEN, T89_L, T9L_LL, BADLEN, T99_SST, T99_PD, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, \
  { "ox",  0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, T99_ST, T99_UPD, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, \
  { "u",   0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, T99_ST, T99_UPD, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, \
  { "c",   0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL }, \
  { "s",   1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "pq", "cR", NULL }, \
  { "p",   1, STD_C89, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "c", NULL }, \
  { "r",   1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "//cR", NULL }, \
  { "@",   1, STD_C89, { T_EVENT_PTR, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, \
  { "e",   1, STD_C89, { T_PP_ELEMENT_PTR, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL }, \
  { "<",   0, STD_C89, NOARGUMENTS, "", "<", NULL }, \
  { ">",   0, STD_C89, NOARGUMENTS, "", ">", NULL }, \
  { "'" ,  0, STD_C89, NOARGUMENTS, "", "", NULL }, \
  { "{",   1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "cR", NULL }, \
  { "}",   0, STD_C89, NOARGUMENTS, "", "", NULL }, \
  { "R",   0, STD_C89, NOARGUMENTS, "", "\\", NULL }, \
  { "m",   0, STD_C89, NOARGUMENTS, "q", "", NULL }, \
  { "Z",   1, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "", &gcc_diag_char_table[0] }

/* Conversion specifiers for the generic GCC diagnostic format: just
   the pp_format set followed by the terminating entry.  */
static const format_char_info gcc_diag_char_table[] =
{
  /* The conversion specifiers implemented within pp_format.  */
  PP_FORMAT_CHAR_TABLE,

  { NULL,  0, STD_C89, NOLENGTHS, NULL, NULL, NULL }
};

static const format_char_info gcc_tdiag_char_table[] =
{
  /* The conversion specifiers implemented within pp_format.  */
  PP_FORMAT_CHAR_TABLE,

  /* Custom conversion specifiers implemented by default_tree_printer.  */

  /* These will require a "tree" at runtime.  */
  { "DFTV", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "'", NULL },
  { "E", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "", NULL },

  { NULL,  0, STD_C89, NOLENGTHS, NULL, NULL, NULL }
};

static const format_char_info gcc_cdiag_char_table[] =
{
  /* The conversion specifiers implemented within pp_format.  */
  PP_FORMAT_CHAR_TABLE,

  /* Custom conversion specifiers implemented by c_tree_printer.  */

  /* These will require a "tree" at runtime.  */
  { "DFTV", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "'", NULL },
  { "E", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "", NULL },

  { "v", 0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q#", "", NULL },

  { NULL,  0, STD_C89, NOLENGTHS, NULL, NULL, NULL }
};

static const format_char_info gcc_cxxdiag_char_table[] =
{
  /* The conversion specifiers implemented within pp_format.  */
  PP_FORMAT_CHAR_TABLE,

  /* Custom conversion specifiers implemented by cp_printer.  */

  /* These will require a "tree" at runtime.  */
  { "ADFHISTVX",1,STD_C89,{ T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+#", "'", NULL },
  { "E", 1,STD_C89,{ T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+#", "", NULL },

  /* These accept either an 'int' or an 'enum tree_code' (which is handled as an 'int'.)  */
  { "CLOPQ",0,STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL },

  { NULL,  0, STD_C89, NOLENGTHS, NULL, NULL, NULL }
};

/* Conversion specifiers for the Fortran diagnostic format.  Unlike the
   tables above, this one does not start from PP_FORMAT_CHAR_TABLE but
   lists its entries explicitly.  */
static const format_char_info gcc_gfc_char_table[] =
{
  /* C89 conversion specifiers.  */
  { "di",  0, STD_C89, { T89_I, BADLEN, BADLEN, T89_L, T9L_LL, BADLEN, T99_SST, T99_PD, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL },
  { "u",   0, STD_C89, { T89_UI, BADLEN, BADLEN, T89_UL, T9L_ULL, BADLEN, T99_ST, T99_UPD, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL },
  { "c",   0, STD_C89, { T89_I, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "", NULL },
  { "s",   1, STD_C89, { T89_C, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q", "cR", NULL },

  /* gfc conversion specifiers.  */

  { "C",   0, STD_C89, NOARGUMENTS, "", "", NULL },

  /* This will require a "locus" at runtime.  */
  { "L",   0, STD_C89, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "R", NULL },

  /* These will require a "tree" at runtime.  */
  { "DFTV", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "'", NULL },
  { "E", 1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "q+", "", NULL },

  /* These will require nothing.  */
  { "<>",0, STD_C89, NOARGUMENTS, "", "", NULL },
  { NULL,  0, STD_C89, NOLENGTHS, NULL, NULL, NULL }
};

static const format_char_info gcc_dump_printf_char_table[] =
{
  /* The conversion specifiers implemented within pp_format.  */
  PP_FORMAT_CHAR_TABLE,

  /* Custom conversion specifiers implemented by dump_pretty_printer.  */

  /* E and G require a "gimple *" argument at runtime.  */
  { "EG",   1, STD_C89, { T89_G, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL },

  /* C requires a "cgraph_node *" argument at runtime.  */
  { "C",   1, STD_C89, { T_CGRAPH_NODE, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL },

  /* T requires a "tree" at runtime.  */
  { "T",   1, STD_C89, { T89_T, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL },

  /* %f requires a "double"; it doesn't support modifiers.  */
  { "f",   0, STD_C89, { T89_D, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "", "\"", NULL },

  { NULL,  0, STD_C89, NOLENGTHS, NULL, NULL, NULL }
};

static const format_char_info scan_char_table[] =
{
  /* C89 conversion specifiers.  */
  { "di",    1, STD_C89, { T89_I, T99_SC, T89_S, T89_L, T9L_LL, TEX_LL, T99_SST, T99_PD, T99_IM, BADLEN, BADLEN, BADLEN, T23_I8, T23_I16, T23_I32, T23_I64, T23_IF8, T23_IF16, T23_IF32, T23_IF64 }, "*w'I", "W", NULL },
  { "u",     1, STD_C89, { T89_UI, T99_UC, T89_US, T89_UL, T9L_ULL, TEX_ULL, T99_ST, T99_UPD, T99_UIM, BADLEN, BADLEN, BADLEN, T23_U8, T23_U16, T23_U32, T23_U64, T23_UF8, T23_UF16, T23_UF32, T23_UF64 }, "*w'I", "W", NULL },
  { "oxX",   1, STD_C89, { T89_UI, T99_UC, T89_US, T89_UL, T9L_ULL, TEX_ULL, T99_ST, T99_UPD, T99_UIM, BADLEN, BADLEN, BADLEN, T23_U8, T23_U16, T23_U32, T23_U64, T23_UF8, T23_UF16, T23_UF32, T23_UF64 }, "*w", "W", NULL },
  { "efgEG", 1, STD_C89, { T89_F, BADLEN, BADLEN, T89_D, BADLEN, T89_LD, BADLEN, BADLEN, BADLEN, T23_D32, T23_D64, T23_D128, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*w'", "W", NULL },
  { "c",     1, STD_C89, { T89_C, BADLEN, BADLEN, T94_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*mw", "cW", NULL },
  { "s",     1, STD_C89, { T89_C, BADLEN, BADLEN, T94_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*amw", "cW", NULL },
  { "[",     1, STD_C89, { T89_C, BADLEN, BADLEN, T94_W, BADLEN, BADLEN, BADLEN,
BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*amw", "cW[", NULL }, { "p", 2, STD_C89, { T89_V, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*w", "W", NULL }, { "n", 1, STD_C89, { T89_I, T99_SC, T89_S, T89_L, T9L_LL, BADLEN, T99_SST, T99_PD, T99_IM, BADLEN, BADLEN, BADLEN, T23_I8, T23_I16, T23_I32, T23_I64, T23_IF8, T23_IF16, T23_IF32, T23_IF64 }, "", "W", NULL }, /* C99 conversion specifiers. */ { "F", 1, STD_C99, { T99_F, BADLEN, BADLEN, T99_D, BADLEN, T99_LD, BADLEN, BADLEN, BADLEN, T23_D32, T23_D64, T23_D128, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*w'", "W", NULL }, { "aA", 1, STD_C99, { T99_F, BADLEN, BADLEN, T99_D, BADLEN, T99_LD, BADLEN, BADLEN, BADLEN, T23_D32, T23_D64, T23_D128, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*w'", "W", NULL }, /* C23 conversion specifiers. */ { "b", 1, STD_C23, { T23_UI, T23_UC, T23_US, T23_UL, T23_ULL, TEX_ULL, T23_ST, T23_UPD, T23_UIM, BADLEN, BADLEN, BADLEN, T23_U8, T23_U16, T23_U32, T23_U64, T23_UF8, T23_UF16, T23_UF32, T23_UF64 }, "*w", "W", NULL }, /* X/Open conversion specifiers. */ { "C", 1, STD_EXT, { TEX_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*mw", "W", NULL }, { "S", 1, STD_EXT, { TEX_W, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "*amw", "W", NULL }, { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } }; static const format_char_info time_char_table[] = { /* C89 conversion specifiers. 
*/ { "AZa", 0, STD_C89, NOLENGTHS, "^#", "", NULL }, { "Bb", 0, STD_C89, NOLENGTHS, "O^#", "p", NULL }, { "cx", 0, STD_C89, NOLENGTHS, "E", "3", NULL }, { "HIMSUWdmw", 0, STD_C89, NOLENGTHS, "-_0Ow", "", NULL }, { "j", 0, STD_C89, NOLENGTHS, "-_0Ow", "o", NULL }, { "p", 0, STD_C89, NOLENGTHS, "#", "", NULL }, { "X", 0, STD_C89, NOLENGTHS, "E", "", NULL }, { "y", 0, STD_C89, NOLENGTHS, "EO-_0w", "4", NULL }, { "Y", 0, STD_C89, NOLENGTHS, "-_0EOw", "o", NULL }, { "%", 0, STD_C89, NOLENGTHS, "", "", NULL }, /* C99 conversion specifiers. */ { "C", 0, STD_C99, NOLENGTHS, "-_0EOw", "o", NULL }, { "D", 0, STD_C99, NOLENGTHS, "", "2", NULL }, { "eVu", 0, STD_C99, NOLENGTHS, "-_0Ow", "", NULL }, { "FRTnrt", 0, STD_C99, NOLENGTHS, "", "", NULL }, { "g", 0, STD_C99, NOLENGTHS, "O-_0w", "2o", NULL }, { "G", 0, STD_C99, NOLENGTHS, "-_0Ow", "o", NULL }, { "h", 0, STD_C99, NOLENGTHS, "^#", "", NULL }, { "z", 0, STD_C99, NOLENGTHS, "O", "o", NULL }, /* GNU conversion specifiers. */ { "kls", 0, STD_EXT, NOLENGTHS, "-_0Ow", "", NULL }, { "P", 0, STD_EXT, NOLENGTHS, "", "", NULL }, { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } }; static const format_char_info monetary_char_table[] = { { "in", 0, STD_C89, { T89_D, BADLEN, BADLEN, BADLEN, BADLEN, T89_LD, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN, BADLEN }, "=^+(!-w#p", "", NULL }, { NULL, 0, STD_C89, NOLENGTHS, NULL, NULL, NULL } }; /* This must be in the same order as enum format_type. 
*/ static const format_kind_info format_types_orig[] = { { "gnu_printf", printf_length_specs, print_char_table, " +#0-'I", NULL, printf_flag_specs, printf_flag_pairs, FMT_FLAG_ARG_CONVERT|FMT_FLAG_DOLLAR_MULTIPLE|FMT_FLAG_USE_DOLLAR|FMT_FLAG_EMPTY_PREC_OK, 'w', 0, 'p', 0, 'L', 0, &integer_type_node, &integer_type_node }, { "asm_fprintf", asm_fprintf_length_specs, asm_fprintf_char_table, " +#0-", NULL, asm_fprintf_flag_specs, asm_fprintf_flag_pairs, FMT_FLAG_ARG_CONVERT|FMT_FLAG_EMPTY_PREC_OK, 'w', 0, 'p', 0, 'L', 0, NULL, NULL }, { "gcc_diag", gcc_diag_length_specs, gcc_diag_char_table, "q+#", NULL, gcc_diag_flag_specs, gcc_diag_flag_pairs, FMT_FLAG_ARG_CONVERT, 0, 0, 'p', 0, 'L', 0, NULL, &integer_type_node }, { "gcc_tdiag", gcc_tdiag_length_specs, gcc_tdiag_char_table, "q+#", NULL, gcc_tdiag_flag_specs, gcc_tdiag_flag_pairs, FMT_FLAG_ARG_CONVERT, 0, 0, 'p', 0, 'L', 0, NULL, &integer_type_node }, { "gcc_cdiag", gcc_cdiag_length_specs, gcc_cdiag_char_table, "q+#", NULL, gcc_cdiag_flag_specs, gcc_cdiag_flag_pairs, FMT_FLAG_ARG_CONVERT, 0, 0, 'p', 0, 'L', 0, NULL, &integer_type_node }, { "gcc_cxxdiag", gcc_cxxdiag_length_specs, gcc_cxxdiag_char_table, "q+#", NULL, gcc_cxxdiag_flag_specs, gcc_cxxdiag_flag_pairs, FMT_FLAG_ARG_CONVERT, 0, 0, 'p', 0, 'L', 0, NULL, &integer_type_node }, { "gcc_gfc", gcc_gfc_length_specs, gcc_gfc_char_table, "q+#", NULL, gcc_gfc_flag_specs, gcc_gfc_flag_pairs, FMT_FLAG_ARG_CONVERT, 0, 0, 0, 0, 0, 0, NULL, NULL }, { "gcc_dump_printf", gcc_dump_printf_length_specs, gcc_dump_printf_char_table, "q+#", NULL, gcc_dump_printf_flag_specs, gcc_dump_printf_flag_pairs, FMT_FLAG_ARG_CONVERT, 0, 0, 'p', 0, 'L', 0, NULL, &integer_type_node }, { "NSString", NULL, NULL, NULL, NULL, NULL, NULL, FMT_FLAG_ARG_CONVERT|FMT_FLAG_PARSE_ARG_CONVERT_EXTERNAL, 0, 0, 0, 0, 0, 0, NULL, NULL }, { "gnu_scanf", scanf_length_specs, scan_char_table, "*'I", NULL, scanf_flag_specs, scanf_flag_pairs, 
FMT_FLAG_ARG_CONVERT|FMT_FLAG_SCANF_A_KLUDGE|FMT_FLAG_USE_DOLLAR|FMT_FLAG_ZERO_WIDTH_BAD|FMT_FLAG_DOLLAR_GAP_POINTER_OK, 'w', 0, 0, '*', 'L', 'm', NULL, NULL }, { "gnu_strftime", NULL, time_char_table, "_-0^#", "EO", strftime_flag_specs, strftime_flag_pairs, FMT_FLAG_FANCY_PERCENT_OK, 'w', 0, 0, 0, 0, 0, NULL, NULL }, { "gnu_strfmon", strfmon_length_specs, monetary_char_table, "=^+(!-", NULL, strfmon_flag_specs, strfmon_flag_pairs, FMT_FLAG_ARG_CONVERT, 'w', '#', 'p', 0, 'L', 0, NULL, NULL } }; /* This layer of indirection allows GCC to reassign format_types with new data if necessary, while still allowing the original data to be const. */ static const format_kind_info *format_types = format_types_orig; /* We can modify this one. We also add target-specific format types to the end of the array. */ static format_kind_info *dynamic_format_types; static int n_format_types = ARRAY_SIZE (format_types_orig); /* Structure detailing the results of checking a format function call where the format expression may be a conditional expression with many leaves resulting from nested conditional expressions. */ struct format_check_results { format_check_results (location_t format_string_loc_) : number_non_literal (0), number_extra_args (0), extra_arg_loc (UNKNOWN_LOCATION), number_dollar_extra_args (0), number_wide (0), number_non_char (0), number_empty (0), number_unterminated (0), number_other (0), format_string_loc (format_string_loc_) { } /* Number of leaves of the format argument that could not be checked as they were not string literals. */ int number_non_literal; /* Number of leaves of the format argument that were null pointers or string literals, but had extra format arguments. */ int number_extra_args; location_t extra_arg_loc; /* Number of leaves of the format argument that were null pointers or string literals, but had extra format arguments and used $ operand numbers. 
*/ int number_dollar_extra_args; /* Number of leaves of the format argument that were wide string literals. */ int number_wide; /* Number of leaves of the format argument that are not array of "char". */ int number_non_char; /* Number of leaves of the format argument that were empty strings. */ int number_empty; /* Number of leaves of the format argument that were unterminated strings. */ int number_unterminated; /* Number of leaves of the format argument that were not counted above. */ int number_other; /* Location of the format string. */ location_t format_string_loc; }; struct format_check_context { format_check_context (format_check_results *res, function_format_info *info, tree params, vec *arglocs, bool (*comp_types) (tree, tree)) : m_res (res), m_info (info), m_params (params), m_arglocs (arglocs), m_comp_types (comp_types) { } format_check_results *m_res; function_format_info *m_info; tree m_params; vec *m_arglocs; bool (*m_comp_types) (tree, tree); }; /* Return the format name (as specified in the original table) for the format type indicated by format_num. */ static const char * format_name (int format_num) { if (format_num >= 0 && format_num < n_format_types) return format_types[format_num].name; gcc_unreachable (); } /* Return the format flags (as specified in the original table) for the format type indicated by format_num. 
*/ static int format_flags (int format_num) { if (format_num >= 0 && format_num < n_format_types) return format_types[format_num].flags; gcc_unreachable (); } static void check_format_info (function_format_info *, tree, vec *, bool (*comp_types) (tree, tree)); static void check_format_arg (void *, tree, unsigned HOST_WIDE_INT); static void check_format_info_main (format_check_results *, function_format_info *, const char *, location_t, tree, int, tree, unsigned HOST_WIDE_INT, object_allocator &, vec *, bool (*comp_types) (tree, tree)); static void init_dollar_format_checking (int, tree); static int maybe_read_dollar_number (const char **, int, tree, tree *, const format_kind_info *); static bool avoid_dollar_number (const char *); static void finish_dollar_format_checking (format_check_results *, int); static const format_flag_spec *get_flag_spec (const format_flag_spec *, int, const char *); static void check_format_types (const substring_loc &fmt_loc, format_wanted_type *, const format_kind_info *fki, int offset_to_type_start, char conversion_char, vec *arglocs, bool (*comp_types) (tree, tree)); static void format_type_warning (const substring_loc &fmt_loc, location_t param_loc, format_wanted_type *, tree, tree, const format_kind_info *fki, int offset_to_type_start, char conversion_char); /* Decode a format type from a string, returning the type, or format_type_error if not valid, in which case the caller should print an error message. On success, when IS_RAW is non-null, set *IS_RAW when the format type corresponds to a GCC "raw" diagnostic formatting function and clear it otherwise. */ static format_type decode_format_type (const char *s, bool *is_raw /* = NULL */) { bool is_raw_buf; if (!is_raw) is_raw = &is_raw_buf; *is_raw = false; s = convert_format_name_to_system_name (s); size_t slen = strlen (s); for (int i = 0; i < n_format_types; i++) { /* Check for a match with no underscores. 
*/ if (!strcmp (s, format_types[i].name)) return static_cast (i); /* Check for leading and trailing underscores. */ size_t alen = strlen (format_types[i].name); if (slen == alen + 4 && s[0] == '_' && s[1] == '_' && s[slen - 1] == '_' && s[slen - 2] == '_' && !strncmp (s + 2, format_types[i].name, alen)) return static_cast(i); /* Check for the "_raw" suffix and no leading underscores. */ if (slen == alen + 4 && !strncmp (s, format_types[i].name, alen) && !strcmp (s + alen, "_raw")) { *is_raw = true; return static_cast(i); } /* Check for the "_raw__" suffix and leading underscores. */ if (slen == alen + 8 && s[0] == '_' && s[1] == '_' && !strncmp (s + 2, format_types[i].name, alen) && !strcmp (s + 2 + alen, "_raw__")) { *is_raw = true; return static_cast(i); } } return format_type_error; } /* Check the argument list of a call to printf, scanf, etc. ATTRS are the attributes on the function type. There are NARGS argument values in the array ARGARRAY. FN is either a function declaration or function type. Also, if -Wsuggest-attribute=format, warn for calls to vprintf or vscanf in functions with no such format attribute themselves. */ void check_function_format (const_tree fn, tree attrs, int nargs, tree *argarray, vec *arglocs, bool (*comp_types) (tree, tree)) { tree a; tree atname = get_identifier ("format"); bool skipped_default_format = false; /* See if this function has any format attributes. */ for (a = attrs; a; a = TREE_CHAIN (a)) { if (is_attribute_p ("format", get_attribute_name (a))) { /* Yup; check it. */ function_format_info info; decode_format_attr (fn, atname, TREE_VALUE (a), &info, /*validated=*/true); /* Mingw32 targets have traditionally used ms_printf format for the printf function, and this format is built in GCC. But nowadays, if mingw-w64 is configured to target UCRT, the printf function uses the gnu_printf format (specified in the stdio.h header). 
This causes GCC to check both formats, which means that GCC would warn twice about the same issue when both formats are violated, e.g. for %lu used to print long long unsigned. Hence, if there is a built-in attribute specifier and at least one another, we skip the built-in one. See PR 95130 (but note that GCC ms_printf already supports %llu) and PR 92292. */ if (!skipped_default_format && fn && TREE_CODE (fn) == FUNCTION_DECL && fndecl_built_in_p (fn, BUILT_IN_NORMAL) && (tree_to_uhwi (TREE_PURPOSE (TREE_VALUE (a))) & (int) ATTR_FLAG_BUILT_IN)) { tree aa; for (aa = attrs; aa; aa = TREE_CHAIN (aa)) if (a != aa && is_attribute_p ("format", get_attribute_name (aa))) { skipped_default_format = true; break; } if (skipped_default_format) continue; } if (warn_format) { /* FIXME: Rewrite all the internal functions in this file to use the ARGARRAY directly instead of constructing this temporary list. */ tree params = NULL_TREE; int i; for (i = nargs - 1; i >= 0; i--) params = tree_cons (NULL_TREE, argarray[i], params); check_format_info (&info, params, arglocs, comp_types); } /* Attempt to detect whether the current function might benefit from the format attribute if the called function is decorated with it. Avoid using calls with string literal formats for guidance since those are unlikely to be viable candidates. */ if (warn_suggest_attribute_format && current_function_decl != NULL_TREE && info.first_arg_num == 0 && (format_types[info.format_type].flags & (int) FMT_FLAG_ARG_CONVERT) /* c_strlen will fail for a function parameter but succeed for a literal or constant array. 
*/ && !c_strlen (argarray[info.format_num - 1], 1)) { tree c; for (c = TYPE_ATTRIBUTES (TREE_TYPE (current_function_decl)); c; c = TREE_CHAIN (c)) if (is_attribute_p ("format", get_attribute_name (c)) && (decode_format_type (IDENTIFIER_POINTER (TREE_VALUE (TREE_VALUE (c)))) == info.format_type)) break; if (c == NULL_TREE) { /* Check if the current function has a parameter to which the format attribute could be attached; if not, it can't be a candidate for a format attribute, despite the vprintf-like or vscanf-like call. */ tree args; for (args = DECL_ARGUMENTS (current_function_decl); args != 0; args = DECL_CHAIN (args)) { if (TREE_CODE (TREE_TYPE (args)) == POINTER_TYPE && (TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (args))) == char_type_node)) break; } if (args != 0) warning (OPT_Wsuggest_attribute_format, "function %qD " "might be a candidate for %qs format attribute", current_function_decl, format_types[info.format_type].name); } } } } } /* Variables used by the checking of $ operand number formats. */ static char *dollar_arguments_used = NULL; static char *dollar_arguments_pointer_p = NULL; static int dollar_arguments_alloc = 0; static int dollar_arguments_count; static int dollar_first_arg_num; static int dollar_max_arg_used; static int dollar_format_warned; /* Initialize the checking for a format string that may contain $ parameter number specifications; we will need to keep track of whether each parameter has been used. FIRST_ARG_NUM is the number of the first argument that is a parameter to the format, or 0 for a vprintf-style function; PARAMS is the list of arguments starting at this argument. 
*/ static void init_dollar_format_checking (int first_arg_num, tree params) { tree oparams = params; dollar_first_arg_num = first_arg_num; dollar_arguments_count = 0; dollar_max_arg_used = 0; dollar_format_warned = 0; if (first_arg_num > 0) { while (params) { dollar_arguments_count++; params = TREE_CHAIN (params); } } if (dollar_arguments_alloc < dollar_arguments_count) { free (dollar_arguments_used); free (dollar_arguments_pointer_p); dollar_arguments_alloc = dollar_arguments_count; dollar_arguments_used = XNEWVEC (char, dollar_arguments_alloc); dollar_arguments_pointer_p = XNEWVEC (char, dollar_arguments_alloc); } if (dollar_arguments_alloc) { memset (dollar_arguments_used, 0, dollar_arguments_alloc); if (first_arg_num > 0) { int i = 0; params = oparams; while (params) { dollar_arguments_pointer_p[i] = (TREE_CODE (TREE_TYPE (TREE_VALUE (params))) == POINTER_TYPE); params = TREE_CHAIN (params); i++; } } } } /* Look for a decimal number followed by a $ in *FORMAT. If DOLLAR_NEEDED is set, it is an error if one is not found; otherwise, it is OK. If such a number is found, check whether it is within range and mark that numbered operand as being used for later checking. Returns the operand number if found and within range, zero if no such number was found and this is OK, or -1 on error. PARAMS points to the first operand of the format; PARAM_PTR is made to point to the parameter referred to. If a $ format is found, *FORMAT is updated to point just after it. 
*/ static int maybe_read_dollar_number (const char **format, int dollar_needed, tree params, tree *param_ptr, const format_kind_info *fki) { int argnum; int overflow_flag; const char *fcp = *format; if (!ISDIGIT (*fcp)) { if (dollar_needed) { warning (OPT_Wformat_, "missing $ operand number in format"); return -1; } else return 0; } argnum = 0; overflow_flag = 0; while (ISDIGIT (*fcp)) { HOST_WIDE_INT nargnum = HOST_WIDE_INT_UC (10) * argnum + (*fcp - '0'); if ((int) nargnum != nargnum) overflow_flag = 1; argnum = nargnum; fcp++; } if (*fcp != '$') { if (dollar_needed) { warning (OPT_Wformat_, "missing $ operand number in format"); return -1; } else return 0; } *format = fcp + 1; if (pedantic && !dollar_format_warned) { warning (OPT_Wformat_, "%s does not support %%n$ operand number formats", C_STD_NAME (STD_EXT)); dollar_format_warned = 1; } if (overflow_flag || argnum == 0 || (dollar_first_arg_num && argnum > dollar_arguments_count)) { warning (OPT_Wformat_, "operand number out of range in format"); return -1; } if (argnum > dollar_max_arg_used) dollar_max_arg_used = argnum; /* For vprintf-style functions we may need to allocate more memory to track which arguments are used. 
*/ while (dollar_arguments_alloc < dollar_max_arg_used) { int nalloc; nalloc = 2 * dollar_arguments_alloc + 16; dollar_arguments_used = XRESIZEVEC (char, dollar_arguments_used, nalloc); dollar_arguments_pointer_p = XRESIZEVEC (char, dollar_arguments_pointer_p, nalloc); memset (dollar_arguments_used + dollar_arguments_alloc, 0, nalloc - dollar_arguments_alloc); dollar_arguments_alloc = nalloc; } if (!(fki->flags & (int) FMT_FLAG_DOLLAR_MULTIPLE) && dollar_arguments_used[argnum - 1] == 1) { dollar_arguments_used[argnum - 1] = 2; warning (OPT_Wformat_, "format argument %d used more than once in %s format", argnum, fki->name); } else dollar_arguments_used[argnum - 1] = 1; if (dollar_first_arg_num) { int i; *param_ptr = params; for (i = 1; i < argnum && *param_ptr != 0; i++) *param_ptr = TREE_CHAIN (*param_ptr); /* This case shouldn't be caught here. */ gcc_assert (*param_ptr); } else *param_ptr = 0; return argnum; } /* Ensure that FORMAT does not start with a decimal number followed by a $; give a diagnostic and return true if it does, false otherwise. */ static bool avoid_dollar_number (const char *format) { if (!ISDIGIT (*format)) return false; while (ISDIGIT (*format)) format++; if (*format == '$') { warning (OPT_Wformat_, "%<$%>operand number used after format without operand number"); return true; } return false; } /* Finish the checking for a format string that used $ operand number formats instead of non-$ formats. We check for unused operands before used ones (a serious error, since the implementation of the format function can't know what types to pass to va_arg to find the later arguments). and for unused operands at the end of the format (if we know how many arguments the format had, so not for vprintf). If there were operand numbers out of range on a non-vprintf-style format, we won't have reached here. If POINTER_GAP_OK, unused arguments are OK if all arguments are pointers. 
*/ static void finish_dollar_format_checking (format_check_results *res, int pointer_gap_ok) { int i; bool found_pointer_gap = false; for (i = 0; i < dollar_max_arg_used; i++) { if (!dollar_arguments_used[i]) { if (pointer_gap_ok && (dollar_first_arg_num == 0 || dollar_arguments_pointer_p[i])) found_pointer_gap = true; else warning_at (res->format_string_loc, OPT_Wformat_, "format argument %d unused before used argument %d " "in %<$%>-style format", i + 1, dollar_max_arg_used); } } if (found_pointer_gap || (dollar_first_arg_num && dollar_max_arg_used < dollar_arguments_count)) { res->number_other--; res->number_dollar_extra_args++; } } /* Retrieve the specification for a format flag. SPEC contains the specifications for format flags for the applicable kind of format. FLAG is the flag in question. If PREDICATES is NULL, the basic spec for that flag must be retrieved and must exist. If PREDICATES is not NULL, it is a string listing possible predicates for the spec entry; if an entry predicated on any of these is found, it is returned, otherwise NULL is returned. */ static const format_flag_spec * get_flag_spec (const format_flag_spec *spec, int flag, const char *predicates) { int i; for (i = 0; spec[i].flag_char != 0; i++) { if (spec[i].flag_char != flag) continue; if (predicates != NULL) { if (spec[i].predicate != 0 && strchr (predicates, spec[i].predicate) != 0) return &spec[i]; } else if (spec[i].predicate == 0) return &spec[i]; } gcc_assert (predicates); return NULL; } /* Check the argument list of a call to printf, scanf, etc. INFO points to the function_format_info structure. PARAMS is the list of argument values. */ static void check_format_info (function_format_info *info, tree params, vec *arglocs, bool (*comp_types) (tree, tree)) { unsigned HOST_WIDE_INT arg_num; tree format_tree; /* Skip to format argument. If the argument isn't available, there's no work for us to do; prototype checking will catch the problem. 
*/ for (arg_num = 1; ; ++arg_num) { if (params == 0) return; if (arg_num == info->format_num) break; params = TREE_CHAIN (params); } format_tree = TREE_VALUE (params); params = TREE_CHAIN (params); if (format_tree == 0) return; format_check_results res (input_location); format_check_context format_ctx (&res, info, params, arglocs, comp_types); check_function_arguments_recurse (check_format_arg, &format_ctx, format_tree, arg_num, OPT_Wformat_); location_t loc = format_ctx.m_res->format_string_loc; if (res.number_non_literal > 0) { /* Functions taking a va_list normally pass a non-literal format string. These functions typically are declared with first_arg_num == 0, so avoid warning in those cases. */ if (!(format_types[info->format_type].flags & (int) FMT_FLAG_ARG_CONVERT)) { /* For strftime-like formats, warn for not checking the format string; but there are no arguments to check. */ warning_at (loc, OPT_Wformat_nonliteral, "format not a string literal, format string not checked"); } else if (info->first_arg_num != 0) { /* If there are no arguments for the format at all, we may have printf (foo) which is likely to be a security hole. */ while (arg_num + 1 < info->first_arg_num) { if (params == 0) break; params = TREE_CHAIN (params); ++arg_num; } if (params == 0 && warn_format_security) warning_at (loc, OPT_Wformat_security, "format not a string literal and no format arguments"); else if (params == 0 && warn_format_nonliteral) warning_at (loc, OPT_Wformat_nonliteral, "format not a string literal and no format arguments"); else warning_at (loc, OPT_Wformat_nonliteral, "format not a string literal, argument types not checked"); } } /* If there were extra arguments to the format, normally warn. 
However, the standard does say extra arguments are ignored, so in the specific case where we have multiple leaves (conditional expressions or ngettext) allow extra arguments if at least one leaf didn't have extra arguments, but was otherwise OK (either non-literal or checked OK). If the format is an empty string, this should be counted similarly to the case of extra format arguments. */ if (res.number_extra_args > 0 && res.number_non_literal == 0 && res.number_other == 0) { if (res.extra_arg_loc == UNKNOWN_LOCATION) res.extra_arg_loc = loc; warning_at (res.extra_arg_loc, OPT_Wformat_extra_args, "too many arguments for format"); } if (res.number_dollar_extra_args > 0 && res.number_non_literal == 0 && res.number_other == 0) warning_at (loc, OPT_Wformat_extra_args, "unused arguments in %<$%>-style format"); if (res.number_empty > 0 && res.number_non_literal == 0 && res.number_other == 0) warning_at (loc, OPT_Wformat_zero_length, "zero-length %s format string", format_types[info->format_type].name); if (res.number_wide > 0) warning_at (loc, OPT_Wformat_, "format is a wide character string"); if (res.number_non_char > 0) warning_at (loc, OPT_Wformat_, "format string is not an array of type %qs", "char"); if (res.number_unterminated > 0) warning_at (loc, OPT_Wformat_, "unterminated format string"); } /* Callback from check_function_arguments_recurse to check a format string. FORMAT_TREE is the format parameter. ARG_NUM is the number of the format argument. CTX points to a format_check_context. 
*/
static void
check_format_arg (void *ctx, tree format_tree,
                  unsigned HOST_WIDE_INT arg_num)
{
  /* Unpack the context that check_format_info built.  */
  format_check_context *format_ctx = (format_check_context *) ctx;
  format_check_results *res = format_ctx->m_res;
  function_format_info *info = format_ctx->m_info;
  tree params = format_ctx->m_params;
  vec<location_t> *arglocs = format_ctx->m_arglocs;
  bool (*comp_types) (tree, tree) = format_ctx->m_comp_types;

  int format_length;
  HOST_WIDE_INT offset;
  const char *format_chars;
  tree array_size = 0;
  tree array_init;

  location_t fmt_param_loc = EXPR_LOC_OR_LOC (format_tree, input_location);

  /* Pull out a constant value if the front end didn't, and handle location
     wrappers.  */
  format_tree = fold_for_warn (format_tree);
  STRIP_NOPS (format_tree);

  if (integer_zerop (format_tree))
    {
      /* Skip to first argument to check, so we can see if this format
         has any arguments (it shouldn't).  */
      while (arg_num + 1 < info->first_arg_num)
        {
          if (params == 0)
            return;
          params = TREE_CHAIN (params);
          ++arg_num;
        }

      if (params == 0)
        res->number_other++;
      else
        {
          /* Remember where the first extra argument was seen.  */
          if (res->number_extra_args == 0)
            res->extra_arg_loc = EXPR_LOC_OR_LOC (TREE_VALUE (params),
                                                  input_location);
          res->number_extra_args++;
        }
      return;
    }

  /* Peel off a constant offset added to the pointer, if any.  */
  offset = 0;
  if (TREE_CODE (format_tree) == POINTER_PLUS_EXPR)
    {
      tree arg0, arg1;

      arg0 = TREE_OPERAND (format_tree, 0);
      arg1 = TREE_OPERAND (format_tree, 1);
      STRIP_NOPS (arg0);
      STRIP_NOPS (arg1);
      if (TREE_CODE (arg1) == INTEGER_CST)
        format_tree = arg0;
      else
        {
          res->number_non_literal++;
          return;
        }
      /* POINTER_PLUS_EXPR offsets are to be interpreted signed.  */
      if (!cst_and_fits_in_hwi (arg1))
        {
          res->number_non_literal++;
          return;
        }
      offset = int_cst_value (arg1);
    }
  if (TREE_CODE (format_tree) != ADDR_EXPR)
    {
      res->number_non_literal++;
      return;
    }
  res->format_string_loc = EXPR_LOC_OR_LOC (format_tree, input_location);
  format_tree = TREE_OPERAND (format_tree, 0);
  if (format_types[info->format_type].flags
      & (int) FMT_FLAG_PARSE_ARG_CONVERT_EXTERNAL)
    {
      bool objc_str = (info->format_type == gcc_objc_string_format_type);
      /* We cannot examine this string here - but we can check that it is
         a valid type.  */
      if (TREE_CODE (format_tree) != CONST_DECL
          || !((objc_str && objc_string_ref_type_p (TREE_TYPE (format_tree)))
                || (*targetcm.string_object_ref_type_p)
                                     ((const_tree) TREE_TYPE (format_tree))))
        {
          res->number_non_literal++;
          return;
        }
      /* Skip to first argument to check.  */
      while (arg_num + 1 < info->first_arg_num)
        {
          if (params == 0)
            return;
          params = TREE_CHAIN (params);
          ++arg_num;
        }
      /* So, we have a valid literal string object and one or more params.
         We need to use an external helper to parse the string into format
         info.  For Objective-C variants we provide the resource within the
         objc tree, for target variants, via a hook.  */
      if (objc_str)
        objc_check_format_arg (format_tree, params);
      else if (targetcm.check_string_object_format_arg)
        (*targetcm.check_string_object_format_arg) (format_tree, params);
      /* Else we can't handle it and retire quietly.  */
      return;
    }
  /* Fold a constant array index into OFFSET.  The array is only stepped
     into when the combined offset stays non-negative.  */
  if (TREE_CODE (format_tree) == ARRAY_REF
      && tree_fits_shwi_p (TREE_OPERAND (format_tree, 1))
      && (offset += tree_to_shwi (TREE_OPERAND (format_tree, 1))) >= 0)
    format_tree = TREE_OPERAND (format_tree, 0);
  if (offset < 0)
    {
      res->number_non_literal++;
      return;
    }
  if (VAR_P (format_tree)
      && TREE_CODE (TREE_TYPE (format_tree)) == ARRAY_TYPE
      && (array_init = decl_constant_value (format_tree)) != format_tree
      && TREE_CODE (array_init) == STRING_CST)
    {
      /* Extract the string constant initializer.  Note that this may include
         a trailing NUL character that is not in the array (e.g.
         const char a[3] = "foo";).  */
      array_size = DECL_SIZE_UNIT (format_tree);
      format_tree = array_init;
    }
  if (TREE_CODE (format_tree) != STRING_CST)
    {
      res->number_non_literal++;
      return;
    }
  tree underlying_type
    = TYPE_MAIN_VARIANT (TREE_TYPE (TREE_TYPE (format_tree)));
  if (underlying_type != char_type_node
      && !(flag_char8_t && underlying_type == char8_type_node))
    {
      if (underlying_type == char16_type_node
          || underlying_type == char32_type_node
          || underlying_type == wchar_type_node)
        res->number_wide++;
      else
        res->number_non_char++;
      return;
    }
  format_chars = TREE_STRING_POINTER (format_tree);
  format_length = TREE_STRING_LENGTH (format_tree);
  if (array_size != 0)
    {
      /* Variable length arrays can't be initialized.  */
      gcc_assert (TREE_CODE (array_size) == INTEGER_CST);

      if (tree_fits_shwi_p (array_size))
        {
          /* Clamp the length to the array, so that an initializer longer
             than the array is not read past the array's end.  */
          HOST_WIDE_INT array_size_value = tree_to_shwi (array_size);
          if (array_size_value > 0
              && array_size_value == (int) array_size_value
              && format_length > array_size_value)
            format_length = array_size_value;
        }
    }
  if (offset)
    {
      if (offset >= format_length)
        {
          res->number_non_literal++;
          return;
        }
      format_chars += offset;
      format_length -= offset;
    }
  /* The last byte must be the terminating NUL; it is dropped from
     FORMAT_LENGTH here.  */
  if (format_length < 1 || format_chars[--format_length] != 0)
    {
      res->number_unterminated++;
      return;
    }
  if (format_length == 0)
    {
      res->number_empty++;
      return;
    }

  /* Skip to first argument to check.  */
  while (arg_num + 1 < info->first_arg_num)
    {
      if (params == 0)
        return;
      params = TREE_CHAIN (params);
      ++arg_num;
    }
  /* Provisionally increment res->number_other; check_format_info_main
     will decrement it if it finds there are extra arguments, but this way
     need not adjust it for every return.  */
  res->number_other++;
  object_allocator<format_wanted_type> fwt_pool ("format_wanted_type pool");
  check_format_info_main (res, info, format_chars, fmt_param_loc, format_tree,
                          format_length, params, arg_num, fwt_pool, arglocs,
                          comp_types);
}

/* Support class for argument_parser and check_format_info_main. Tracks any flag characters that have been applied to the current argument.
*/

class flag_chars_t
{
 public:
  flag_chars_t ();
  /* Return true if CH has been recorded as a flag.  */
  bool has_char_p (char ch) const;
  /* Append CH to the recorded flags.  */
  void add_char (char ch);
  /* Warn about recorded flags that are not valid for the conversion
     described by FCI, and drop them from the recorded set.  */
  void validate (const format_kind_info *fki,
                 const format_char_info *fci,
                 const format_flag_spec *flag_specs,
                 const char * const format_chars,
                 tree format_string_cst,
                 location_t format_string_loc,
                 const char * const orig_format_chars,
                 char format_char,
                 bool quoted);
  /* Return 1 if an assignment-allocation flag was recorded, else 0.  */
  int get_alloc_flag (const format_kind_info *fki);
  /* Return 1 if FKI's suppression character was recorded, else 0.  */
  int assignment_suppression_p (const format_kind_info *fki);

 private:
  /* The flags seen so far, stored as a NUL-terminated string.  */
  char m_flag_chars[256];
};

/* Support class for argument_parser and check_format_info_main.
   Encapsulates any length modifier applied to the current argument.  */

class length_modifier
{
 public:
  /* The default: no length modifier present.  */
  length_modifier ()
  : chars (NULL), val (FMT_LEN_none), std (STD_C89),
    scalar_identity_flag (0)
  {
  }

  length_modifier (const char *chars_,
                   enum format_lengths val_,
                   enum format_std_version std_,
                   int scalar_identity_flag_)
  : chars (chars_), val (val_), std (std_),
    scalar_identity_flag (scalar_identity_flag_)
  {
  }

  /* Spelling of the modifier, or NULL if there is none.  */
  const char *chars;
  /* Which modifier this is; used to index a conversion's type table.  */
  enum format_lengths val;
  /* Standard version associated with the modifier.  */
  enum format_std_version std;
  /* Copied into the scalar_identity_flag of the wanted type for the
     argument.  */
  int scalar_identity_flag;
};

/* Parsing one argument within a format string.
*/ class argument_parser { public: argument_parser (function_format_info *info, const char *&format_chars, tree format_string_cst, const char * const orig_format_chars, location_t format_string_loc, flag_chars_t &flag_chars, int &has_operand_number, tree first_fillin_param, object_allocator &fwt_pool_, vec *arglocs, bool (*comp_types) (tree, tree)); bool read_any_dollar (); bool read_format_flags (); bool read_any_format_width (tree ¶ms, unsigned HOST_WIDE_INT &arg_num); void read_any_format_left_precision (); bool read_any_format_precision (tree ¶ms, unsigned HOST_WIDE_INT &arg_num); void handle_alloc_chars (); length_modifier read_any_length_modifier (); void read_any_other_modifier (); const format_char_info *find_format_char_info (char format_char); void validate_flag_pairs (const format_char_info *fci, char format_char); void give_y2k_warnings (const format_char_info *fci, char format_char); void parse_any_scan_set (const format_char_info *fci); bool handle_conversions (const format_char_info *fci, const length_modifier &len_modifier, tree &wanted_type, const char *&wanted_type_name, unsigned HOST_WIDE_INT &arg_num, tree ¶ms, char format_char); bool check_argument_type (const format_char_info *fci, const length_modifier &len_modifier, tree &wanted_type, const char *&wanted_type_name, const bool suppressed, unsigned HOST_WIDE_INT &arg_num, tree ¶ms, const int alloc_flag, const char * const format_start, const char * const type_start, location_t fmt_param_loc, char conversion_char); private: const function_format_info *const info; const format_kind_info * const fki; const format_flag_spec * const flag_specs; const char *start_of_this_format; const char *&format_chars; const tree format_string_cst; const char * const orig_format_chars; const location_t format_string_loc; object_allocator &fwt_pool; flag_chars_t &flag_chars; int main_arg_num; tree main_arg_params; int &has_operand_number; const tree first_fillin_param; format_wanted_type width_wanted_type; 
format_wanted_type precision_wanted_type; public: format_wanted_type main_wanted_type; private: format_wanted_type *first_wanted_type; format_wanted_type *last_wanted_type; vec *arglocs; bool (*m_comp_types) (tree, tree); }; /* flag_chars_t's constructor. */ flag_chars_t::flag_chars_t () { m_flag_chars[0] = 0; } /* Has CH been seen as a flag within the current argument? */ bool flag_chars_t::has_char_p (char ch) const { return strchr (m_flag_chars, ch) != 0; } /* Add CH to the flags seen within the current argument. */ void flag_chars_t::add_char (char ch) { int i = strlen (m_flag_chars); m_flag_chars[i++] = ch; m_flag_chars[i] = 0; } /* Validate the individual flags used, removing any that are invalid. */ void flag_chars_t::validate (const format_kind_info *fki, const format_char_info *fci, const format_flag_spec *flag_specs, const char * const format_chars, tree format_string_cst, location_t format_string_loc, const char * const orig_format_chars, char format_char, bool quoted) { int i; int d = 0; bool quotflag = false; for (i = 0; m_flag_chars[i] != 0; i++) { const format_flag_spec *s = get_flag_spec (flag_specs, m_flag_chars[i], NULL); m_flag_chars[i - d] = m_flag_chars[i]; if (m_flag_chars[i] == fki->length_code_char) continue; /* Remember if a quoting flag is seen. */ quotflag |= s->quoting; if (strchr (fci->flag_chars, m_flag_chars[i]) == 0) { format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars, OPT_Wformat_, "%s used with %<%%%c%> %s format", _(s->name), format_char, fki->name); d++; continue; } if (pedantic) { const format_flag_spec *t; if (ADJ_STD (s->std) > C_STD_VER) warning_at (format_string_loc, OPT_Wformat_, "%s does not support %s", C_STD_NAME (s->std), _(s->long_name)); t = get_flag_spec (flag_specs, m_flag_chars[i], fci->flags2); if (t != NULL && ADJ_STD (t->std) > ADJ_STD (s->std)) { const char *long_name = (t->long_name != NULL ? 
t->long_name : s->long_name); if (ADJ_STD (t->std) > C_STD_VER) warning_at (format_string_loc, OPT_Wformat_, "%s does not support %s with" " the %<%%%c%> %s format", C_STD_NAME (t->std), _(long_name), format_char, fki->name); } } /* Detect quoting directives used within a quoted sequence, such as GCC's "%<...%qE". */ if (quoted && s->quoting) { format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars - 1, OPT_Wformat_, "%s used within a quoted sequence", _(s->name)); } } m_flag_chars[i - d] = 0; if (!quoted && !quotflag && strchr (fci->flags2, '\'')) { format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars, OPT_Wformat_, "%qc conversion used unquoted", format_char); } } /* Determine if an assignment-allocation has been set, requiring an extra char ** for writing back a dynamically-allocated char *. This is for handling the optional 'm' character in scanf. */ int flag_chars_t::get_alloc_flag (const format_kind_info *fki) { if ((fki->flags & (int) FMT_FLAG_SCANF_A_KLUDGE) && has_char_p ('a')) return 1; if (fki->alloc_char && has_char_p (fki->alloc_char)) return 1; return 0; } /* Determine if an assignment-suppression character was seen. ('*' in scanf, for discarding the converted input). */ int flag_chars_t::assignment_suppression_p (const format_kind_info *fki) { if (fki->suppression_char && has_char_p (fki->suppression_char)) return 1; return 0; } /* Constructor for argument_parser. Initialize for parsing one argument within a format string. 
*/ argument_parser:: argument_parser (function_format_info *info_, const char *&format_chars_, tree format_string_cst_, const char * const orig_format_chars_, location_t format_string_loc_, flag_chars_t &flag_chars_, int &has_operand_number_, tree first_fillin_param_, object_allocator &fwt_pool_, vec *arglocs_, bool (*comp_types) (tree, tree)) : info (info_), fki (&format_types[info->format_type]), flag_specs (fki->flag_specs), start_of_this_format (format_chars_), format_chars (format_chars_), format_string_cst (format_string_cst_), orig_format_chars (orig_format_chars_), format_string_loc (format_string_loc_), fwt_pool (fwt_pool_), flag_chars (flag_chars_), main_arg_num (0), main_arg_params (NULL), has_operand_number (has_operand_number_), first_fillin_param (first_fillin_param_), first_wanted_type (NULL), last_wanted_type (NULL), arglocs (arglocs_), m_comp_types (comp_types) { } /* Handle dollars at the start of format arguments, setting up main_arg_params and main_arg_num. Return true if format parsing is to continue, false otherwise. */ bool argument_parser::read_any_dollar () { if ((fki->flags & (int) FMT_FLAG_USE_DOLLAR) && has_operand_number != 0) { /* Possibly read a $ operand number at the start of the format. If one was previously used, one is required here. If one is not used here, we can't immediately conclude this is a format without them, since it could be printf %m or scanf %*. */ int opnum; opnum = maybe_read_dollar_number (&format_chars, 0, first_fillin_param, &main_arg_params, fki); if (opnum == -1) return false; else if (opnum > 0) { has_operand_number = 1; main_arg_num = opnum + info->first_arg_num - 1; } } else if (fki->flags & FMT_FLAG_USE_DOLLAR) { if (avoid_dollar_number (format_chars)) return false; } return true; } /* Read any format flags, but do not yet validate them beyond removing duplicates, since in general validation depends on the rest of the format. Return true if format parsing is to continue, false otherwise. 
*/ bool argument_parser::read_format_flags () { while (*format_chars != 0 && strchr (fki->flag_chars, *format_chars) != 0) { const format_flag_spec *s = get_flag_spec (flag_specs, *format_chars, NULL); if (flag_chars.has_char_p (*format_chars)) { format_warning_at_char (format_string_loc, format_string_cst, format_chars + 1 - orig_format_chars, OPT_Wformat_, "repeated %s in format", _(s->name)); } else flag_chars.add_char (*format_chars); if (s->skip_next_char) { ++format_chars; if (*format_chars == 0) { warning_at (format_string_loc, OPT_Wformat_, "missing fill character at end of strfmon format"); return false; } } ++format_chars; } return true; } /* Read any format width, possibly * or *m$. Return true if format parsing is to continue, false otherwise. */ bool argument_parser:: read_any_format_width (tree ¶ms, unsigned HOST_WIDE_INT &arg_num) { if (!fki->width_char) return true; if (fki->width_type != NULL && *format_chars == '*') { flag_chars.add_char (fki->width_char); /* "...a field width...may be indicated by an asterisk. In this case, an int argument supplies the field width..." 
*/ ++format_chars; if (has_operand_number != 0) { int opnum; opnum = maybe_read_dollar_number (&format_chars, has_operand_number == 1, first_fillin_param, ¶ms, fki); if (opnum == -1) return false; else if (opnum > 0) { has_operand_number = 1; arg_num = opnum + info->first_arg_num - 1; } else has_operand_number = 0; } else { if (avoid_dollar_number (format_chars)) return false; } if (info->first_arg_num != 0) { tree cur_param; if (params == 0) cur_param = NULL; else { cur_param = TREE_VALUE (params); if (has_operand_number <= 0) { params = TREE_CHAIN (params); ++arg_num; } } width_wanted_type.wanted_type = *fki->width_type; width_wanted_type.wanted_type_name = NULL; width_wanted_type.pointer_count = 0; width_wanted_type.char_lenient_flag = 0; width_wanted_type.scalar_identity_flag = 0; width_wanted_type.writing_in_flag = 0; width_wanted_type.reading_from_flag = 0; width_wanted_type.kind = CF_KIND_FIELD_WIDTH; width_wanted_type.format_start = format_chars - 1; width_wanted_type.format_length = 1; width_wanted_type.param = cur_param; width_wanted_type.arg_num = arg_num; width_wanted_type.offset_loc = format_chars - orig_format_chars; width_wanted_type.next = NULL; if (last_wanted_type != 0) last_wanted_type->next = &width_wanted_type; if (first_wanted_type == 0) first_wanted_type = &width_wanted_type; last_wanted_type = &width_wanted_type; } } else { /* Possibly read a numeric width. If the width is zero, we complain if appropriate. */ int non_zero_width_char = false; int found_width = false; while (ISDIGIT (*format_chars)) { found_width = true; if (*format_chars != '0') non_zero_width_char = true; ++format_chars; } if (found_width && !non_zero_width_char && (fki->flags & (int) FMT_FLAG_ZERO_WIDTH_BAD)) warning_at (format_string_loc, OPT_Wformat_, "zero width in %s format", fki->name); if (found_width) flag_chars.add_char (fki->width_char); } return true; } /* Read any format left precision (must be a number, not *). 
*/ void argument_parser::read_any_format_left_precision () { if (fki->left_precision_char == 0) return; if (*format_chars != '#') return; ++format_chars; flag_chars.add_char (fki->left_precision_char); if (!ISDIGIT (*format_chars)) format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars, OPT_Wformat_, "empty left precision in %s format", fki->name); while (ISDIGIT (*format_chars)) ++format_chars; } /* Read any format precision, possibly * or *m$. Return true if format parsing is to continue, false otherwise. */ bool argument_parser:: read_any_format_precision (tree ¶ms, unsigned HOST_WIDE_INT &arg_num) { if (fki->precision_char == 0) return true; if (*format_chars != '.') return true; ++format_chars; flag_chars.add_char (fki->precision_char); if (fki->precision_type != NULL && *format_chars == '*') { /* "...a...precision...may be indicated by an asterisk. In this case, an int argument supplies the...precision." */ ++format_chars; if (has_operand_number != 0) { int opnum; opnum = maybe_read_dollar_number (&format_chars, has_operand_number == 1, first_fillin_param, ¶ms, fki); if (opnum == -1) return false; else if (opnum > 0) { has_operand_number = 1; arg_num = opnum + info->first_arg_num - 1; } else has_operand_number = 0; } else { if (avoid_dollar_number (format_chars)) return false; } if (info->first_arg_num != 0) { tree cur_param; if (params == 0) cur_param = NULL; else { cur_param = TREE_VALUE (params); if (has_operand_number <= 0) { params = TREE_CHAIN (params); ++arg_num; } } precision_wanted_type.wanted_type = *fki->precision_type; precision_wanted_type.wanted_type_name = NULL; precision_wanted_type.pointer_count = 0; precision_wanted_type.char_lenient_flag = 0; precision_wanted_type.scalar_identity_flag = 0; precision_wanted_type.writing_in_flag = 0; precision_wanted_type.reading_from_flag = 0; precision_wanted_type.kind = CF_KIND_FIELD_PRECISION; precision_wanted_type.param = cur_param; 
precision_wanted_type.format_start = format_chars - 2; precision_wanted_type.format_length = 2; precision_wanted_type.arg_num = arg_num; precision_wanted_type.offset_loc = format_chars - orig_format_chars; precision_wanted_type.next = NULL; if (last_wanted_type != 0) last_wanted_type->next = &precision_wanted_type; if (first_wanted_type == 0) first_wanted_type = &precision_wanted_type; last_wanted_type = &precision_wanted_type; } } else { if (!(fki->flags & (int) FMT_FLAG_EMPTY_PREC_OK) && !ISDIGIT (*format_chars)) format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars, OPT_Wformat_, "empty precision in %s format", fki->name); while (ISDIGIT (*format_chars)) ++format_chars; } return true; } /* Parse any assignment-allocation flags, which request an extra char ** for writing back a dynamically-allocated char *. This is for handling the optional 'm' character in scanf, and, before C99, 'a' (for compatibility with a non-standard GNU libc extension). */ void argument_parser::handle_alloc_chars () { if (fki->alloc_char && fki->alloc_char == *format_chars) { flag_chars.add_char (fki->alloc_char); format_chars++; } /* Handle the scanf allocation kludge. */ if (fki->flags & (int) FMT_FLAG_SCANF_A_KLUDGE) { if (*format_chars == 'a' && !flag_isoc99) { if (format_chars[1] == 's' || format_chars[1] == 'S' || format_chars[1] == '[') { /* 'a' is used as a flag. */ flag_chars.add_char ('a'); format_chars++; } } } } /* Look for length modifiers within the current format argument, returning a length_modifier instance describing it (or the default if one is not found). Issue warnings about non-standard modifiers. 
*/ length_modifier argument_parser::read_any_length_modifier () { length_modifier result; const format_length_info *fli = fki->length_char_specs; if (!fli) return result; while (fli->name != 0 && strncmp (fli->name, format_chars, strlen (fli->name))) fli++; if (fli->name != 0) { format_chars += strlen (fli->name); if (fli->double_name != 0 && fli->name[0] == *format_chars) { format_chars++; result = length_modifier (fli->double_name, fli->double_index, fli->double_std, 0); } else { result = length_modifier (fli->name, fli->index, fli->std, fli->scalar_identity_flag); } flag_chars.add_char (fki->length_code_char); } if (pedantic) { /* Warn if the length modifier is non-standard. */ if (ADJ_STD (result.std) > C_STD_VER) warning_at (format_string_loc, OPT_Wformat_, "%s does not support the %qs %s length modifier", C_STD_NAME (result.std), result.chars, fki->name); } return result; } /* Read any other modifier (strftime E/O). */ void argument_parser::read_any_other_modifier () { if (fki->modifier_chars == NULL) return; while (*format_chars != 0 && strchr (fki->modifier_chars, *format_chars) != 0) { if (flag_chars.has_char_p (*format_chars)) { const format_flag_spec *s = get_flag_spec (flag_specs, *format_chars, NULL); format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars, OPT_Wformat_, "repeated %s in format", _(s->name)); } else flag_chars.add_char (*format_chars); ++format_chars; } } /* Return the format_char_info corresponding to FORMAT_CHAR, potentially issuing a warning if the format char is not supported in the C standard version we are checking against. Issue a warning and return NULL if it is not found. Issue warnings about non-standard modifiers. 
*/ const format_char_info * argument_parser::find_format_char_info (char format_char) { const format_char_info *fci = fki->conversion_specs; while (fci->format_chars != 0 && strchr (fci->format_chars, format_char) == 0) ++fci; if (fci->format_chars == 0) { format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars, OPT_Wformat_, "unknown conversion type character" " %qc in format", format_char); return NULL; } if (pedantic) { if (ADJ_STD (fci->std) > C_STD_VER) format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars, OPT_Wformat_, "%s does not support the %<%%%c%> %s format", C_STD_NAME (fci->std), format_char, fki->name); } return fci; } /* Validate the pairs of flags used. Issue warnings about incompatible combinations of flags. */ void argument_parser::validate_flag_pairs (const format_char_info *fci, char format_char) { const format_flag_pair * const bad_flag_pairs = fki->bad_flag_pairs; for (int i = 0; bad_flag_pairs[i].flag_char1 != 0; i++) { const format_flag_spec *s, *t; if (!flag_chars.has_char_p (bad_flag_pairs[i].flag_char1)) continue; if (!flag_chars.has_char_p (bad_flag_pairs[i].flag_char2)) continue; if (bad_flag_pairs[i].predicate != 0 && strchr (fci->flags2, bad_flag_pairs[i].predicate) == 0) continue; s = get_flag_spec (flag_specs, bad_flag_pairs[i].flag_char1, NULL); t = get_flag_spec (flag_specs, bad_flag_pairs[i].flag_char2, NULL); if (bad_flag_pairs[i].ignored) { if (bad_flag_pairs[i].predicate != 0) warning_at (format_string_loc, OPT_Wformat_, "%s ignored with %s and %<%%%c%> %s format", _(s->name), _(t->name), format_char, fki->name); else warning_at (format_string_loc, OPT_Wformat_, "%s ignored with %s in %s format", _(s->name), _(t->name), fki->name); } else { if (bad_flag_pairs[i].predicate != 0) warning_at (format_string_loc, OPT_Wformat_, "use of %s and %s together with %<%%%c%> %s format", _(s->name), _(t->name), format_char, fki->name); else warning_at 
(format_string_loc, OPT_Wformat_, "use of %s and %s together in %s format", _(s->name), _(t->name), fki->name); } } } /* Give Y2K warnings. */ void argument_parser::give_y2k_warnings (const format_char_info *fci, char format_char) { if (!warn_format_y2k) return; int y2k_level = 0; if (strchr (fci->flags2, '4') != 0) if (flag_chars.has_char_p ('E')) y2k_level = 3; else y2k_level = 2; else if (strchr (fci->flags2, '3') != 0) y2k_level = 3; else if (strchr (fci->flags2, '2') != 0) y2k_level = 2; if (y2k_level == 3) warning_at (format_string_loc, OPT_Wformat_y2k, "%<%%%c%> yields only last 2 digits of " "year in some locales", format_char); else if (y2k_level == 2) warning_at (format_string_loc, OPT_Wformat_y2k, "%<%%%c%> yields only last 2 digits of year", format_char); } /* Parse any "scan sets" enclosed in square brackets, e.g. for scanf-style calls. */ void argument_parser::parse_any_scan_set (const format_char_info *fci) { if (strchr (fci->flags2, '[') == NULL) return; /* Skip over scan set, in case it happens to have '%' in it. */ if (*format_chars == '^') ++format_chars; /* Find closing bracket; if one is hit immediately, then it's part of the scan set rather than a terminator. */ if (*format_chars == ']') ++format_chars; while (*format_chars && *format_chars != ']') ++format_chars; if (*format_chars != ']') /* The end of the format string was reached. */ format_warning_at_char (format_string_loc, format_string_cst, format_chars - orig_format_chars, OPT_Wformat_, "no closing %<]%> for %<%%[%> format"); } /* Return true if this argument is to be continued to be parsed, false to skip to next argument. 
*/

bool
argument_parser::handle_conversions (const format_char_info *fci,
                                     const length_modifier &len_modifier,
                                     tree &wanted_type,
                                     const char *&wanted_type_name,
                                     unsigned HOST_WIDE_INT &arg_num,
                                     tree &params,
                                     char format_char)
{
  enum format_std_version wanted_type_std;

  if (!(fki->flags & (int) FMT_FLAG_ARG_CONVERT))
    return true;

  /* Look up the type wanted for this conversion with this length
     modifier; a null entry means the combination is not valid.  */
  wanted_type = (fci->types[len_modifier.val].type
                 ? *fci->types[len_modifier.val].type : 0);
  wanted_type_name = fci->types[len_modifier.val].name;
  wanted_type_std = fci->types[len_modifier.val].std;
  if (wanted_type == 0)
    {
      format_warning_at_char (format_string_loc, format_string_cst,
                              format_chars - orig_format_chars,
                              OPT_Wformat_,
                              "use of %qs length modifier with %qc type"
                              " character has either no effect"
                              " or undefined behavior",
                              len_modifier.chars, format_char);
      /* Heuristic: skip one argument when an invalid length/type
         combination is encountered.  */
      arg_num++;
      if (params != 0)
        params = TREE_CHAIN (params);
      return false;
    }
  else if (pedantic
           /* Warn if non-standard, provided it is more non-standard
              than the length and type characters that may already
              have been warned for.  */
           && ADJ_STD (wanted_type_std) > ADJ_STD (len_modifier.std)
           && ADJ_STD (wanted_type_std) > ADJ_STD (fci->std))
    {
      if (ADJ_STD (wanted_type_std) > C_STD_VER)
        format_warning_at_char (format_string_loc, format_string_cst,
                                format_chars - orig_format_chars,
                                OPT_Wformat_,
                                "%s does not support the %<%%%s%c%> %s format",
                                C_STD_NAME (wanted_type_std),
                                len_modifier.chars,
                                format_char, fki->name);
    }

  return true;
}

/* Check type of argument against desired type.

   Return true if format parsing is to continue, false otherwise.
*/ bool argument_parser:: check_argument_type (const format_char_info *fci, const length_modifier &len_modifier, tree &wanted_type, const char *&wanted_type_name, const bool suppressed, unsigned HOST_WIDE_INT &arg_num, tree ¶ms, const int alloc_flag, const char * const format_start, const char * const type_start, location_t fmt_param_loc, char conversion_char) { if (info->first_arg_num == 0) return true; if ((fci->pointer_count == 0 && wanted_type == void_type_node) || suppressed) { if (main_arg_num != 0) { if (suppressed) warning_at (format_string_loc, OPT_Wformat_, "operand number specified with " "suppressed assignment"); else warning_at (format_string_loc, OPT_Wformat_, "operand number specified for format " "taking no argument"); } } else { format_wanted_type *wanted_type_ptr; if (main_arg_num != 0) { arg_num = main_arg_num; params = main_arg_params; } else { ++arg_num; if (has_operand_number > 0) { warning_at (format_string_loc, OPT_Wformat_, "missing $ operand number in format"); return false; } else has_operand_number = 0; } wanted_type_ptr = &main_wanted_type; while (fci) { tree cur_param; if (params == 0) cur_param = NULL; else { cur_param = TREE_VALUE (params); params = TREE_CHAIN (params); } wanted_type_ptr->wanted_type = wanted_type; wanted_type_ptr->wanted_type_name = wanted_type_name; wanted_type_ptr->pointer_count = fci->pointer_count + alloc_flag; wanted_type_ptr->char_lenient_flag = 0; if (strchr (fci->flags2, 'c') != 0) wanted_type_ptr->char_lenient_flag = 1; wanted_type_ptr->scalar_identity_flag = 0; if (len_modifier.scalar_identity_flag) wanted_type_ptr->scalar_identity_flag = 1; wanted_type_ptr->writing_in_flag = 0; wanted_type_ptr->reading_from_flag = 0; if (alloc_flag) wanted_type_ptr->writing_in_flag = 1; else { if (strchr (fci->flags2, 'W') != 0) wanted_type_ptr->writing_in_flag = 1; if (strchr (fci->flags2, 'R') != 0) wanted_type_ptr->reading_from_flag = 1; } wanted_type_ptr->kind = CF_KIND_FORMAT; wanted_type_ptr->param = cur_param; 
wanted_type_ptr->arg_num = arg_num; wanted_type_ptr->format_start = format_start; wanted_type_ptr->format_length = format_chars - format_start; wanted_type_ptr->offset_loc = format_chars - orig_format_chars; wanted_type_ptr->next = NULL; if (last_wanted_type != 0) last_wanted_type->next = wanted_type_ptr; if (first_wanted_type == 0) first_wanted_type = wanted_type_ptr; last_wanted_type = wanted_type_ptr; fci = fci->chain; if (fci) { wanted_type_ptr = fwt_pool.allocate (); arg_num++; wanted_type = *fci->types[len_modifier.val].type; wanted_type_name = fci->types[len_modifier.val].name; } } } if (first_wanted_type != 0) { ptrdiff_t offset_to_format_start = (start_of_this_format - 1) - orig_format_chars; ptrdiff_t offset_to_format_end = (format_chars - 1) - orig_format_chars; /* By default, use the end of the range for the caret location. */ substring_loc fmt_loc (fmt_param_loc, TREE_TYPE (format_string_cst), offset_to_format_end, offset_to_format_start, offset_to_format_end); ptrdiff_t offset_to_type_start = type_start - orig_format_chars; check_format_types (fmt_loc, first_wanted_type, fki, offset_to_type_start, conversion_char, arglocs, m_comp_types); } return true; } /* Describes "paired tokens" within the format string that are expected to be balanced. */ class baltoks_t { public: baltoks_t (): singlequote (), doublequote () { } typedef auto_vec balanced_tokens_t; /* Vectors of pointers to opening brackets ('['), curly brackets ('{'), quoting directives (like GCC "%<"), parentheses, and angle brackets ('<'). Used to detect unbalanced tokens. */ balanced_tokens_t brackets; balanced_tokens_t curly; balanced_tokens_t quotdirs; balanced_tokens_t parens; balanced_tokens_t pointy; /* Pointer to the last opening quote. */ const char *singlequote; const char *doublequote; }; /* Describes a keyword, operator, or other name. */ struct token_t { const char *name; /* Keyword/operator name. */ unsigned char len; /* Its length. */ const char *alt; /* Alternate spelling. 
*/ }; /* Helper for initializing global token_t arrays below. */ #define NAME(name) { name, sizeof name - 1, NULL } /* C/C++ operators that are expected to be quoted within the format string. */ static const token_t c_opers[] = { NAME ("!="), NAME ("%="), NAME ("&&"), NAME ("&="), NAME ("*="), NAME ("++"), NAME ("+="), NAME ("--"), NAME ("-="), NAME ("->"), NAME ("/="), NAME ("<<"), NAME ("<<="), NAME ("<="), NAME ("=="), NAME (">="), NAME (">>="), NAME (">>"), NAME ("?:"), NAME ("^="), NAME ("|="), NAME ("||") }; static const token_t cxx_opers[] = { NAME ("->*"), NAME (".*"), NAME ("::"), NAME ("<=>") }; /* Common C/C++ keywords that are expected to be quoted within the format string. Keywords like auto, inline, or volatile are excluded because they are sometimes used in common terms like /auto variables/, /inline function/, or /volatile access/ where they should not be quoted. */ static const token_t c_keywords[] = { #undef NAME #define NAME(name, alt) { name, sizeof name - 1, alt } NAME ("alignas", NULL), NAME ("alignof", NULL), NAME ("asm", NULL), NAME ("bool", NULL), NAME ("char", NULL), NAME ("const %", NULL), NAME ("const-qualified", "%-qualified"), NAME ("float", NULL), NAME ("ifunc", NULL), NAME ("int", NULL), NAME ("long double", NULL), NAME ("long int", NULL), NAME ("long long", NULL), NAME ("malloc", NULL), NAME ("noclone", NULL), NAME ("noinline", NULL), NAME ("nonnull", NULL), NAME ("noreturn", NULL), NAME ("offsetof", NULL), NAME ("readonly", "read-only"), NAME ("readwrite", "read-write"), NAME ("restrict %", NULL), NAME ("restrict-qualified", "%-qualified"), NAME ("short int", NULL), NAME ("signed char", NULL), NAME ("signed int", NULL), NAME ("signed long", NULL), NAME ("signed short", NULL), NAME ("sizeof", NULL), NAME ("typeof", NULL), NAME ("unsigned char", NULL), NAME ("unsigned int", NULL), NAME ("unsigned long", NULL), NAME ("unsigned short", NULL), NAME ("volatile %", NULL), NAME ("volatile-qualified", "%-qualified"), NAME ("weakref", NULL), 
}; static const token_t cxx_keywords[] = { /* C++ only keywords and operators. */ NAME ("catch", NULL), NAME ("constexpr if", NULL), NAME ("constexpr", NULL), NAME ("constinit", NULL), NAME ("consteval", NULL), NAME ("decltype", NULL), NAME ("nullptr", NULL), NAME ("operator delete", NULL), NAME ("operator new", NULL), NAME ("typeid", NULL), NAME ("typeinfo", NULL) }; /* Blacklisted words such as misspellings that should be avoided in favor of the specified alternatives. */ static const struct { const char *name; /* Bad word. */ unsigned char len; /* Its length. */ const char *alt; /* Preferred alternative. */ } badwords[] = { NAME ("arg", "argument"), NAME ("bitfield", "bit-field"), NAME ("builtin function", "built-in function"), NAME ("can not", "cannot"), NAME ("commandline option", "command-line option"), NAME ("commandline", "command line"), NAME ("command line option", "command-line option"), NAME ("decl", "declaration"), NAME ("enumeral", "enumerated"), NAME ("floating point", "floating-point"), NAME ("nonstatic", "non-static"), NAME ("non-zero", "nonzero"), NAME ("reg", "register"), NAME ("stmt", "statement"), }; /* Common contractions that should be avoided in favor of the specified alternatives. */ static const struct { const char *name; /* Contraction. */ unsigned char len; /* Its length. */ const char *alt; /* Preferred alternative. */ } contrs[] = { NAME ("can't", "cannot"), NAME ("didn't", "did not"), /* These are commonly abused. Avoid diagnosing them for now. NAME ("isn't", "is not"), NAME ("don't", "is not"), */ NAME ("mustn't", "must not"), NAME ("needn't", "need not"), NAME ("should't", "should not"), NAME ("that's", "that is"), NAME ("there's", "there is"), NAME ("they're", "they are"), NAME ("what's", "what is"), NAME ("won't", "will not") }; /* Check for unquoted TOKENS. 
FORMAT_STRING_LOC is the location of the format string,
   FORMAT_STRING_CST the format string itself (as a tree),
   ORIG_FORMAT_CHARS and FORMAT_CHARS are pointers to the beginning
   of the format string and the character currently being processed,
   and BALTOKS describes paired "tokens" within the format string that
   are expected to be balanced.
   Returns a pointer to the last processed character or null when
   nothing was done.  */

/* TOKENS is an array of NTOKS entries.  Besides looking the text up
   in TOKENS, every call also checks for an unquoted __attribute__,
   a __atomic/__builtin/__sync name, an identifier containing an
   underscore, the misspellings in BADWORDS and the strings "c++" and
   "g++"; those checks run even when NTOKS is zero.  */

static const char*
check_tokens (const token_t *tokens, unsigned ntoks,
              location_t format_string_loc,
              tree format_string_cst,
              const char *orig_format_chars,
              const char *format_chars,
              baltoks_t &baltoks)
{
  /* For brevity.  */
  const int opt = OPT_Wformat_diag;
  /* Zero-based starting position of a problem sequence.  */
  int fmtchrpos = format_chars - orig_format_chars;

  /* For identifier-like "words," set to the word length.  */
  unsigned wlen = 0;
  /* Set for an operator, clear for an identifier/word.  */
  bool is_oper = false;
  /* Set when the word contains at least one underscore.  */
  bool underscore = false;

  if (format_chars[0] == '_' || ISALPHA (format_chars[0]))
    {
      /* Measure the maximal run of alphanumerics and underscores.  */
      while (format_chars[wlen] == '_' || ISALNUM (format_chars[wlen]))
        {
          underscore |= format_chars[wlen] == '_';
          ++wlen;
        }
    }
  else
    is_oper = true;

  for (unsigned i = 0; i != ntoks; ++i)
    {
      unsigned toklen = tokens[i].len;

      /* Skip tokens that are shorter than the word at FORMAT_CHARS and
         tokens that are not a prefix of the remaining text.  */
      if (toklen < wlen
          || strncmp (format_chars, tokens[i].name, toklen))
        continue;

      if (toklen == 2
          && format_chars - orig_format_chars > 0
          && (TOUPPER (format_chars[-1]) == 'C'
              || TOUPPER (format_chars[-1]) == 'G'))
        return format_chars + toklen - 1;   /* Reference to C++ or G++.  */

      if (ISPUNCT (format_chars[toklen - 1]))
        {
          if (format_chars[toklen - 1] == format_chars[toklen])
            return NULL;   /* Operator followed by a repeat of its
                              last character.  */
        }
      else if (ISALNUM (format_chars[toklen]))
        return NULL;   /* Keyword prefix for a longer word.  */

      if (toklen == 2
          && format_chars[0] == '-'
          && format_chars[1] == '-'
          && ISALNUM (format_chars[2]))
        return NULL;   /* Probably option like --help.  */

      /* Allow this ugly warning for the time being.  FORMAT_CHARS
         points at the ">=" of the phrase; FORMAT_CHARS + 10 is the
         'f' that ends its "of".  */
      if (toklen == 2
          && format_chars - orig_format_chars > 6
          && startswith (format_chars - 7, " count >= width of "))
        return format_chars + 10;

      /* The token is a type name if it ends in an alphabetic character
         and consists of more than one word (its name has a space).  */
      bool is_type = (ISALPHA (tokens[i].name[toklen - 1])
                      && strchr (tokens[i].name, ' '));

      /* Backtrack to the last alphabetic character (for tokens whose
         names end in '%').  */
      if (!is_oper)
        while (!ISALPHA (tokens[i].name[toklen - 1]))
          --toklen;

      /* The note suggesting the alternative is only issued when the
         warning itself was issued.  */
      if (format_warning_substr (format_string_loc, format_string_cst,
                                 fmtchrpos, fmtchrpos + toklen, opt,
                                 (is_type
                                  ? G_("unquoted type name %<%.*s%> in format")
                                  : (is_oper
                                     ? G_("unquoted operator %<%.*s%> in format")
                                     : G_("unquoted keyword %<%.*s%> in format"))),
                                 toklen, format_chars)
          && tokens[i].alt)
        inform (format_string_loc, "use %qs instead", tokens[i].alt);

      return format_chars + toklen - 1;
    }

  /* Diagnose unquoted __attribute__.  Consider any parenthesized
     argument to the attribute to avoid redundant warnings for
     the double parentheses that might follow.  */
  if (startswith (format_chars, "__attribute"))
    {
      unsigned nchars = sizeof "__attribute" - 1;
      /* Skip any trailing underscores.  */
      while ('_' == format_chars[nchars])
        ++nchars;

      /* Advance to the first character that is not a space, if any.  */
      for (int i = nchars; format_chars[i]; ++i)
        if (' ' != format_chars[i])
          {
            nchars = i;
            break;
          }

      if (format_chars[nchars] == '(')
        {
          /* Each opening parenthesis is recorded in BALTOKS and each
             matching closing one seen below removes an entry again.  */
          baltoks.parens.safe_push (format_chars + nchars);

          ++nchars;
          /* Set when a second opening parenthesis follows the first.  */
          bool close = false;
          if (format_chars[nchars] == '(')
            {
              baltoks.parens.safe_push (format_chars + nchars);
              close = true;
              ++nchars;
            }
          /* Extend the sequence through the first closing
             parenthesis.  */
          for (int i = nchars; format_chars[i]; ++i)
            if (')' == format_chars[i])
              {
                if (baltoks.parens.length () > 0)
                  baltoks.parens.pop ();
                nchars = i + 1;
                break;
              }

          if (close && format_chars[nchars] == ')')
            {
              if (baltoks.parens.length () > 0)
                baltoks.parens.pop ();
              ++nchars;
            }
        }

      format_warning_substr (format_string_loc, format_string_cst,
                             fmtchrpos, fmtchrpos + nchars, opt,
                             "unquoted attribute in format");
      return format_chars + nchars - 1;
    }

  /* Diagnose unquoted built-ins.  */
  if (format_chars[0] == '_'
      && format_chars[1] == '_'
      && (startswith (format_chars + 2, "atomic")
          || startswith (format_chars + 2, "builtin")
          || startswith (format_chars + 2, "sync")))
    {
      format_warning_substr (format_string_loc, format_string_cst,
                             fmtchrpos, fmtchrpos + wlen, opt,
                             "unquoted name of built-in function %<%.*s%> "
                             "in format",
                             wlen, format_chars);
      return format_chars + wlen - 1;
    }

  /* Diagnose unquoted substrings of alphanumeric characters
     containing underscores.  They most likely refer to identifiers
     and should be quoted.  There is no early return here: control
     continues to the function's final return statement.  */
  if (underscore)
    format_warning_substr (format_string_loc, format_string_cst,
                           format_chars - orig_format_chars,
                           format_chars + wlen - orig_format_chars,
                           opt,
                           "unquoted identifier or keyword %<%.*s%> in format",
                           wlen, format_chars);
  else
    {
      /* Diagnose some common misspellings.  */
      for (unsigned i = 0; i != ARRAY_SIZE (badwords); ++i)
        {
          /* NOTE(review): strspn yields the length of the leading run
             of ' ' and '-' in the bad word, which is zero for every
             current BADWORDS entry, so the WLEN >= BADWLEN test below
             always holds.  strcspn may have been intended -- confirm.  */
          unsigned badwlen = strspn (badwords[i].name, " -");
          if (wlen >= badwlen
              && (wlen <= badwords[i].len
                  || (wlen == badwords[i].len + 1U
                      && TOUPPER (format_chars[wlen - 1]) == 'S'))
              && !strncasecmp (format_chars, badwords[i].name, badwords[i].len))
            {
              /* Handle singular as well as plural forms of all bad words
                 even though the latter don't necessarily make sense for
                 all of the former (like "can nots").  */
              badwlen = badwords[i].len;
              const char *plural = "";
              if (TOUPPER (format_chars[badwlen]) == 'S')
                {
                  ++badwlen;
                  plural = "s";
                }

              /* As an exception, don't warn about "decl-specifier*" since
                 it's a C++ grammar production.  */
              if (badwords[i].name[0] == 'd'
                  && startswith (format_chars, "decl-specifier"))
                continue;

              /* The quoted text in the message includes the plural 's'
                 (BADWLEN) whereas the underlined range and the return
                 value use the length of the bad word itself.  */
              format_warning_substr (format_string_loc, format_string_cst,
                                     fmtchrpos, fmtchrpos + badwords[i].len,
                                     opt,
                                     "misspelled term %<%.*s%> in format; "
                                     "use %<%s%s%> instead",
                                     badwlen, format_chars,
                                     badwords[i].alt, plural);

              return format_chars + badwords[i].len - 1;
            }
        }

      /* Skip C++/G++.
*/
      if (!strncasecmp (format_chars, "c++", 3)
          || !strncasecmp (format_chars, "g++", 3))
        return format_chars + 2;
    }

  /* Nothing more to report: skip the whole word, or return null when
     FORMAT_CHARS did not start one.  */
  return wlen ? format_chars + wlen - 1 : NULL;
}

/* Check plain text in a format string of a GCC diagnostic function
   for common quoting, punctuation, and spelling mistakes, and issue
   -Wformat-diag warnings if they are found.   FORMAT_STRING_LOC is
   the location of the format string, FORMAT_STRING_CST the format
   string itself (as a tree), ORIG_FORMAT_CHARS and FORMAT_CHARS are
   pointers to the beginning of the format string and the character
   currently being processed, and BALTOKS describes paired "tokens"
   within the format string that are expected to be balanced.
   Returns a pointer to the last processed character.  */

static const char*
check_plain (location_t format_string_loc, tree format_string_cst,
             const char *orig_format_chars, const char *format_chars,
             baltoks_t &baltoks)
{
  /* For brevity.  */
  const int opt = OPT_Wformat_diag;
  /* Zero-based starting position of a problem sequence.  */
  int fmtchrpos = format_chars - orig_format_chars;

  /* At a directive: diagnose two specific patterns and hand the '%'
     back to the caller unconsumed.  */
  if (*format_chars == '%')
    {
      /* Diagnose %<%s%> and suggest using %qs instead.  */
      if (startswith (format_chars, "%<%s%>"))
        format_warning_substr (format_string_loc, format_string_cst,
                               fmtchrpos, fmtchrpos + 6, opt,
                               "quoted %qs directive in format; "
                               "use %qs instead", "%s", "%qs");
      /* Diagnose "can%'t", whose first three letters precede the
         directive.  */
      else if (format_chars - orig_format_chars > 2
               && !strncasecmp (format_chars - 3, "can%'t", 6))
        format_warning_substr (format_string_loc,
                               format_string_cst,
                               fmtchrpos - 3, fmtchrpos + 3, opt,
                               "contraction %<%.*s%> in format; "
                               "use %qs instead",
                               6, format_chars - 3, "cannot");

      return format_chars;
    }

  if (baltoks.quotdirs.length ())
    {
      /* Skip over all plain text within a quoting directive until
         the next directive.  */
      while (*format_chars && '%' != *format_chars)
        ++format_chars;

      return format_chars;
    }

  /* The length of the problem sequence.  */
  int nchars = 0;

  /* Diagnose any whitespace characters other than <space> but only
     leading, trailing, and two or more consecutive <space>s.  Do
     this before diagnosing control characters because whitespace
     is a subset of controls.  */
  const char *other_than_space = NULL;
  while (ISSPACE (format_chars[nchars]))
    {
      /* Remember the first whitespace character that is not a space.  */
      if (format_chars[nchars] != ' ' && !other_than_space)
        other_than_space = format_chars + nchars;
      ++nchars;
    }

  if (nchars)
    {
      /* This is the most common problem: go the extra mile to describe
         the problem in as much helpful detail as possible.  */
      if (other_than_space)
        {
          format_warning_substr (format_string_loc, format_string_cst,
                                 fmtchrpos, fmtchrpos + nchars, opt,
                                 "unquoted whitespace character %qc in format",
                                 *other_than_space);
          return format_chars + nchars - 1;
        }

      if (fmtchrpos == 0)
        /* Accept strings of leading spaces with no warning.  */
        return format_chars + nchars - 1;

      if (!format_chars[nchars])
        {
          format_warning_substr (format_string_loc, format_string_cst,
                                 fmtchrpos, fmtchrpos + nchars, opt,
                                 "spurious trailing space in format");
          return format_chars + nchars - 1;
        }

      if (nchars > 1)
        {
          if (nchars == 2
              && orig_format_chars < format_chars
              && format_chars[-1] == '.'
              && format_chars[0] == ' '
              && format_chars[1] == ' ')
            {
              /* A period followed by two spaces.  */
              if (ISUPPER (*orig_format_chars))
                {
                  /* If the part before the period is a capitalized
                     sentence check to make sure that what follows
                     is also capitalized.  */
                  if (ISLOWER (format_chars[2]))
                    format_warning_substr (format_string_loc, format_string_cst,
                                           fmtchrpos, fmtchrpos + nchars, opt,
                                           "inconsistent capitalization in "
                                           "format");
                }
            }
          else
            format_warning_substr (format_string_loc, format_string_cst,
                                   fmtchrpos, fmtchrpos + nchars, opt,
                                   "unquoted sequence of %i consecutive "
                                   "space characters in format", nchars);
          return format_chars + nchars - 1;
        }

      /* A single interior space is fine: step over it and go on to
         examine the character that follows in this same call.  */
      format_chars += nchars;
      nchars = 0;
    }

  fmtchrpos = format_chars - orig_format_chars;

  /* Diagnose any unquoted control characters other than the terminating
     NUL.  */
  while (format_chars[nchars] && ISCNTRL (format_chars[nchars]))
    ++nchars;

  if (nchars > 1)
    {
      format_warning_substr (format_string_loc, format_string_cst,
                             fmtchrpos, fmtchrpos + nchars, opt,
                             "unquoted control characters in format");
      return format_chars + nchars - 1;
    }
  if (nchars)
    {
      format_warning_substr (format_string_loc, format_string_cst,
                             fmtchrpos, fmtchrpos + nchars, opt,
                             "unquoted control character %qc in format",
                             *format_chars);
      return format_chars + nchars - 1;
    }

  /* Look for operators, first the common C/C++ ones and then (with a
     table length of zero outside of C++) the C++-only ones.  */
  if (ISPUNCT (format_chars[0]))
    {
      size_t nelts = ARRAY_SIZE (c_opers);
      if (const char *ret = check_tokens (c_opers, nelts,
                                          format_string_loc, format_string_cst,
                                          orig_format_chars, format_chars,
                                          baltoks))
        return ret;

      nelts = c_dialect_cxx () ? ARRAY_SIZE (cxx_opers) : 0;
      if (const char *ret = check_tokens (cxx_opers, nelts,
                                          format_string_loc, format_string_cst,
                                          orig_format_chars, format_chars,
                                          baltoks))
        return ret;
    }

  /* Likewise for keywords.
     NOTE(review): for text starting with a letter check_tokens computes
     a nonzero word length and so returns non-null unless one of its
     in-loop "return NULL" exceptions fires; the CXX_KEYWORDS lookup
     below therefore looks reachable only in those rare cases --
     confirm whether C++ keywords are meant to be diagnosed here.  */
  if (ISALPHA (format_chars[0]))
    {
      size_t nelts = ARRAY_SIZE (c_keywords);
      if (const char *ret = check_tokens (c_keywords, nelts,
                                          format_string_loc, format_string_cst,
                                          orig_format_chars, format_chars,
                                          baltoks))
        return ret;

      nelts = c_dialect_cxx () ? ARRAY_SIZE (cxx_keywords) : 0;
      if (const char *ret = check_tokens (cxx_keywords, nelts,
                                          format_string_loc, format_string_cst,
                                          orig_format_chars, format_chars,
                                          baltoks))
        return ret;
    }

  nchars = 0;

  /* Diagnose unquoted options.  An option is a '-' or "--" at the
     start of the string or after a space that is followed by a
     letter.  */
  if  ((format_chars == orig_format_chars
        || format_chars[-1] == ' ')
       && format_chars[0] == '-'
       && ((format_chars[1] == '-'
            && ISALPHA (format_chars[2]))
           || ISALPHA (format_chars[1])))
    {
      nchars = 1;
      while (ISALNUM (format_chars[nchars])
             || '_' == format_chars[nchars]
             || '-' == format_chars[nchars]
             || '+' == format_chars[nchars])
        ++nchars;

      format_warning_substr (format_string_loc, format_string_cst,
                             fmtchrpos, fmtchrpos + nchars, opt,
                             "unquoted option name %<%.*s%> in format",
                             nchars, format_chars);
      return format_chars + nchars - 1;
    }

  /* Diagnose leading, trailing, and two or more consecutive punctuation
     characters.  While scanning the run, opening punctuators are pushed
     onto the matching BALTOKS stack and closing ones pop it; a closing
     punctuator with nothing to pop ends the scan as unbalanced.  */
  const char *unbalanced = NULL;
  while ('%' != format_chars[nchars]
         && ISPUNCT (format_chars[nchars])
         && !unbalanced)
    {
      switch (format_chars[nchars])
        {
        case '[':
          baltoks.brackets.safe_push (format_chars + nchars);
          break;
        case '{':
          baltoks.curly.safe_push (format_chars + nchars);
          break;
        case '(':
          baltoks.parens.safe_push (format_chars + nchars);
          break;
        case '<':
          baltoks.pointy.safe_push (format_chars + nchars);
          break;

        case ']':
          if (baltoks.brackets.length () > 0)
            baltoks.brackets.pop ();
          else
            unbalanced = format_chars + nchars;
          break;
        case '}':
          if (baltoks.curly.length () > 0)
            baltoks.curly.pop ();
          else
            unbalanced = format_chars + nchars;
          break;
        case ')':
          if (baltoks.parens.length () > 0)
            baltoks.parens.pop ();
          else
            unbalanced = format_chars + nchars;
          break;
        case '>':
          if (baltoks.pointy.length () > 0)
            baltoks.pointy.pop ();
          else
            unbalanced = format_chars + nchars;
          break;
        }

      ++nchars;
    }

  if (unbalanced)
    {
      format_warning_substr (format_string_loc, format_string_cst,
                             fmtchrpos, fmtchrpos + nchars, opt,
                             "unbalanced punctuation character %qc in format",
                             *unbalanced);
      return format_chars + nchars - 1;
    }

  if (nchars)
    {
      /* Consider any identifier that follows the pound ('#') sign
         a preprocessing directive.  */
      if (nchars == 1
          && format_chars[0] == '#'
          && ISALPHA (format_chars[1]))
        {
          while (ISALNUM (format_chars[nchars])
                 || format_chars[nchars] == '_')
            ++nchars;

          format_warning_substr (format_string_loc, format_string_cst,
                                 fmtchrpos, fmtchrpos + nchars, opt,
                                 "unquoted preprocessing directive %<%.*s%> "
                                 "in format", nchars, format_chars);
          return format_chars + nchars - 1;
        }

      /* Diagnose a bare single quote.  */
      if (nchars == 1
          && format_chars[0] == '\''
          && format_chars - orig_format_chars
          && ISALPHA (format_chars[-1])
          && ISALPHA (format_chars[1]))
        {
          /* Diagnose a subset of contractions that are best avoided.  */
          for (unsigned i = 0; i != ARRAY_SIZE (contrs); ++i)
            {
              const char *apos = strchr (contrs[i].name, '\'');
              gcc_assert (apos != NULL);
              /* Offset of the apostrophe within the contraction, used
                 to line the table entry up with the text around
                 FORMAT_CHARS.  */
              int off = apos - contrs[i].name;

              if (format_chars - orig_format_chars >= off
                  && !strncmp (format_chars - off,
                               contrs[i].name, contrs[i].len))
                {
                  format_warning_substr (format_string_loc,
                                         format_string_cst,
                                         fmtchrpos, fmtchrpos + nchars, opt,
                                         "contraction %<%.*s%> in format; "
                                         "use %qs instead",
                                         contrs[i].len, contrs[i].name,
                                         contrs[i].alt);
                  return format_chars + nchars - 1;
                }
            }

          if (format_warning_substr (format_string_loc, format_string_cst,
                                     fmtchrpos, fmtchrpos + nchars, opt,
                                     "bare apostrophe %<'%> in format"))
            inform (format_string_loc,
                    "if avoiding the apostrophe is not feasible, enclose "
                    "it in a pair of %qs and %qs directives instead",
                    "%<", "%>");
          return format_chars + nchars - 1;
        }

      /* Diagnose a backtick (grave accent).  */
      if (nchars == 1
          && format_chars[0] == '`')
        {
          if (format_warning_substr (format_string_loc, format_string_cst,
                                     fmtchrpos, fmtchrpos + nchars, opt,
                                     "grave accent %<`%> in format"))
            inform (format_string_loc,
                    "use the apostrophe directive %qs instead", "%'");
          return format_chars + nchars - 1;
        }

      /* Diagnose a punctuation character after a space.  The
         underlined range is the space itself.  */
      if (nchars == 1
          && format_chars - orig_format_chars
          && format_chars[-1] == ' '
          && strspn (format_chars, "!?:;.,") == 1)
        {
          format_warning_substr (format_string_loc, format_string_cst,
                                 fmtchrpos - 1, fmtchrpos, opt,
                                 "space followed by punctuation character "
                                 "%<%c%>", format_chars[0]);
          return format_chars;
        }

      if (nchars == 1)
        {
          if (startswith (format_chars, "\"%s\""))
            {
              if (format_warning_substr (format_string_loc, format_string_cst,
                                         fmtchrpos, fmtchrpos + 4, opt,
                                         "quoted %qs directive in format",
                                         "%s"))
                inform (format_string_loc,
                        "if using %qs is not feasible, "
                        "use %qs instead", "%qs", "\"%-s\"");
            }

          /* Quote characters toggle: the first one records where the
             quote was opened and the next one clears the record.  */
          if (format_chars[0] == '"')
            {
              baltoks.doublequote = baltoks.doublequote ? NULL : format_chars;
              return format_chars + nchars - 1;
            }
          if (format_chars[0] == '\'')
            {
              baltoks.singlequote = baltoks.singlequote ? NULL : format_chars;
              return format_chars + nchars - 1;
            }
        }

      if (fmtchrpos == 0)
        {
          /* Punctuation at the very beginning of the format.  */
          if (nchars == 1
              && format_chars[0] == '(')
            ;   /* Text beginning in an open parenthesis.  */
          else if (nchars == 3
                   && startswith (format_chars, "...")
                   && format_chars[3])
            ;   /* Text beginning in an ellipsis.  */
          else
            {
              format_warning_substr (format_string_loc, format_string_cst,
                                     fmtchrpos, fmtchrpos + nchars, opt,
                                     "spurious leading punctuation sequence "
                                     "%<%.*s%> in format",
                                     nchars, format_chars);
              return format_chars + nchars - 1;
            }
        }
      else if (!format_chars[nchars])
        {
          /* Punctuation at the very end of the format.  */
          if (nchars == 1
              && (format_chars[nchars - 1] == ':'
                  || format_chars[nchars - 1] == ')'))
            ;   /* Text ending in a colon or a closing parenthesis.  */
          else if (nchars == 1
                   && ((ISUPPER (*orig_format_chars)
                        && format_chars[nchars - 1] == '.')
                       || strspn (format_chars + nchars - 1, "?])") == 1))
            ;   /* Capitalized sentence terminated by a single period,
                   or text ending in a question mark, closing bracket,
                   or parenthesis.  */
          else if (nchars == 2
                   && format_chars[0] == '?'
                   && format_chars[1] == ')')
            ;   /* A question mark that closes a parenthetical note.  */
          else if (nchars == 2
                   && format_chars[0] == ')'
                   && (format_chars[1] == '?'
                       || format_chars[1] == ';'
                       || format_chars[1] == ':'
                       || (ISUPPER (*orig_format_chars)
                           && format_chars[1] == '.')))
            ;   /* Closing parenthetical note followed by a question
                   mark, semicolon, or colon at the end of the string,
                   or by a period at the end of a capitalized sentence.  */
          else if (nchars == 3
                   && format_chars - orig_format_chars > 0
                   && startswith (format_chars, "..."))
            ;   /* Text ending in the ellipsis.  */
          else
            format_warning_substr (format_string_loc, format_string_cst,
                                   fmtchrpos, fmtchrpos + nchars, opt,
                                   "spurious trailing punctuation sequence "
                                   "%<%.*s%> in format",
                                   nchars, format_chars);

          return format_chars + nchars - 1;
        }
      else if (nchars == 2
               && format_chars[0] == ')'
               && (format_chars[1] == ':'
                   || format_chars[1] == ';'
                   || format_chars[1] == ',')
               && format_chars[2] == ' ')
        ;   /* Closing parenthetical note followed by a colon, semicolon
               or a comma followed by a space in the middle of the string.  */
      else if (nchars > 1)
        format_warning_substr (format_string_loc, format_string_cst,
                               fmtchrpos, fmtchrpos + nchars, opt,
                               "unquoted sequence of %i consecutive "
                               "punctuation characters %q.*s in format",
                               nchars, nchars, format_chars);
      return format_chars + nchars - 1;
    }

  nchars = 0;

  /* Finally, diagnose any unquoted non-graph, non-punctuation characters
     other than the terminating NUL.  */
  while (format_chars[nchars]
         && '%' != format_chars[nchars]
         && !ISPUNCT (format_chars[nchars])
         && !ISGRAPH (format_chars[nchars]))
    ++nchars;

  if (nchars > 1)
    {
      format_warning_substr (format_string_loc, format_string_cst,
                             fmtchrpos, fmtchrpos + nchars, opt,
                             "unquoted non-graph characters in format");
      return format_chars + nchars - 1;
    }
  if (nchars)
    {
      format_warning_substr (format_string_loc, format_string_cst,
                             fmtchrpos, fmtchrpos + nchars, opt,
                             "unquoted non-graph character %qc in format",
                             *format_chars);
      return format_chars + nchars - 1;
    }

  /* Nothing to diagnose at this character.  */
  return format_chars;
}

/* Diagnose unbalanced tokens described by BALTOKS in format string
   ORIG_FORMAT_CHARS and the corresponding FORMAT_STRING_CST.
*/

static void
maybe_diag_unbalanced_tokens (location_t format_string_loc,
                              const char *orig_format_chars,
                              tree format_string_cst,
                              baltoks_t &baltoks)
{
  /* Pick the most recently opened punctuator from the first non-empty
     stack, trying brackets, braces, parentheses and angle brackets in
     that order.  At most one of them is reported.  */
  const char *unbalanced
    = (baltoks.brackets.length () ? baltoks.brackets.pop ()
       : baltoks.curly.length () ? baltoks.curly.pop ()
       : baltoks.parens.length () ? baltoks.parens.pop ()
       : baltoks.pointy.length () ? baltoks.pointy.pop ()
       : NULL);

  if (unbalanced)
    {
      /* format_warning_at_char takes a one-based character index.  */
      const int char_idx = unbalanced - orig_format_chars + 1;
      format_warning_at_char (format_string_loc, format_string_cst,
                              char_idx, OPT_Wformat_diag,
                              "unbalanced punctuation character %<%c%> in format",
                              *unbalanced);
    }

  /* A quoting directive that was opened but never closed.  The saved
     pointer is used as is, without the adjustment applied above.  */
  if (baltoks.quotdirs.length ())
    {
      const char *open_dir = baltoks.quotdirs.pop ();
      format_warning_at_char (format_string_loc, format_string_cst,
                              open_dir - orig_format_chars,
                              OPT_Wformat_, "unterminated quoting directive");
    }

  /* An unterminated quote character; a single quote takes precedence
     over a double quote.  */
  const char *quote = baltoks.singlequote;
  if (!quote)
    quote = baltoks.doublequote;

  if (quote)
    {
      const int char_idx = quote - orig_format_chars + 1;
      format_warning_at_char (format_string_loc, format_string_cst,
                              char_idx, OPT_Wformat_diag,
                              "unterminated quote character %<%c%> in format",
                              *quote);
    }
}

/* Do the main part of checking a call to a format function.  FORMAT_CHARS
   is the NUL-terminated format string (which at this point may contain
   internal NUL characters); FORMAT_LENGTH is its length (excluding the
   terminating NUL character).  ARG_NUM is one less than the number of
   the first format argument to check; PARAMS points to that format
   argument in the list of arguments.
*/

/* The function walks FORMAT_CHARS one directive at a time.  It returns
   early, without the end-of-string checks, when one of the
   ARGUMENT_PARSER steps reports failure.
   NOTE(review): `object_allocator &' and `vec *' below carry no template
   arguments in this copy of the file; presumably they were lost when
   the text was extracted -- confirm against the callers.  */

static void
check_format_info_main (format_check_results *res,
                        function_format_info *info, const char *format_chars,
                        location_t fmt_param_loc, tree format_string_cst,
                        int format_length, tree params,
                        unsigned HOST_WIDE_INT arg_num,
                        object_allocator  &fwt_pool,
                        vec *arglocs,
                        bool (*comp_types) (tree, tree))
{
  const char * const orig_format_chars = format_chars;
  const tree first_fillin_param = params;

  const format_kind_info * const fki = &format_types[info->format_type];
  const format_flag_spec * const flag_specs = fki->flag_specs;
  const location_t format_string_loc = res->format_string_loc;

  /* -1 if no conversions taking an operand have been found; 0 if one has
     and it didn't use $; 1 if $ formats are in use.  */
  int has_operand_number = -1;

  /* Vectors of pointers to opening quoting directives (like GCC "%<"),
     opening braces, brackets, and parentheses.  Used to detect unbalanced
     tokens.  */
  baltoks_t baltoks;

  /* Pointers to the most recent color directives (like GCC's "%r" or
     "%R").  A starting color directive must be terminated before the end
     of the format string.  A terminating directive makes no sense without
     a prior starting directive.  */
  const char *color_begin = NULL;
  const char *color_end = NULL;

  init_dollar_format_checking (info->first_arg_num, first_fillin_param);

  /* In GCC diagnostic functions check plain directives (substrings within
     the format string that don't start with %) for quoting and punctuation
     problems.  */
  bool ck_plain = (!info->is_raw
                   && (info->format_type == gcc_diag_format_type
                       || info->format_type == gcc_tdiag_format_type
                       || info->format_type == gcc_cdiag_format_type
                       || info->format_type == gcc_cxxdiag_format_type));

  while (*format_chars != 0)
    {
      /* check_plain returns the last character it processed; the
         post-increment below steps past it.  */
      if (ck_plain)
        format_chars = check_plain (format_string_loc,
                                    format_string_cst,
                                    orig_format_chars, format_chars,
                                    baltoks);

      /* Anything other than a '%' is plain text: move on.  */
      if (*format_chars == 0 || *format_chars++ != '%')
        continue;

      if (*format_chars == 0)
        {
          format_warning_at_char (format_string_loc, format_string_cst,
                                  format_chars - orig_format_chars,
                                  OPT_Wformat_,
                                  "spurious trailing %<%%%> in format");
          continue;
        }
      /* "%%" is consumed here and needs no further checking.  */
      if (*format_chars == '%')
        {
          ++format_chars;
          continue;
        }

      /* ARGUMENT_PARSER ctor takes FORMAT_CHARS by reference and calls
         to ARG_PARSER members may modify the variable.  */
      flag_chars_t flag_chars;
      argument_parser arg_parser (info, format_chars, format_string_cst,
                                  orig_format_chars, format_string_loc,
                                  flag_chars, has_operand_number,
                                  first_fillin_param, fwt_pool, arglocs,
                                  comp_types);

      if (!arg_parser.read_any_dollar ())
        return;

      if (!arg_parser.read_format_flags ())
        return;

      /* Read any format width, possibly * or *m$.  */
      if (!arg_parser.read_any_format_width (params, arg_num))
        return;

      /* Read any format left precision (must be a number, not *).  */
      arg_parser.read_any_format_left_precision ();

      /* Read any format precision, possibly * or *m$.  */
      if (!arg_parser.read_any_format_precision (params, arg_num))
        return;

      /* Position after the flags, width and precision; passed on to
         check_argument_type below.  */
      const char *format_start = format_chars;

      arg_parser.handle_alloc_chars ();

      /* The rest of the conversion specification is the length modifier
         (if any), and the conversion specifier, so this is where the
         type information starts.  If we need to issue a suggestion
         about a type mismatch, then we should preserve everything up
         to here.  */
      const char *type_start = format_chars;

      /* Read any length modifier, if this kind of format has them.  */
      const length_modifier len_modifier
        = arg_parser.read_any_length_modifier ();

      /* Read any modifier (strftime E/O).  */
      arg_parser.read_any_other_modifier ();

      char format_char = *format_chars;
      if (format_char == 0
          || (!(fki->flags & (int) FMT_FLAG_FANCY_PERCENT_OK)
              && format_char == '%'))
        {
          format_warning_at_char (format_string_loc, format_string_cst,
                                  format_chars - orig_format_chars,
                                  OPT_Wformat_,
                                  "conversion lacks type at end of format");
          continue;
        }
      format_chars++;

      const format_char_info * const fci
        = arg_parser.find_format_char_info (format_char);
      if (!fci)
        continue;

      flag_chars.validate (fki, fci, flag_specs, format_chars,
                           format_string_cst,
                           format_string_loc, orig_format_chars, format_char,
                           baltoks.quotdirs.length () > 0);

      const int alloc_flag = flag_chars.get_alloc_flag (fki);
      const bool suppressed = flag_chars.assignment_suppression_p (fki);

      /* Diagnose nested or unmatched quoting directives such as GCC's
         "%<...%<" and "%>...%>".  A directive whose FLAGS2 contains both
         '<' and '>' neither opens nor closes a quoted sequence.  */
      bool quot_begin_p = strchr (fci->flags2, '<');
      bool quot_end_p = strchr (fci->flags2, '>');

      if (quot_begin_p && !quot_end_p)
        {
          if (baltoks.quotdirs.length ())
            format_warning_at_char (format_string_loc, format_string_cst,
                                    format_chars - orig_format_chars,
                                    OPT_Wformat_,
                                    "nested quoting directive");
          baltoks.quotdirs.safe_push (format_chars);
        }
      else if (!quot_begin_p && quot_end_p)
        {
          if (baltoks.quotdirs.length ())
            baltoks.quotdirs.pop ();
          else
            format_warning_at_char (format_string_loc, format_string_cst,
                                    format_chars - orig_format_chars,
                                    OPT_Wformat_,
                                    "unmatched quoting directive");
        }

      /* In FLAGS2 a '/' marks a directive that starts a color and a
         '\\' one that resets it.  */
      bool color_begin_p = strchr (fci->flags2, '/');
      if (color_begin_p)
        {
          color_begin = format_chars;
          color_end = NULL;
        }
      else if (strchr (fci->flags2, '\\'))
        {
          /* NOTE(review): "occurence" in the message below is spelled
             with a single 'r'; it is left alone here because it is part
             of the diagnostic text.  */
          if (color_end)
            format_warning_at_char (format_string_loc, format_string_cst,
                                    format_chars - orig_format_chars,
                                    OPT_Wformat_,
                                    "%qc directive redundant after prior "
                                    "occurence of the same", format_char);
          else if (!color_begin)
            format_warning_at_char (format_string_loc, format_string_cst,
                                    format_chars - orig_format_chars,
                                    OPT_Wformat_,
                                    "unmatched color reset directive");
          color_end = format_chars;
        }

      /* Diagnose directives that shouldn't appear in a quoted sequence.
         (They are denoted by a double quote in FLAGS2.)  */
      if (baltoks.quotdirs.length ())
        {
          if (strchr (fci->flags2, '"'))
            format_warning_at_char (format_string_loc, format_string_cst,
                                    format_chars - orig_format_chars,
                                    OPT_Wformat_,
                                    "%qc conversion used within a quoted "
                                    "sequence",
                                    format_char);
        }

      /* Validate the pairs of flags used.  */
      arg_parser.validate_flag_pairs (fci, format_char);

      arg_parser.give_y2k_warnings (fci, format_char);

      arg_parser.parse_any_scan_set (fci);

      tree wanted_type = NULL;
      const char *wanted_type_name = NULL;

      if (!arg_parser.handle_conversions (fci, len_modifier,
                                          wanted_type, wanted_type_name,
                                          arg_num,
                                          params,
                                          format_char))
        continue;

      arg_parser.main_wanted_type.next = NULL;

      /* Finally. . .check type of argument against desired type!  */
      if (!arg_parser.check_argument_type (fci, len_modifier,
                                           wanted_type, wanted_type_name,
                                           suppressed,
                                           arg_num, params,
                                           alloc_flag,
                                           format_start, type_start,
                                           fmt_param_loc,
                                           format_char))
        return;
    }

  /* The loop stops at the first NUL; stopping short of FORMAT_LENGTH
     means the format contains an embedded NUL.  */
  if (format_chars - orig_format_chars != format_length)
    format_warning_at_char (format_string_loc, format_string_cst,
                            format_chars + 1 - orig_format_chars,
                            OPT_Wformat_contains_nul,
                            "embedded %<\\0%> in format");
  /* Arguments remain although the format is exhausted: recategorize
     the result in RES.  */
  if (info->first_arg_num != 0 && params != 0
      && has_operand_number <= 0)
    {
      res->number_other--;
      res->number_extra_args++;
    }
  if (has_operand_number > 0)
    finish_dollar_format_checking (res, fki->flags & (int) FMT_FLAG_DOLLAR_GAP_POINTER_OK);

  maybe_diag_unbalanced_tokens (format_string_loc, orig_format_chars,
                                format_string_cst, baltoks);

  if (color_begin && !color_end)
    format_warning_at_char (format_string_loc, format_string_cst,
                            color_begin - orig_format_chars,
                            OPT_Wformat_, "unterminated color directive");
}

/* Special-case to support inheritance for %e.
   Return true for the case where we have %e with a valid
   pointer to a pp_element or pp_element subclass; false
   otherwise.
*/

static bool
handle_subclass_of_pp_element_p (format_wanted_type *types,
                                 bool (*comp_types) (tree, tree))
{
  /* Only conversions that want a pointer to pp_element qualify.  */
  if (types->wanted_type != local_pp_element_ptr_node)
    return false;

  /* check_format_types calls this helper before it checks for a missing
     argument, so TYPES->PARAM may be null here.  Decline in that case
     and let the caller issue its usual diagnostic instead of applying
     TREE_TYPE to a null tree.  */
  if (!types->param)
    return false;

  tree param_type = TREE_TYPE (types->param);
  if (param_type == error_mark_node)
    return false;

  /* COMP_TYPES decides whether the argument's type is acceptable for
     the wanted pointer type.  */
  return comp_types (types->wanted_type, param_type);
}

/* Check the argument types from a single format conversion (possibly
   including width and precision arguments).

   FMT_LOC is the location of the format conversion.

   TYPES is a singly-linked list expressing the parts of the format
   conversion that expect argument types, and the arguments they
   correspond to.

   OFFSET_TO_TYPE_START is the offset within the execution-charset encoded
   format string to where type information begins for the conversion
   (the length modifier and conversion specifier).

   CONVERSION_CHAR is the user-provided conversion specifier.

   For example, given:

     sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5);

   then FMT_LOC covers this range:

     sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5);
                         ^^^^^^^^^

   and TYPES in this case is a three-entry singly-linked list consisting of:
   (1) the check for the field width here:
         sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5);
                                ^              ^^^^
       against arg3, and
   (2) the check for the field precision here:
         sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5);
                                 ^^                  ^^^^
       against arg4, and
   (3) the check for the length modifier and conversion char here:
         sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5);
                                   ^^^                     ^^^^
       against arg5.

   OFFSET_TO_TYPE_START is 13, the offset to the "lld" within the
   STRING_CST:

                  0000000000111111111122
                  0123456789012345678901
     sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5);
                               ^ ^
                               | ` CONVERSION_CHAR: 'd'
                               type starts here.
*/

/* COMP_TYPES is only handed on to handle_subclass_of_pp_element_p.
   ARGLOCS, when non-null, supplies argument locations for parameters
   that carry no location of their own.
   NOTE(review): `vec *' below carries no template argument in this copy
   of the file; presumably it was lost when the text was extracted --
   confirm against the callers.  */

static void
check_format_types (const substring_loc &fmt_loc,
                    format_wanted_type *types, const format_kind_info *fki,
                    int offset_to_type_start,
                    char conversion_char,
                    vec *arglocs,
                    bool (*comp_types) (tree, tree))
{
  for (; types != 0; types = types->next)
    {
      tree cur_param;
      tree cur_type;
      tree orig_cur_type;
      tree wanted_type;
      int arg_num;
      int i;
      int char_type_flag;

      wanted_type = types->wanted_type;
      arg_num = types->arg_num;

      /* The following should not occur here.  */
      gcc_assert (wanted_type);
      gcc_assert (wanted_type != void_type_node || types->pointer_count);

      /* A value passed directly (not through a pointer) is compared
         against the promoted form of the wanted type.  */
      if (types->pointer_count == 0)
        wanted_type = lang_hooks.types.type_promotes_to (wanted_type);

      if (handle_subclass_of_pp_element_p (types, comp_types))
        continue;

      wanted_type = TYPE_MAIN_VARIANT (wanted_type);

      cur_param = types->param;
      if (!cur_param)
        {
          /* No argument to check: report the mismatch with no argument
             type and no argument location.  */
          format_type_warning (fmt_loc, UNKNOWN_LOCATION, types, wanted_type,
                               NULL, fki, offset_to_type_start,
                               conversion_char);
          continue;
        }

      cur_type = TREE_TYPE (cur_param);
      if (cur_type == error_mark_node)
        continue;
      /* Keep the unstripped type for use in diagnostics.  */
      orig_cur_type = cur_type;
      char_type_flag = 0;

      location_t param_loc = UNKNOWN_LOCATION;
      if (EXPR_HAS_LOCATION (cur_param))
        param_loc = EXPR_LOCATION (cur_param);
      else if (arglocs)
        {
          /* arg_num is 1-based.  */
          gcc_assert (types->arg_num > 0);
          param_loc = (*arglocs)[types->arg_num - 1];
        }

      STRIP_NOPS (cur_param);

      /* Check the types of any additional pointer arguments
         that precede the "real" argument.  */
      for (i = 0; i < types->pointer_count; ++i)
        {
          if (TREE_CODE (cur_type) == POINTER_TYPE)
            {
              cur_type = TREE_TYPE (cur_type);
              if (cur_type == error_mark_node)
                break;

              /* Check for writing through a NULL pointer.  */
              if (types->writing_in_flag
                  && i == 0
                  && cur_param != 0
                  && integer_zerop (cur_param))
                warning (OPT_Wformat_, "writing through null pointer "
                         "(argument %d)", arg_num);

              /* Check for reading through a NULL pointer.  Ignore
                 printf-family of functions as they are checked for
                 null arguments by the middle-end.  */
              if (fki->conversion_specs != print_char_table
                  && types->reading_from_flag
                  && i == 0
                  && cur_param != 0
                  && integer_zerop (cur_param))
                warning (OPT_Wformat_, "reading through null pointer "
                         "(argument %d)", arg_num);

              /* Follow the argument expression through one level of
                 address-of, or forget it when that is not possible.  */
              if (cur_param != 0 && TREE_CODE (cur_param) == ADDR_EXPR)
                cur_param = TREE_OPERAND (cur_param, 0);
              else
                cur_param = 0;

              /* See if this is an attempt to write into a const type with
                 scanf or with printf "%n".  Note: the writing in happens
                 at the first indirection only, if for example
                 void * const * is passed to scanf %p; passing
                 const void ** is simply passing an incompatible type.  */
              if (types->writing_in_flag
                  && i == 0
                  && (TYPE_READONLY (cur_type)
                      || (cur_param != 0
                          && (CONSTANT_CLASS_P (cur_param)
                              || (DECL_P (cur_param)
                                  && TREE_READONLY (cur_param))))))
                warning (OPT_Wformat_, "writing into constant object "
                         "(argument %d)", arg_num);

              /* If there are extra type qualifiers beyond the first
                 indirection, then this makes the types technically
                 incompatible.  */
              if (i > 0
                  && pedantic
                  && (TYPE_READONLY (cur_type)
                      || TYPE_VOLATILE (cur_type)
                      || TYPE_ATOMIC (cur_type)
                      || TYPE_RESTRICT (cur_type)))
                warning (OPT_Wformat_, "extra type qualifiers in format "
                         "argument (argument %d)",
                         arg_num);

            }
          else
            {
              /* The argument has fewer levels of indirection than the
                 conversion wants.  */
              format_type_warning (fmt_loc, param_loc,
                                   types, wanted_type, orig_cur_type, fki,
                                   offset_to_type_start, conversion_char);
              break;
            }
        }

      /* The loop above stopped early: either the error was already
         reported or an erroneous type was found.  */
      if (i < types->pointer_count)
        continue;

      cur_type = TYPE_MAIN_VARIANT (cur_type);

      /* Check whether the argument type is a character type.  This leniency
         only applies to certain formats, flagged with 'c'.  */
      if (types->char_lenient_flag)
        char_type_flag = (cur_type == char_type_node
                          || cur_type == signed_char_type_node
                          || cur_type == unsigned_char_type_node);

      /* Check the type of the "real" argument, if there's a type we want.  */
      if (lang_hooks.types_compatible_p (wanted_type, cur_type))
        continue;
      /* If we want 'void *', allow any pointer type.
         (Anything else would already have got a warning.)
         With -Wpedantic, only allow pointers to void and to character
         types.  */
      if (wanted_type == void_type_node
          && (!pedantic || (i == 1 && char_type_flag)))
        continue;
      /* Don't warn about differences merely in signedness, unless
         -Wpedantic.  With -Wpedantic, warn if the type is a pointer
         target and not a character type, and for character types at
         a second level of indirection.  */
      if (TREE_CODE (wanted_type) == INTEGER_TYPE
          && TREE_CODE (cur_type) == INTEGER_TYPE
          && ((!pedantic && !warn_format_signedness)
              || (i == 0 && !warn_format_signedness)
              || (i == 1 && char_type_flag))
          && (TYPE_UNSIGNED (wanted_type)
              ? wanted_type == c_common_unsigned_type (cur_type)
              : wanted_type == c_common_signed_type (cur_type)))
        continue;
      /* Don't warn about differences merely in signedness if we know
         that the current type is integer-promoted and its original type
         was unsigned such as that it is in the range of WANTED_TYPE.  */
      if (TREE_CODE (wanted_type) == INTEGER_TYPE
          && TREE_CODE (cur_type) == INTEGER_TYPE
          && warn_format_signedness
          && TYPE_UNSIGNED (wanted_type)
          && cur_param != NULL_TREE
          && TREE_CODE (cur_param) == NOP_EXPR)
        {
          tree t = TREE_TYPE (TREE_OPERAND (cur_param, 0));
          if (TYPE_UNSIGNED (t)
              && cur_type == lang_hooks.types.type_promotes_to (t))
            continue;
        }
      /* Likewise, "signed char", "unsigned char" and "char" are
         equivalent but the above test won't consider them equivalent.  */
      if (wanted_type == char_type_node
          && (!pedantic || i < 2)
          && char_type_flag)
        continue;
      /* Conversions flagged as scalar-identity accept any argument of
         the same tree code (or any integral type for an integral wanted
         type) that has the same precision.  */
      if (types->scalar_identity_flag
          && (TREE_CODE (cur_type) == TREE_CODE (wanted_type)
              || (INTEGRAL_TYPE_P (cur_type)
                  && INTEGRAL_TYPE_P (wanted_type)))
          && TYPE_PRECISION (cur_type) == TYPE_PRECISION (wanted_type))
        continue;
      /* Now we have a type mismatch.  */
      format_type_warning (fmt_loc, param_loc, types,
                           wanted_type, orig_cur_type, fki,
                           offset_to_type_start, conversion_char);
    }
}

/* Given type TYPE, attempt to dereference the type N times
   (e.g.
from ("int ***", 2) to "int *") Return the derefenced type, with any qualifiers such as "const" stripped from the result, or NULL if unsuccessful (e.g. TYPE is not a pointer type). */ static tree deref_n_times (tree type, int n) { gcc_assert (type); for (int i = n; i > 0; i--) { if (TREE_CODE (type) != POINTER_TYPE) return NULL_TREE; type = TREE_TYPE (type); } /* Strip off any "const" etc. */ return build_qualified_type (type, 0); } /* Lookup the format code for FORMAT_LEN within FLI, returning the string code for expressing it, or NULL if it is not found. */ static const char * get_modifier_for_format_len (const format_length_info *fli, enum format_lengths format_len) { for (; fli->name; fli++) { if (fli->index == format_len) return fli->name; if (fli->double_index == format_len) return fli->double_name; } return NULL; } #if CHECKING_P namespace selftest { static void test_get_modifier_for_format_len () { ASSERT_STREQ ("h", get_modifier_for_format_len (printf_length_specs, FMT_LEN_h)); ASSERT_STREQ ("hh", get_modifier_for_format_len (printf_length_specs, FMT_LEN_hh)); ASSERT_STREQ ("L", get_modifier_for_format_len (printf_length_specs, FMT_LEN_L)); ASSERT_EQ (NULL, get_modifier_for_format_len (printf_length_specs, FMT_LEN_none)); } } // namespace selftest #endif /* CHECKING_P */ /* Determine if SPEC_TYPE and ARG_TYPE are sufficiently similar for a format_type_detail using SPEC_TYPE to be offered as a suggestion for Wformat type errors where the argument has type ARG_TYPE. */ static bool matching_type_p (tree spec_type, tree arg_type) { gcc_assert (spec_type); gcc_assert (arg_type); /* If any of the types requires structural equality, we can't compare their canonical types. */ if (TYPE_STRUCTURAL_EQUALITY_P (spec_type) || TYPE_STRUCTURAL_EQUALITY_P (arg_type)) return false; spec_type = TYPE_CANONICAL (spec_type); arg_type = TYPE_CANONICAL (arg_type); if (TREE_CODE (spec_type) == INTEGER_TYPE && TREE_CODE (arg_type) == INTEGER_TYPE && (TYPE_UNSIGNED (spec_type) ? 
spec_type == c_common_unsigned_type (arg_type) : spec_type == c_common_signed_type (arg_type))) return true; return spec_type == arg_type; } /* Subroutine of get_format_for_type. Generate a string containing the length modifier and conversion specifier that should be used to format arguments of type ARG_TYPE within FKI (effectively the inverse of the checking code). If CONVERSION_CHAR is not zero (the first pass), the resulting suggestion is required to use it, for correcting bogus length modifiers. If CONVERSION_CHAR is zero (the second pass), then allow any suggestion that matches ARG_TYPE. If successful, returns a non-NULL string which should be freed by the caller. Otherwise, returns NULL. */ static char * get_format_for_type_1 (const format_kind_info *fki, tree arg_type, char conversion_char) { gcc_assert (arg_type); const format_char_info *spec; for (spec = &fki->conversion_specs[0]; spec->format_chars; spec++) { if (conversion_char) if (!strchr (spec->format_chars, conversion_char)) continue; tree effective_arg_type = deref_n_times (arg_type, spec->pointer_count); if (!effective_arg_type) continue; for (int i = 0; i < FMT_LEN_MAX; i++) { const format_type_detail *ftd = &spec->types[i]; if (!ftd->type || *ftd->type == NULL_TREE) continue; if (matching_type_p (*ftd->type, effective_arg_type)) { const char *len_modifier = get_modifier_for_format_len (fki->length_char_specs, (enum format_lengths)i); if (!len_modifier) len_modifier = ""; if (conversion_char) /* We found a match, using the given conversion char - the length modifier was incorrect (or absent). Provide a suggestion using the conversion char with the correct length modifier for the type. */ return xasprintf ("%s%c", len_modifier, conversion_char); else /* 2nd pass: no match was possible using the user-provided conversion char, but we do have a match without using it. Provide a suggestion using the first conversion char listed for the given type. 
*/ return xasprintf ("%s%c", len_modifier, spec->format_chars[0]); } } } return NULL; } /* Generate a string containing the length modifier and conversion specifier that should be used to format arguments of type ARG_TYPE within FKI (effectively the inverse of the checking code). If successful, returns a non-NULL string which should be freed by the caller. Otherwise, returns NULL. */ static char * get_format_for_type (const format_kind_info *fki, tree arg_type, char conversion_char) { gcc_assert (arg_type); gcc_assert (conversion_char); /* First pass: look for a format_char_info containing CONVERSION_CHAR If we find one, then presumably the length modifier was incorrect (or absent). */ char *result = get_format_for_type_1 (fki, arg_type, conversion_char); if (result) return result; /* Second pass: we didn't find a match for CONVERSION_CHAR, so try matching just on the type. */ return get_format_for_type_1 (fki, arg_type, '\0'); } /* Attempt to get a string for use as a replacement fix-it hint for the source range in FMT_LOC. Preserve all of the text within the range of FMT_LOC up to OFFSET_TO_TYPE_START, replacing the rest with an appropriate length modifier and conversion specifier for ARG_TYPE, attempting to keep the user-provided CONVERSION_CHAR if possible. For example, given a long vs long long mismatch for arg5 here: 000000000111111111122222222223333333333| 123456789012345678901234567890123456789` column numbers 0000000000111111111122| 0123456789012345678901` string offsets V~~~~~~~~ : range of FMT_LOC, from cols 23-31 sprintf (d, "before %-+*.*lld after", arg3, arg4, arg5); ^ ^ | ` CONVERSION_CHAR: 'd' type starts here where OFFSET_TO_TYPE_START is 13 (the offset to the "lld" within the STRING_CST), where the user provided: %-+*.*lld the result (assuming "long" argument 5) should be: %-+*.*ld If successful, returns a non-NULL string which should be freed by the caller. Otherwise, returns NULL. 
*/

static char *
get_corrected_substring (const substring_loc &fmt_loc,
                         format_wanted_type *type, tree arg_type,
                         const format_kind_info *fki,
                         int offset_to_type_start, char conversion_char)
{
  /* Hints are only offered for argument types of real conversions, not
     for field widths and precisions.  */
  if (!arg_type || type->kind != CF_KIND_FORMAT)
    return NULL;

  /* Find the location of the type part of the conversion (including any
     length modifiers) by moving the caret of a copy of FMT_LOC there.  */
  substring_loc spec_loc (fmt_loc);
  spec_loc.set_caret_index (offset_to_type_start);
  location_t spec_location;
  if (spec_loc.get_location (&spec_location))
    return NULL;

  const source_range spec_range
    = get_range_from_loc (line_table, spec_location);
  const expanded_location caret_xloc
    = expand_location_to_spelling_point (spec_location);
  const expanded_location start_xloc
    = expand_location_to_spelling_point (spec_range.m_start);
  const expanded_location finish_xloc
    = expand_location_to_spelling_point (spec_range.m_finish);

  /* Reject awkward cases: the start, caret and finish must all be in one
     file, on one line, and ordered start <= caret <= finish.  */
  const bool one_file = (caret_xloc.file == start_xloc.file
                         && start_xloc.file == finish_xloc.file);
  const bool one_line = (caret_xloc.line == start_xloc.line
                         && start_xloc.line == finish_xloc.line);
  const bool in_order = (start_xloc.column <= caret_xloc.column
                         && start_xloc.column <= finish_xloc.column
                         && caret_xloc.column <= finish_xloc.column);
  if (!one_file || !one_line || !in_order)
    return NULL;

  char_span src_line
    = global_dc->get_file_cache ().get_source_line (start_xloc.file,
                                                    start_xloc.line);
  if (!src_line)
    return NULL;

  /* Copy the part of the conversion specification that precedes the
     length modifier.  In the above example, this would be "%-+*.*".  */
  const int prefix_len = caret_xloc.column - start_xloc.column;
  char *prefix
    = src_line.subspan (start_xloc.column - 1, prefix_len).xstrdup ();

  /* Ask for the length modifier and conversion char matching ARG_TYPE
     (in the above example, "ld"); on success the suggestion for the whole
     range is the concatenation of the two (here "%-+*.*ld").  */
  char *type_part = get_format_for_type (fki, arg_type, conversion_char);
  char *suggestion = NULL;
  if (type_part)
    suggestion = concat (prefix, type_part, NULL);

  free (type_part);
  free (prefix);
  return suggestion;
}

/* Helper class for adding zero or more trailing '*' to types.

   The format type and name exclude any '*' for pointers, so those
   must be formatted manually.  For all the types we currently have,
   this is adequate, but formats taking pointers to functions or
   arrays would require the full type to be built up in order to
   print it with %T.  */

class indirection_suffix
{
 public:
  indirection_suffix (int pointer_count) : m_pointer_count (pointer_count) {}

  /* Size of the buffer fill_buffer needs: one byte per '*', plus one for
     the optional leading space and one for the NUL-terminator.  */
  size_t get_buffer_size () const
  {
    return m_pointer_count + 2;
  }

  /* Write the suffix to DST and NUL-terminate it.  Nothing but the
     terminator is written when there is no indirection; otherwise the
     '*'s are preceded by a space unless the dialect is C++.  */
  void fill_buffer (char *dst) const
  {
    char *out = dst;
    if (m_pointer_count != 0)
      {
        if (!c_dialect_cxx ())
          *out++ = ' ';
        memset (out, '*', m_pointer_count);
        out += m_pointer_count;
      }
    *out = 0;
  }

 private:
  int m_pointer_count;
};

/* Subclass of range_label for labelling the range in the format string
   with the type in question, adding trailing '*' for pointer_count.
*/ class range_label_for_format_type_mismatch : public range_label_for_type_mismatch { public: range_label_for_format_type_mismatch (tree labelled_type, tree other_type, int pointer_count) : range_label_for_type_mismatch (labelled_type, other_type), m_pointer_count (pointer_count) { } label_text get_text (unsigned range_idx) const final override { label_text text = range_label_for_type_mismatch::get_text (range_idx); if (text.get () == NULL) return text; indirection_suffix suffix (m_pointer_count); char *p = (char *) alloca (suffix.get_buffer_size ()); suffix.fill_buffer (p); char *result = concat (text.get (), p, NULL); return label_text::take (result); } private: int m_pointer_count; }; /* Subclass of pp_element for text describing part of a format string. */ class element_format_substring : public pp_element { public: element_format_substring (const char *highlight_color, const char *prefix, int format_length, const char *format_start) : m_highlight_color (highlight_color), m_prefix (prefix), m_format_length (format_length), m_format_start (format_start) { } void add_to_phase_2 (pp_markup::context &ctxt) final override { ctxt.begin_quote (); ctxt.begin_highlight_color (m_highlight_color); pp_string (&ctxt.m_pp, m_prefix); pp_string_n (&ctxt.m_pp, m_format_start, m_format_length); ctxt.end_highlight_color (); ctxt.end_quote (); } private: const char *m_highlight_color; const char *m_prefix; int m_format_length; const char *m_format_start; }; /* Subclass of pp_element for text describing an optional WANTED_TYPE_NAME with a fallback TYPE, part of an expected type with some number of indirections. 
*/ class element_expected_type_with_indirection : public pp_markup::element_expected_type { public: element_expected_type_with_indirection (tree wanted_type, const char *wanted_type_name, int pointer_count) : pp_markup::element_expected_type (wanted_type), m_wanted_type_name (wanted_type_name), m_pointer_count (pointer_count) { // m_wanted_type_name can be nullptr } void add_to_phase_2 (pp_markup::context &ctxt) final override { indirection_suffix suffix (m_pointer_count); char *indirection_buf = (char *) alloca (suffix.get_buffer_size ()); suffix.fill_buffer (indirection_buf); ctxt.begin_quote (); ctxt.begin_highlight_color (highlight_colors::expected); if (m_wanted_type_name) pp_string (&ctxt.m_pp, m_wanted_type_name); else { /* Any trailing quotes should be printed within the quoted. */ ctxt.m_quoted = false; print_type (ctxt); ctxt.m_quoted = true; } pp_string (&ctxt.m_pp, indirection_buf); ctxt.end_highlight_color (); ctxt.end_quote (); } private: const char *m_wanted_type_name; tree m_wanted_type; int m_pointer_count; }; /* Give a warning about a format argument of different type from that expected. The range of the diagnostic is taken from WHOLE_FMT_LOC; the caret location is based on the location of the char at TYPE->offset_loc. PARAM_LOC is the location of the relevant argument, or UNKNOWN_LOCATION if this is unavailable. WANTED_TYPE is the type the argument should have, possibly stripped of pointer dereferences. The description (such as "field precision"), the placement in the format string, a possibly more friendly name of WANTED_TYPE, and the number of pointer dereferences are taken from TYPE. ARG_TYPE is the type of the actual argument, or NULL if it is missing. OFFSET_TO_TYPE_START is the offset within the execution-charset encoded format string to where type information begins for the conversion (the length modifier and conversion specifier). CONVERSION_CHAR is the user-provided conversion specifier. 
For example, given a type mismatch for argument 5 here: 00000000011111111112222222222333333333344444444445555555555| 12345678901234567890123456789012345678901234567890123456789` column numbers 0000000000111111111122| 0123456789012345678901` offsets within STRING_CST V~~~~~~~~ : range of WHOLE_FMT_LOC, from cols 23-31 sprintf (d, "before %-+*.*lld after", int_expr, int_expr, long_expr); ^ ^ ^~~~~~~~~ | ` CONVERSION_CHAR: 'd' PARAM_LOC type starts here OFFSET_TO_TYPE_START is 13, the offset to the "lld" within the STRING_CST. */ static void format_type_warning (const substring_loc &whole_fmt_loc, location_t param_loc, format_wanted_type *type, tree wanted_type, tree arg_type, const format_kind_info *fki, int offset_to_type_start, char conversion_char) { enum format_specifier_kind kind = type->kind; const char *wanted_type_name = type->wanted_type_name; const char *format_start = type->format_start; int format_length = type->format_length; int pointer_count = type->pointer_count; int arg_num = type->arg_num; /* If ARG_TYPE is a typedef with a misleading name (for example, size_t but not the standard size_t expected by printf %zu), avoid printing the typedef name. */ if (wanted_type_name && arg_type && TYPE_NAME (arg_type) && TREE_CODE (TYPE_NAME (arg_type)) == TYPE_DECL && DECL_NAME (TYPE_NAME (arg_type)) && !strcmp (wanted_type_name, lang_hooks.decl_printable_name (TYPE_NAME (arg_type), 2))) arg_type = TYPE_MAIN_VARIANT (arg_type); /* WHOLE_FMT_LOC has the caret at the end of the range. Set the caret to be at the offset from TYPE. Subtract one from the offset for the same reason as in format_warning_at_char. */ substring_loc fmt_loc (whole_fmt_loc); fmt_loc.set_caret_index (type->offset_loc - 1); range_label_for_format_type_mismatch fmt_label (wanted_type, arg_type, pointer_count); range_label_for_type_mismatch param_label (arg_type, wanted_type); /* Get a string for use as a replacement fix-it hint for the range in fmt_loc, or NULL. 
*/ char *corrected_substring = get_corrected_substring (fmt_loc, type, arg_type, fki, offset_to_type_start, conversion_char); format_string_diagnostic_t diag (fmt_loc, &fmt_label, param_loc, ¶m_label, corrected_substring); element_format_substring elem_format_substring (format_string_diagnostic_t::highlight_color_format_string, (kind == CF_KIND_FORMAT ? "%" : ""), format_length, format_start); pp_markup::element_actual_type elem_actual_param_type (arg_type); element_expected_type_with_indirection elem_expected_type (wanted_type, wanted_type_name, pointer_count); if (arg_type) diag.emit_warning (OPT_Wformat_, "%s %e expects argument of type %e, " "but argument %d has type %e", gettext (kind_descriptions[kind]), &elem_format_substring, &elem_expected_type, arg_num, &elem_actual_param_type); else diag.emit_warning (OPT_Wformat_, "%s %e expects a matching %e argument", gettext (kind_descriptions[kind]), &elem_format_substring, &elem_expected_type); free (corrected_substring); } /* Given a format_char_info array FCI, and a character C, this function returns the index into the conversion_specs where that specifier's data is located. The character must exist. */ static unsigned int find_char_info_specifier_index (const format_char_info *fci, int c) { unsigned i; for (i = 0; fci->format_chars; i++, fci++) if (strchr (fci->format_chars, c)) return i; /* We shouldn't be looking for a non-existent specifier. */ gcc_unreachable (); } /* Given a format_length_info array FLI, and a character C, this function returns the index into the conversion_specs where that modifier's data is located. The character must exist. */ static unsigned int find_length_info_modifier_index (const format_length_info *fli, int c) { unsigned i; for (i = 0; fli->name; i++, fli++) if (strchr (fli->name, c)) return i; /* We shouldn't be looking for a non-existent modifier. 
*/ gcc_unreachable (); } /* Determine the type of HOST_WIDE_INT in the code being compiled for use in GCC's __asm_fprintf__ custom format attribute. You must have set dynamic_format_types before calling this function. */ static void init_dynamic_asm_fprintf_info (void) { static tree hwi; if (!hwi) { format_length_info *new_asm_fprintf_length_specs; unsigned int i; /* Find the underlying type for HOST_WIDE_INT. For the %w length modifier to work, one must have issued: "typedef HOST_WIDE_INT __gcc_host_wide_int__;" in one's source code prior to using that modifier. */ hwi = maybe_get_identifier ("__gcc_host_wide_int__"); if (!hwi) { error ("%<__gcc_host_wide_int__%> is not defined as a type"); return; } hwi = identifier_global_value (hwi); if (!hwi || TREE_CODE (hwi) != TYPE_DECL) { error ("%<__gcc_host_wide_int__%> is not defined as a type"); return; } hwi = DECL_ORIGINAL_TYPE (hwi); gcc_assert (hwi); if (hwi != long_integer_type_node && hwi != long_long_integer_type_node) { error ("%<__gcc_host_wide_int__%> is not defined as %" " or %"); return; } /* Create a new (writable) copy of asm_fprintf_length_specs. */ new_asm_fprintf_length_specs = (format_length_info *) xmemdup (asm_fprintf_length_specs, sizeof (asm_fprintf_length_specs), sizeof (asm_fprintf_length_specs)); /* HOST_WIDE_INT must be one of 'long' or 'long long'. */ i = find_length_info_modifier_index (new_asm_fprintf_length_specs, 'w'); if (hwi == long_integer_type_node) new_asm_fprintf_length_specs[i].index = FMT_LEN_l; else if (hwi == long_long_integer_type_node) new_asm_fprintf_length_specs[i].index = FMT_LEN_ll; else gcc_unreachable (); /* Assign the new data for use. */ dynamic_format_types[asm_fprintf_format_type].length_char_specs = new_asm_fprintf_length_specs; } } static const format_length_info* get_init_dynamic_hwi (void) { static tree hwi; static format_length_info *diag_ls; if (!hwi) { unsigned int i; /* Find the underlying type for HOST_WIDE_INT. 
For the 'w' length modifier to work, one must have issued: "typedef HOST_WIDE_INT __gcc_host_wide_int__;" in one's source code prior to using that modifier. */ if ((hwi = maybe_get_identifier ("__gcc_host_wide_int__"))) { hwi = identifier_global_value (hwi); if (hwi) { if (TREE_CODE (hwi) != TYPE_DECL) { error ("%<__gcc_host_wide_int__%> is not defined as a type"); hwi = 0; } else { hwi = DECL_ORIGINAL_TYPE (hwi); gcc_assert (hwi); if (hwi != long_integer_type_node && hwi != long_long_integer_type_node) { error ("%<__gcc_host_wide_int__%> is not defined" " as % or %"); hwi = 0; } } } } if (!diag_ls) diag_ls = (format_length_info *) xmemdup (gcc_diag_length_specs, sizeof (gcc_diag_length_specs), sizeof (gcc_diag_length_specs)); if (hwi) { /* HOST_WIDE_INT must be one of 'long' or 'long long'. */ i = find_length_info_modifier_index (diag_ls, 'w'); if (hwi == long_integer_type_node) diag_ls[i].index = FMT_LEN_l; else if (hwi == long_long_integer_type_node) diag_ls[i].index = FMT_LEN_ll; else gcc_unreachable (); } } return diag_ls; } /* Determine the type of a "locus" in the code being compiled for use in GCC's __gcc_gfc__ custom format attribute. You must have set dynamic_format_types before calling this function. */ static void init_dynamic_gfc_info (void) { dynamic_format_types[gcc_gfc_format_type].length_char_specs = get_init_dynamic_hwi (); if (!locus) { static format_char_info *gfc_fci; /* For the GCC __gcc_gfc__ custom format specifier to work, one must have declared 'locus' prior to using this attribute. If we haven't seen this declarations then you shouldn't use the specifier requiring that type. */ if ((locus = maybe_get_identifier ("locus"))) { locus = identifier_global_value (locus); if (locus) { if (TREE_CODE (locus) != TYPE_DECL || TREE_TYPE (locus) == error_mark_node) { error ("% is not defined as a type"); locus = 0; } else locus = TREE_TYPE (locus); } } /* Assign the new data for use. */ /* Handle the __gcc_gfc__ format specifics. 
*/ if (!gfc_fci) dynamic_format_types[gcc_gfc_format_type].conversion_specs = gfc_fci = (format_char_info *) xmemdup (gcc_gfc_char_table, sizeof (gcc_gfc_char_table), sizeof (gcc_gfc_char_table)); if (locus) { const unsigned i = find_char_info_specifier_index (gfc_fci, 'L'); gfc_fci[i].types[0].type = &locus; gfc_fci[i].pointer_count = 1; } } } /* Lookup the type named NAME and return a NAME type if found. Otherwise, return void_type_node if NAME has not been used yet, or NULL_TREE if NAME is not a type (issuing an error). */ static tree get_named_type (const char *name) { if (tree result = maybe_get_identifier (name)) { result = identifier_global_tag (result); if (result) { if (TYPE_P (result)) ; else if (TREE_CODE (result) == TYPE_DECL) result = TREE_TYPE (result); else { error ("%qs is not defined as a type", name); result = NULL_TREE; } } return result; } else return void_type_node; } /* Determine the types of "tree" and "location_t" in the code being compiled for use in GCC's diagnostic custom format attributes. You must have set dynamic_format_types before calling this function. */ static void init_dynamic_diag_info (void) { /* For the GCC-diagnostics custom format specifiers to work, one must have declared 'tree' and 'location_t' prior to using those attributes. If we haven't seen these declarations then the specifiers requiring these types shouldn't be used. However we don't force a hard ICE because we may see only one or the other type. */ if (tree loc = maybe_get_identifier ("location_t")) { loc = identifier_global_value (loc); if (loc && TREE_CODE (loc) != TYPE_DECL) error ("% is not defined as a type"); } /* Initialize the global tree node type local to this file. */ if (!local_tree_type_node || local_tree_type_node == void_type_node) { /* We need to grab the underlying 'union tree_node' so peek into an extra type level. 
*/ if ((local_tree_type_node = maybe_get_identifier ("tree"))) { local_tree_type_node = identifier_global_value (local_tree_type_node); if (local_tree_type_node) { if (TREE_CODE (local_tree_type_node) != TYPE_DECL) { error ("% is not defined as a type"); local_tree_type_node = NULL_TREE; } else if (TREE_CODE (TREE_TYPE (local_tree_type_node)) != POINTER_TYPE) { error ("% is not defined as a pointer type"); local_tree_type_node = NULL_TREE; } else local_tree_type_node = TREE_TYPE (TREE_TYPE (local_tree_type_node)); } } else local_tree_type_node = void_type_node; } /* Similar to the above but for gimple*. */ if (!local_gimple_ptr_node || local_gimple_ptr_node == void_type_node) local_gimple_ptr_node = get_named_type ("gimple"); /* Similar to the above but for cgraph_node*. */ if (!local_cgraph_node_ptr_node || local_cgraph_node_ptr_node == void_type_node) local_cgraph_node_ptr_node = get_named_type ("cgraph_node"); /* Similar to the above but for diagnostic_event_id_t*. */ if (!local_event_ptr_node || local_event_ptr_node == void_type_node) local_event_ptr_node = get_named_type ("diagnostic_event_id_t"); /* Similar to the above but for pp_element*. */ if (!local_pp_element_ptr_node || local_pp_element_ptr_node == void_type_node) { if (tree pp_element_node = get_named_type ("pp_element")) local_pp_element_ptr_node = build_pointer_type (pp_element_node); } /* All the GCC diag formats use the same length specs. */ dynamic_format_types[gcc_diag_format_type].length_char_specs = dynamic_format_types[gcc_tdiag_format_type].length_char_specs = dynamic_format_types[gcc_cdiag_format_type].length_char_specs = dynamic_format_types[gcc_cxxdiag_format_type].length_char_specs = dynamic_format_types[gcc_dump_printf_format_type].length_char_specs = get_init_dynamic_hwi (); /* It's safe to "re-initialize these to the same values. 
*/ dynamic_format_types[gcc_diag_format_type].conversion_specs = gcc_diag_char_table; dynamic_format_types[gcc_tdiag_format_type].conversion_specs = gcc_tdiag_char_table; dynamic_format_types[gcc_cdiag_format_type].conversion_specs = gcc_cdiag_char_table; dynamic_format_types[gcc_cxxdiag_format_type].conversion_specs = gcc_cxxdiag_char_table; dynamic_format_types[gcc_dump_printf_format_type].conversion_specs = gcc_dump_printf_char_table; } #ifdef TARGET_FORMAT_TYPES extern const format_kind_info TARGET_FORMAT_TYPES[]; #endif #ifdef TARGET_OVERRIDES_FORMAT_ATTRIBUTES extern const target_ovr_attr TARGET_OVERRIDES_FORMAT_ATTRIBUTES[]; #endif #ifdef TARGET_OVERRIDES_FORMAT_INIT extern void TARGET_OVERRIDES_FORMAT_INIT (void); #endif /* Attributes such as "printf" are equivalent to those such as "gnu_printf" unless this is overridden by a target. */ static const target_ovr_attr gnu_target_overrides_format_attributes[] = { { "gnu_printf", "printf" }, { "gnu_scanf", "scanf" }, { "gnu_strftime", "strftime" }, { "gnu_strfmon", "strfmon" }, { NULL, NULL } }; /* Translate to unified attribute name. This is used in decode_format_type and decode_format_attr. In attr_name the user specified argument is passed. It returns the unified format name from TARGET_OVERRIDES_FORMAT_ATTRIBUTES or the attr_name passed to this function, if there is no matching entry. */ static const char * convert_format_name_to_system_name (const char *attr_name) { int i; if (attr_name == NULL || *attr_name == 0 || startswith (attr_name, "gcc_")) return attr_name; #ifdef TARGET_OVERRIDES_FORMAT_INIT TARGET_OVERRIDES_FORMAT_INIT (); #endif #ifdef TARGET_OVERRIDES_FORMAT_ATTRIBUTES /* Check if format attribute is overridden by target. 
*/ if (TARGET_OVERRIDES_FORMAT_ATTRIBUTES_COUNT > 0) { for (i = 0; i < TARGET_OVERRIDES_FORMAT_ATTRIBUTES_COUNT; ++i) { if (cmp_attribs (TARGET_OVERRIDES_FORMAT_ATTRIBUTES[i].named_attr_src, attr_name)) return attr_name; if (cmp_attribs (TARGET_OVERRIDES_FORMAT_ATTRIBUTES[i].named_attr_dst, attr_name)) return TARGET_OVERRIDES_FORMAT_ATTRIBUTES[i].named_attr_src; } } #endif /* Otherwise default to gnu format. */ for (i = 0; gnu_target_overrides_format_attributes[i].named_attr_src != NULL; ++i) { if (cmp_attribs (gnu_target_overrides_format_attributes[i].named_attr_src, attr_name)) return attr_name; if (cmp_attribs (gnu_target_overrides_format_attributes[i].named_attr_dst, attr_name)) return gnu_target_overrides_format_attributes[i].named_attr_src; } return attr_name; } /* Handle a "format" attribute; arguments as in struct attribute_spec.handler. */ tree handle_format_attribute (tree node[3], tree atname, tree args, int flags, bool *no_add_attrs) { const_tree type = *node; /* NODE[2] may be NULL, and it also may be a PARM_DECL for function pointers. */ const_tree fndecl = ((node[2] && TREE_CODE (node[2]) == FUNCTION_DECL) ? node[2] : NULL_TREE); function_format_info info; #ifdef TARGET_FORMAT_TYPES /* If the target provides additional format types, we need to add them to FORMAT_TYPES at first use. */ if (!dynamic_format_types) { dynamic_format_types = XNEWVEC (format_kind_info, n_format_types + TARGET_N_FORMAT_TYPES); memcpy (dynamic_format_types, format_types_orig, sizeof (format_types_orig)); memcpy (&dynamic_format_types[n_format_types], TARGET_FORMAT_TYPES, TARGET_N_FORMAT_TYPES * sizeof (dynamic_format_types[0])); format_types = dynamic_format_types; /* Provide a reference for the first potential external type. */ first_target_format_type = n_format_types; n_format_types += TARGET_N_FORMAT_TYPES; } #endif /* Canonicalize name of format function. 
*/ if (TREE_CODE (TREE_VALUE (args)) == IDENTIFIER_NODE) TREE_VALUE (args) = canonicalize_attr_name (TREE_VALUE (args)); /* record the flags for check_function_format */ TREE_PURPOSE (args) = build_int_cst (unsigned_type_node, flags); if (!decode_format_attr (fndecl ? fndecl : type, atname, args, &info, /* validated_p = */false)) { *no_add_attrs = true; return NULL_TREE; } if (prototype_p (type)) { if (!check_format_string (type, info.format_num, flags, no_add_attrs, info.format_type)) return NULL_TREE; if (info.first_arg_num != 0) { unsigned HOST_WIDE_INT arg_num = 1; function_args_iterator iter; tree arg_type; /* Verify that first_arg_num points to the last arg, the ... */ FOREACH_FUNCTION_ARGS (type, arg_type, iter) arg_num++; if (arg_num != info.first_arg_num) { if (!(flags & (int) ATTR_FLAG_BUILT_IN)) error ("argument to be formatted is not %<...%>"); *no_add_attrs = true; return NULL_TREE; } } } /* Check if this is a strftime variant. Just for this variant FMT_FLAG_ARG_CONVERT is not set. */ if ((format_types[info.format_type].flags & (int) FMT_FLAG_ARG_CONVERT) == 0 && info.first_arg_num != 0) { error ("strftime formats cannot format arguments"); *no_add_attrs = true; return NULL_TREE; } /* If this is a custom GCC-internal format type, we have to initialize certain bits at runtime. */ if (info.format_type == asm_fprintf_format_type || info.format_type == gcc_gfc_format_type || info.format_type == gcc_diag_format_type || info.format_type == gcc_tdiag_format_type || info.format_type == gcc_cdiag_format_type || info.format_type == gcc_cxxdiag_format_type || info.format_type == gcc_dump_printf_format_type) { /* Our first time through, we have to make sure that our format_type data is allocated dynamically and is modifiable. 
*/ if (!dynamic_format_types) format_types = dynamic_format_types = (format_kind_info *) xmemdup (format_types_orig, sizeof (format_types_orig), sizeof (format_types_orig)); /* If this is format __asm_fprintf__, we have to initialize GCC's notion of HOST_WIDE_INT for checking %wd. */ if (info.format_type == asm_fprintf_format_type) init_dynamic_asm_fprintf_info (); /* If this is format __gcc_gfc__, we have to initialize GCC's notion of 'locus' at runtime for %L. */ else if (info.format_type == gcc_gfc_format_type) init_dynamic_gfc_info (); /* If this is one of the diagnostic attributes, then we have to initialize 'location_t' and 'tree' at runtime. */ else if (info.format_type == gcc_diag_format_type || info.format_type == gcc_tdiag_format_type || info.format_type == gcc_cdiag_format_type || info.format_type == gcc_cxxdiag_format_type || info.format_type == gcc_dump_printf_format_type) init_dynamic_diag_info (); else gcc_unreachable (); } return NULL_TREE; } #if CHECKING_P namespace selftest { /* Selftests of location handling. */ /* Get the format_kind_info with the given name. */ static const format_kind_info * get_info (const char *name) { int idx = decode_format_type (name); const format_kind_info *fki = &format_types[idx]; ASSERT_STREQ (fki->name, name); return fki; } /* Verify that get_format_for_type (FKI, TYPE, CONVERSION_CHAR) is EXPECTED_FORMAT. */ static void assert_format_for_type_streq (const location &loc, const format_kind_info *fki, const char *expected_format, tree type, char conversion_char) { gcc_assert (fki); gcc_assert (expected_format); gcc_assert (type); char *actual_format = get_format_for_type (fki, type, conversion_char); ASSERT_STREQ_AT (loc, expected_format, actual_format); free (actual_format); } /* Selftests for get_format_for_type. 
*/ #define ASSERT_FORMAT_FOR_TYPE_STREQ(EXPECTED_FORMAT, TYPE, CONVERSION_CHAR) \ assert_format_for_type_streq (SELFTEST_LOCATION, (fki), (EXPECTED_FORMAT), \ (TYPE), (CONVERSION_CHAR)) /* Selftest for get_format_for_type for "printf"-style functions. */ static void test_get_format_for_type_printf () { const format_kind_info *fki = get_info ("gnu_printf"); ASSERT_NE (fki, NULL); ASSERT_FORMAT_FOR_TYPE_STREQ ("f", double_type_node, 'i'); ASSERT_FORMAT_FOR_TYPE_STREQ ("Lf", long_double_type_node, 'i'); ASSERT_FORMAT_FOR_TYPE_STREQ ("f", double_type_node, 'o'); ASSERT_FORMAT_FOR_TYPE_STREQ ("Lf", long_double_type_node, 'o'); ASSERT_FORMAT_FOR_TYPE_STREQ ("f", double_type_node, 'x'); ASSERT_FORMAT_FOR_TYPE_STREQ ("Lf", long_double_type_node, 'x'); ASSERT_FORMAT_FOR_TYPE_STREQ ("f", double_type_node, 'X'); ASSERT_FORMAT_FOR_TYPE_STREQ ("Lf", long_double_type_node, 'X'); ASSERT_FORMAT_FOR_TYPE_STREQ ("d", integer_type_node, 'd'); ASSERT_FORMAT_FOR_TYPE_STREQ ("i", integer_type_node, 'i'); ASSERT_FORMAT_FOR_TYPE_STREQ ("o", integer_type_node, 'o'); ASSERT_FORMAT_FOR_TYPE_STREQ ("x", integer_type_node, 'x'); ASSERT_FORMAT_FOR_TYPE_STREQ ("X", integer_type_node, 'X'); ASSERT_FORMAT_FOR_TYPE_STREQ ("d", unsigned_type_node, 'd'); ASSERT_FORMAT_FOR_TYPE_STREQ ("i", unsigned_type_node, 'i'); ASSERT_FORMAT_FOR_TYPE_STREQ ("o", unsigned_type_node, 'o'); ASSERT_FORMAT_FOR_TYPE_STREQ ("x", unsigned_type_node, 'x'); ASSERT_FORMAT_FOR_TYPE_STREQ ("X", unsigned_type_node, 'X'); ASSERT_FORMAT_FOR_TYPE_STREQ ("ld", long_integer_type_node, 'd'); ASSERT_FORMAT_FOR_TYPE_STREQ ("li", long_integer_type_node, 'i'); ASSERT_FORMAT_FOR_TYPE_STREQ ("lx", long_integer_type_node, 'x'); ASSERT_FORMAT_FOR_TYPE_STREQ ("lo", long_unsigned_type_node, 'o'); ASSERT_FORMAT_FOR_TYPE_STREQ ("lx", long_unsigned_type_node, 'x'); ASSERT_FORMAT_FOR_TYPE_STREQ ("lld", long_long_integer_type_node, 'd'); ASSERT_FORMAT_FOR_TYPE_STREQ ("lli", long_long_integer_type_node, 'i'); ASSERT_FORMAT_FOR_TYPE_STREQ ("llo", 
long_long_unsigned_type_node, 'o'); ASSERT_FORMAT_FOR_TYPE_STREQ ("llx", long_long_unsigned_type_node, 'x'); ASSERT_FORMAT_FOR_TYPE_STREQ ("s", build_pointer_type (char_type_node), 'i'); } /* Selftest for get_format_for_type for "scanf"-style functions. */ static void test_get_format_for_type_scanf () { const format_kind_info *fki = get_info ("gnu_scanf"); ASSERT_NE (fki, NULL); ASSERT_FORMAT_FOR_TYPE_STREQ ("d", build_pointer_type (integer_type_node), 'd'); ASSERT_FORMAT_FOR_TYPE_STREQ ("u", build_pointer_type (unsigned_type_node), 'u'); ASSERT_FORMAT_FOR_TYPE_STREQ ("ld", build_pointer_type (long_integer_type_node), 'd'); ASSERT_FORMAT_FOR_TYPE_STREQ ("lu", build_pointer_type (long_unsigned_type_node), 'u'); ASSERT_FORMAT_FOR_TYPE_STREQ ("lld", build_pointer_type (long_long_integer_type_node), 'd'); ASSERT_FORMAT_FOR_TYPE_STREQ ("llu", build_pointer_type (long_long_unsigned_type_node), 'u'); ASSERT_FORMAT_FOR_TYPE_STREQ ("e", build_pointer_type (float_type_node), 'e'); ASSERT_FORMAT_FOR_TYPE_STREQ ("le", build_pointer_type (double_type_node), 'e'); } #undef ASSERT_FORMAT_FOR_TYPE_STREQ /* Exercise the type-printing label code, to give some coverage under "make selftest-valgrind" (in particular, to ensure that the label-printing machinery doesn't leak). */ static void test_type_mismatch_range_labels () { /* Create a tempfile and write some text to it. ....................0000000001 11111111 12 22222222 ....................1234567890 12345678 90 12345678. 
*/ const char *content = " printf (\"msg: %i\\n\", msg);\n"; temp_source_file tmp (SELFTEST_LOCATION, ".c", content); line_table_test ltt; linemap_add (line_table, LC_ENTER, false, tmp.get_filename (), 1); location_t c17 = linemap_position_for_column (line_table, 17); ASSERT_EQ (LOCATION_COLUMN (c17), 17); location_t c18 = linemap_position_for_column (line_table, 18); location_t c24 = linemap_position_for_column (line_table, 24); location_t c26 = linemap_position_for_column (line_table, 26); /* Don't attempt to run the tests if column data might be unavailable. */ if (c26 > LINE_MAP_MAX_LOCATION_WITH_COLS) return; location_t fmt = make_location (c18, c17, c18); ASSERT_EQ (LOCATION_COLUMN (fmt), 18); location_t param = make_location (c24, c24, c26); ASSERT_EQ (LOCATION_COLUMN (param), 24); range_label_for_format_type_mismatch fmt_label (char_type_node, integer_type_node, 1); range_label_for_type_mismatch param_label (integer_type_node, char_type_node); gcc_rich_location richloc (fmt, &fmt_label, nullptr); richloc.add_range (param, SHOW_RANGE_WITHOUT_CARET, ¶m_label); test_diagnostic_context dc; diagnostic_show_locus (&dc, dc.m_source_printing, &richloc, DK_ERROR, dc.get_reference_printer ()); if (c_dialect_cxx ()) /* "char*", without a space. */ ASSERT_STREQ (" printf (\"msg: %i\\n\", msg);\n" " ~^ ~~~\n" " | |\n" " char* int\n", pp_formatted_text (dc.get_reference_printer ())); else /* "char *", with a space. */ ASSERT_STREQ (" printf (\"msg: %i\\n\", msg);\n" " ~^ ~~~\n" " | |\n" " | int\n" " char *\n", pp_formatted_text (dc.get_reference_printer ())); } /* Run all of the selftests within this file. */ void c_format_cc_tests () { test_get_modifier_for_format_len (); test_get_format_for_type_printf (); test_get_format_for_type_scanf (); test_type_mismatch_range_labels (); } } // namespace selftest #endif /* CHECKING_P */ #include "gt-c-family-c-format.h"