]> git.ipfire.org Git - thirdparty/gcc.git/blob - gcc/gimple-ssa-sprintf.c
[Ada] Fold Enum_Rep attribute in evaluation and not in expansion
[thirdparty/gcc.git] / gcc / gimple-ssa-sprintf.c
1 /* Copyright (C) 2016-2020 Free Software Foundation, Inc.
2 Contributed by Martin Sebor <msebor@redhat.com>.
3
4 This file is part of GCC.
5
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
10
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
19
20 /* This file implements the printf-return-value pass. The pass does
21 two things: 1) it analyzes calls to formatted output functions like
22 sprintf looking for possible buffer overflows and calls to bounded
23 functions like snprintf for early truncation (and under the control
24 of the -Wformat-length option issues warnings), and 2) under the
25 control of the -fprintf-return-value option it folds the return
26 value of safe calls into constants, making it possible to eliminate
27 code that depends on the value of those constants.
28
29 For all functions (bounded or not) the pass uses the size of the
30 destination object. That means that it will diagnose calls to
31 snprintf not on the basis of the size specified by the function's
32 second argument but rathger on the basis of the size the first
33 argument points to (if possible). For bound-checking built-ins
34 like __builtin___snprintf_chk the pass uses the size typically
35 determined by __builtin_object_size and passed to the built-in
36 by the Glibc inline wrapper.
37
38 The pass handles all forms standard sprintf format directives,
39 including character, integer, floating point, pointer, and strings,
40 with the standard C flags, widths, and precisions. For integers
41 and strings it computes the length of output itself. For floating
42 point it uses MPFR to fornmat known constants with up and down
43 rounding and uses the resulting range of output lengths. For
44 strings it uses the length of string literals and the sizes of
45 character arrays that a character pointer may point to as a bound
46 on the longest string. */
47
48 #include "config.h"
49 #include "system.h"
50 #include "coretypes.h"
51 #include "backend.h"
52 #include "tree.h"
53 #include "gimple.h"
54 #include "tree-pass.h"
55 #include "ssa.h"
56 #include "gimple-fold.h"
57 #include "gimple-pretty-print.h"
58 #include "diagnostic-core.h"
59 #include "fold-const.h"
60 #include "gimple-iterator.h"
61 #include "tree-ssa.h"
62 #include "tree-object-size.h"
63 #include "tree-cfg.h"
64 #include "tree-ssa-propagate.h"
65 #include "calls.h"
66 #include "cfgloop.h"
67 #include "tree-scalar-evolution.h"
68 #include "tree-ssa-loop.h"
69 #include "intl.h"
70 #include "langhooks.h"
71
72 #include "attribs.h"
73 #include "builtins.h"
74 #include "stor-layout.h"
75
76 #include "realmpfr.h"
77 #include "target.h"
78
79 #include "cpplib.h"
80 #include "input.h"
81 #include "toplev.h"
82 #include "substring-locations.h"
83 #include "diagnostic.h"
84 #include "domwalk.h"
85 #include "alloc-pool.h"
86 #include "vr-values.h"
87 #include "tree-ssa-strlen.h"
88 #include "tree-dfa.h"
89
90 /* The likely worst case value of MB_LEN_MAX for the target, large enough
91 for UTF-8. Ideally, this would be obtained by a target hook if it were
92 to be used for optimization but it's good enough as is for warnings. */
93 #define target_mb_len_max() 6
94
95 /* The maximum number of bytes a single non-string directive can result
96 in. This is the result of printf("%.*Lf", INT_MAX, -LDBL_MAX) for
97 LDBL_MAX_10_EXP of 4932. */
98 #define IEEE_MAX_10_EXP 4932
99 #define target_dir_max() (target_int_max () + IEEE_MAX_10_EXP + 2)
100
101 namespace {
102
103 /* Set to the warning level for the current function which is equal
104 either to warn_format_trunc for bounded functions or to
105 warn_format_overflow otherwise. */
106
107 static int warn_level;
108
109 /* The minimum, maximum, likely, and unlikely maximum number of bytes
110 of output either a formatting function or an individual directive
111 can result in. */
112
113 struct result_range
114 {
115 /* The absolute minimum number of bytes. The result of a successful
116 conversion is guaranteed to be no less than this. (An erroneous
117 conversion can be indicated by MIN > HOST_WIDE_INT_MAX.) */
118 unsigned HOST_WIDE_INT min;
119 /* The likely maximum result that is used in diagnostics. In most
120 cases MAX is the same as the worst case UNLIKELY result. */
121 unsigned HOST_WIDE_INT max;
122 /* The likely result used to trigger diagnostics. For conversions
123 that result in a range of bytes [MIN, MAX], LIKELY is somewhere
124 in that range. */
125 unsigned HOST_WIDE_INT likely;
126 /* In rare cases (e.g., for nultibyte characters) UNLIKELY gives
127 the worst cases maximum result of a directive. In most cases
128 UNLIKELY == MAX. UNLIKELY is used to control the return value
129 optimization but not in diagnostics. */
130 unsigned HOST_WIDE_INT unlikely;
131 };
132
133 /* Return the value of INT_MIN for the target. */
134
135 static inline HOST_WIDE_INT
136 target_int_min ()
137 {
138 return tree_to_shwi (TYPE_MIN_VALUE (integer_type_node));
139 }
140
141 /* Return the value of INT_MAX for the target. */
142
143 static inline unsigned HOST_WIDE_INT
144 target_int_max ()
145 {
146 return tree_to_uhwi (TYPE_MAX_VALUE (integer_type_node));
147 }
148
149 /* Return the value of SIZE_MAX for the target. */
150
151 static inline unsigned HOST_WIDE_INT
152 target_size_max ()
153 {
154 return tree_to_uhwi (TYPE_MAX_VALUE (size_type_node));
155 }
156
157 /* A straightforward mapping from the execution character set to the host
158 character set indexed by execution character. */
159
160 static char target_to_host_charmap[256];
161
162 /* Initialize a mapping from the execution character set to the host
163 character set. */
164
165 static bool
166 init_target_to_host_charmap ()
167 {
168 /* If the percent sign is non-zero the mapping has already been
169 initialized. */
170 if (target_to_host_charmap['%'])
171 return true;
172
173 /* Initialize the target_percent character (done elsewhere). */
174 if (!init_target_chars ())
175 return false;
176
177 /* The subset of the source character set used by printf conversion
178 specifications (strictly speaking, not all letters are used but
179 they are included here for the sake of simplicity). The dollar
180 sign must be included even though it's not in the basic source
181 character set. */
182 const char srcset[] = " 0123456789!\"#%&'()*+,-./:;<=>?[\\]^_{|}~$"
183 "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz";
184
185 /* Set the mapping for all characters to some ordinary value (i,e.,
186 not none used in printf conversion specifications) and overwrite
187 those that are used by conversion specifications with their
188 corresponding values. */
189 memset (target_to_host_charmap + 1, '?', sizeof target_to_host_charmap - 1);
190
191 /* Are the two sets of characters the same? */
192 bool all_same_p = true;
193
194 for (const char *pc = srcset; *pc; ++pc)
195 {
196 /* Slice off the high end bits in case target characters are
197 signed. All values are expected to be non-nul, otherwise
198 there's a problem. */
199 if (unsigned char tc = lang_hooks.to_target_charset (*pc))
200 {
201 target_to_host_charmap[tc] = *pc;
202 if (tc != *pc)
203 all_same_p = false;
204 }
205 else
206 return false;
207
208 }
209
210 /* Set the first element to a non-zero value if the mapping
211 is 1-to-1, otherwise leave it clear (NUL is assumed to be
212 the same in both character sets). */
213 target_to_host_charmap[0] = all_same_p;
214
215 return true;
216 }
217
218 /* Return the host source character corresponding to the character
219 CH in the execution character set if one exists, or some innocuous
220 (non-special, non-nul) source character otherwise. */
221
222 static inline unsigned char
223 target_to_host (unsigned char ch)
224 {
225 return target_to_host_charmap[ch];
226 }
227
228 /* Convert an initial substring of the string TARGSTR consisting of
229 characters in the execution character set into a string in the
230 source character set on the host and store up to HOSTSZ characters
231 in the buffer pointed to by HOSTR. Return HOSTR. */
232
233 static const char*
234 target_to_host (char *hostr, size_t hostsz, const char *targstr)
235 {
236 /* Make sure the buffer is reasonably big. */
237 gcc_assert (hostsz > 4);
238
239 /* The interesting subset of source and execution characters are
240 the same so no conversion is necessary. However, truncate
241 overlong strings just like the translated strings are. */
242 if (target_to_host_charmap['\0'] == 1)
243 {
244 size_t len = strlen (targstr);
245 if (len >= hostsz)
246 {
247 memcpy (hostr, targstr, hostsz - 4);
248 strcpy (hostr + hostsz - 4, "...");
249 }
250 else
251 memcpy (hostr, targstr, len + 1);
252 return hostr;
253 }
254
255 /* Convert the initial substring of TARGSTR to the corresponding
256 characters in the host set, appending "..." if TARGSTR is too
257 long to fit. Using the static buffer assumes the function is
258 not called in between sequence points (which it isn't). */
259 for (char *ph = hostr; ; ++targstr)
260 {
261 *ph++ = target_to_host (*targstr);
262 if (!*targstr)
263 break;
264
265 if (size_t (ph - hostr) == hostsz)
266 {
267 strcpy (ph - 4, "...");
268 break;
269 }
270 }
271
272 return hostr;
273 }
274
275 /* Convert the sequence of decimal digits in the execution character
276 starting at *PS to a HOST_WIDE_INT, analogously to strtol. Return
277 the result and set *PS to one past the last converted character.
278 On range error set ERANGE to the digit that caused it. */
279
280 static inline HOST_WIDE_INT
281 target_strtowi (const char **ps, const char **erange)
282 {
283 unsigned HOST_WIDE_INT val = 0;
284 for ( ; ; ++*ps)
285 {
286 unsigned char c = target_to_host (**ps);
287 if (ISDIGIT (c))
288 {
289 c -= '0';
290
291 /* Check for overflow. */
292 if (val > ((unsigned HOST_WIDE_INT) HOST_WIDE_INT_MAX - c) / 10LU)
293 {
294 val = HOST_WIDE_INT_MAX;
295 *erange = *ps;
296
297 /* Skip the remaining digits. */
298 do
299 c = target_to_host (*++*ps);
300 while (ISDIGIT (c));
301 break;
302 }
303 else
304 val = val * 10 + c;
305 }
306 else
307 break;
308 }
309
310 return val;
311 }
312
313 /* Given FORMAT, set *PLOC to the source location of the format string
314 and return the format string if it is known or null otherwise. */
315
316 static const char*
317 get_format_string (tree format, location_t *ploc)
318 {
319 *ploc = EXPR_LOC_OR_LOC (format, input_location);
320
321 return c_getstr (format);
322 }
323
324 /* For convenience and brevity, shorter named entrypoints of
325 format_string_diagnostic_t::emit_warning_va and
326 format_string_diagnostic_t::emit_warning_n_va.
327 These have to be functions with the attribute so that exgettext
328 works properly. */
329
330 static bool
331 ATTRIBUTE_GCC_DIAG (5, 6)
332 fmtwarn (const substring_loc &fmt_loc, location_t param_loc,
333 const char *corrected_substring, int opt, const char *gmsgid, ...)
334 {
335 format_string_diagnostic_t diag (fmt_loc, NULL, param_loc, NULL,
336 corrected_substring);
337 va_list ap;
338 va_start (ap, gmsgid);
339 bool warned = diag.emit_warning_va (opt, gmsgid, &ap);
340 va_end (ap);
341
342 return warned;
343 }
344
345 static bool
346 ATTRIBUTE_GCC_DIAG (6, 8) ATTRIBUTE_GCC_DIAG (7, 8)
347 fmtwarn_n (const substring_loc &fmt_loc, location_t param_loc,
348 const char *corrected_substring, int opt, unsigned HOST_WIDE_INT n,
349 const char *singular_gmsgid, const char *plural_gmsgid, ...)
350 {
351 format_string_diagnostic_t diag (fmt_loc, NULL, param_loc, NULL,
352 corrected_substring);
353 va_list ap;
354 va_start (ap, plural_gmsgid);
355 bool warned = diag.emit_warning_n_va (opt, n, singular_gmsgid, plural_gmsgid,
356 &ap);
357 va_end (ap);
358
359 return warned;
360 }
361
362 /* Format length modifiers. */
363
364 enum format_lengths
365 {
366 FMT_LEN_none,
367 FMT_LEN_hh, // char argument
368 FMT_LEN_h, // short
369 FMT_LEN_l, // long
370 FMT_LEN_ll, // long long
371 FMT_LEN_L, // long double (and GNU long long)
372 FMT_LEN_z, // size_t
373 FMT_LEN_t, // ptrdiff_t
374 FMT_LEN_j // intmax_t
375 };
376
377
378 /* Description of the result of conversion either of a single directive
379 or the whole format string. */
380
381 class fmtresult
382 {
383 public:
384 /* Construct a FMTRESULT object with all counters initialized
385 to MIN. KNOWNRANGE is set when MIN is valid. */
386 fmtresult (unsigned HOST_WIDE_INT min = HOST_WIDE_INT_MAX)
387 : argmin (), argmax (), dst_offset (HOST_WIDE_INT_MIN), nonstr (),
388 knownrange (min < HOST_WIDE_INT_MAX),
389 mayfail (), nullp ()
390 {
391 range.min = min;
392 range.max = min;
393 range.likely = min;
394 range.unlikely = min;
395 }
396
397 /* Construct a FMTRESULT object with MIN, MAX, and LIKELY counters.
398 KNOWNRANGE is set when both MIN and MAX are valid. */
399 fmtresult (unsigned HOST_WIDE_INT min, unsigned HOST_WIDE_INT max,
400 unsigned HOST_WIDE_INT likely = HOST_WIDE_INT_MAX)
401 : argmin (), argmax (), dst_offset (HOST_WIDE_INT_MIN), nonstr (),
402 knownrange (min < HOST_WIDE_INT_MAX && max < HOST_WIDE_INT_MAX),
403 mayfail (), nullp ()
404 {
405 range.min = min;
406 range.max = max;
407 range.likely = max < likely ? min : likely;
408 range.unlikely = max;
409 }
410
411 /* Adjust result upward to reflect the RANGE of values the specified
412 width or precision is known to be in. */
413 fmtresult& adjust_for_width_or_precision (const HOST_WIDE_INT[2],
414 tree = NULL_TREE,
415 unsigned = 0, unsigned = 0);
416
417 /* Return the maximum number of decimal digits a value of TYPE
418 formats as on output. */
419 static unsigned type_max_digits (tree, int);
420
421 /* The range a directive's argument is in. */
422 tree argmin, argmax;
423
424 /* The starting offset into the destination of the formatted function
425 call of the %s argument that points into (aliases with) the same
426 destination array. */
427 HOST_WIDE_INT dst_offset;
428
429 /* The minimum and maximum number of bytes that a directive
430 results in on output for an argument in the range above. */
431 result_range range;
432
433 /* Non-nul when the argument of a string directive is not a nul
434 terminated string. */
435 tree nonstr;
436
437 /* True when the range above is obtained from a known value of
438 a directive's argument or its bounds and not the result of
439 heuristics that depend on warning levels. */
440 bool knownrange;
441
442 /* True for a directive that may fail (such as wide character
443 directives). */
444 bool mayfail;
445
446 /* True when the argument is a null pointer. */
447 bool nullp;
448 };
449
450 /* Adjust result upward to reflect the range ADJUST of values the
451 specified width or precision is known to be in. When non-null,
452 TYPE denotes the type of the directive whose result is being
453 adjusted, BASE gives the base of the directive (octal, decimal,
454 or hex), and ADJ denotes the additional adjustment to the LIKELY
455 counter that may need to be added when ADJUST is a range. */
456
457 fmtresult&
458 fmtresult::adjust_for_width_or_precision (const HOST_WIDE_INT adjust[2],
459 tree type /* = NULL_TREE */,
460 unsigned base /* = 0 */,
461 unsigned adj /* = 0 */)
462 {
463 bool minadjusted = false;
464
465 /* Adjust the minimum and likely counters. */
466 if (adjust[0] >= 0)
467 {
468 if (range.min < (unsigned HOST_WIDE_INT)adjust[0])
469 {
470 range.min = adjust[0];
471 minadjusted = true;
472 }
473
474 /* Adjust the likely counter. */
475 if (range.likely < range.min)
476 range.likely = range.min;
477 }
478 else if (adjust[0] == target_int_min ()
479 && (unsigned HOST_WIDE_INT)adjust[1] == target_int_max ())
480 knownrange = false;
481
482 /* Adjust the maximum counter. */
483 if (adjust[1] > 0)
484 {
485 if (range.max < (unsigned HOST_WIDE_INT)adjust[1])
486 {
487 range.max = adjust[1];
488
489 /* Set KNOWNRANGE if both the minimum and maximum have been
490 adjusted. Otherwise leave it at what it was before. */
491 knownrange = minadjusted;
492 }
493 }
494
495 if (warn_level > 1 && type)
496 {
497 /* For large non-constant width or precision whose range spans
498 the maximum number of digits produced by the directive for
499 any argument, set the likely number of bytes to be at most
500 the number digits plus other adjustment determined by the
501 caller (one for sign or two for the hexadecimal "0x"
502 prefix). */
503 unsigned dirdigs = type_max_digits (type, base);
504 if (adjust[0] < dirdigs && dirdigs < adjust[1]
505 && range.likely < dirdigs)
506 range.likely = dirdigs + adj;
507 }
508 else if (range.likely < (range.min ? range.min : 1))
509 {
510 /* Conservatively, set LIKELY to at least MIN but no less than
511 1 unless MAX is zero. */
512 range.likely = (range.min
513 ? range.min
514 : range.max && (range.max < HOST_WIDE_INT_MAX
515 || warn_level > 1) ? 1 : 0);
516 }
517
518 /* Finally adjust the unlikely counter to be at least as large as
519 the maximum. */
520 if (range.unlikely < range.max)
521 range.unlikely = range.max;
522
523 return *this;
524 }
525
526 /* Return the maximum number of digits a value of TYPE formats in
527 BASE on output, not counting base prefix . */
528
529 unsigned
530 fmtresult::type_max_digits (tree type, int base)
531 {
532 unsigned prec = TYPE_PRECISION (type);
533 switch (base)
534 {
535 case 8:
536 return (prec + 2) / 3;
537 case 10:
538 /* Decimal approximation: yields 3, 5, 10, and 20 for precision
539 of 8, 16, 32, and 64 bits. */
540 return prec * 301 / 1000 + 1;
541 case 16:
542 return prec / 4;
543 }
544
545 gcc_unreachable ();
546 }
547
548 static bool
549 get_int_range (tree, HOST_WIDE_INT *, HOST_WIDE_INT *, bool, HOST_WIDE_INT,
550 const vr_values *);
551
552 struct call_info;
553
554 /* Description of a format directive. A directive is either a plain
555 string or a conversion specification that starts with '%'. */
556
557 struct directive
558 {
559 directive (const call_info *inf, unsigned dno)
560 : info (inf), dirno (dno), argno (), beg (), len (), flags (),
561 width (), prec (), modifier (), specifier (), arg (), fmtfunc ()
562 { }
563
564 /* Reference to the info structure describing the call that this
565 directive is a part of. */
566 const call_info *info;
567
568 /* The 1-based directive number (for debugging). */
569 unsigned dirno;
570
571 /* The zero-based argument number of the directive's argument ARG in
572 the function's argument list. */
573 unsigned argno;
574
575 /* The first character of the directive and its length. */
576 const char *beg;
577 size_t len;
578
579 /* A bitmap of flags, one for each character. */
580 unsigned flags[256 / sizeof (int)];
581
582 /* The range of values of the specified width, or -1 if not specified. */
583 HOST_WIDE_INT width[2];
584 /* The range of values of the specified precision, or -1 if not
585 specified. */
586 HOST_WIDE_INT prec[2];
587
588 /* Length modifier. */
589 format_lengths modifier;
590
591 /* Format specifier character. */
592 char specifier;
593
594 /* The argument of the directive or null when the directive doesn't
595 take one or when none is available (such as for vararg functions). */
596 tree arg;
597
598 /* Format conversion function that given a directive and an argument
599 returns the formatting result. */
600 fmtresult (*fmtfunc) (const directive &, tree, const vr_values *);
601
602 /* Return True when a the format flag CHR has been used. */
603 bool get_flag (char chr) const
604 {
605 unsigned char c = chr & 0xff;
606 return (flags[c / (CHAR_BIT * sizeof *flags)]
607 & (1U << (c % (CHAR_BIT * sizeof *flags))));
608 }
609
610 /* Make a record of the format flag CHR having been used. */
611 void set_flag (char chr)
612 {
613 unsigned char c = chr & 0xff;
614 flags[c / (CHAR_BIT * sizeof *flags)]
615 |= (1U << (c % (CHAR_BIT * sizeof *flags)));
616 }
617
618 /* Reset the format flag CHR. */
619 void clear_flag (char chr)
620 {
621 unsigned char c = chr & 0xff;
622 flags[c / (CHAR_BIT * sizeof *flags)]
623 &= ~(1U << (c % (CHAR_BIT * sizeof *flags)));
624 }
625
626 /* Set both bounds of the width range to VAL. */
627 void set_width (HOST_WIDE_INT val)
628 {
629 width[0] = width[1] = val;
630 }
631
632 /* Set the width range according to ARG, with both bounds being
633 no less than 0. For a constant ARG set both bounds to its value
634 or 0, whichever is greater. For a non-constant ARG in some range
635 set width to its range adjusting each bound to -1 if it's less.
636 For an indeterminate ARG set width to [0, INT_MAX]. */
637 void set_width (tree arg, const vr_values *vr)
638 {
639 get_int_range (arg, width, width + 1, true, 0, vr);
640 }
641
642 /* Set both bounds of the precision range to VAL. */
643 void set_precision (HOST_WIDE_INT val)
644 {
645 prec[0] = prec[1] = val;
646 }
647
648 /* Set the precision range according to ARG, with both bounds being
649 no less than -1. For a constant ARG set both bounds to its value
650 or -1 whichever is greater. For a non-constant ARG in some range
651 set precision to its range adjusting each bound to -1 if it's less.
652 For an indeterminate ARG set precision to [-1, INT_MAX]. */
653 void set_precision (tree arg, const vr_values *vr)
654 {
655 get_int_range (arg, prec, prec + 1, false, -1, vr);
656 }
657
658 /* Return true if both width and precision are known to be
659 either constant or in some range, false otherwise. */
660 bool known_width_and_precision () const
661 {
662 return ((width[1] < 0
663 || (unsigned HOST_WIDE_INT)width[1] <= target_int_max ())
664 && (prec[1] < 0
665 || (unsigned HOST_WIDE_INT)prec[1] < target_int_max ()));
666 }
667 };
668
669 /* The result of a call to a formatted function. */
670
671 struct format_result
672 {
673 format_result ()
674 : range (), aliases (), alias_count (), knownrange (), posunder4k (),
675 floating (), warned () { /* No-op. */ }
676
677 ~format_result ()
678 {
679 XDELETEVEC (aliases);
680 }
681
682 /* Range of characters written by the formatted function.
683 Setting the minimum to HOST_WIDE_INT_MAX disables all
684 length tracking for the remainder of the format string. */
685 result_range range;
686
687 struct alias_info
688 {
689 directive dir; /* The directive that aliases the destination. */
690 HOST_WIDE_INT offset; /* The offset at which it aliases it. */
691 result_range range; /* The raw result of the directive. */
692 };
693
694 /* An array of directives whose pointer argument aliases a part
695 of the destination object of the formatted function. */
696 alias_info *aliases;
697 unsigned alias_count;
698
699 /* True when the range above is obtained from known values of
700 directive arguments, or bounds on the amount of output such
701 as width and precision, and not the result of heuristics that
702 depend on warning levels. It's used to issue stricter diagnostics
703 in cases where strings of unknown lengths are bounded by the arrays
704 they are determined to refer to. KNOWNRANGE must not be used for
705 the return value optimization. */
706 bool knownrange;
707
708 /* True if no individual directive could fail or result in more than
709 4095 bytes of output (the total NUMBER_CHARS_{MIN,MAX} might be
710 greater). Implementations are not required to handle directives
711 that produce more than 4K bytes (leading to undefined behavior)
712 and so when one is found it disables the return value optimization.
713 Similarly, directives that can fail (such as wide character
714 directives) disable the optimization. */
715 bool posunder4k;
716
717 /* True when a floating point directive has been seen in the format
718 string. */
719 bool floating;
720
721 /* True when an intermediate result has caused a warning. Used to
722 avoid issuing duplicate warnings while finishing the processing
723 of a call. WARNED also disables the return value optimization. */
724 bool warned;
725
726 /* Preincrement the number of output characters by 1. */
727 format_result& operator++ ()
728 {
729 return *this += 1;
730 }
731
732 /* Postincrement the number of output characters by 1. */
733 format_result operator++ (int)
734 {
735 format_result prev (*this);
736 *this += 1;
737 return prev;
738 }
739
740 /* Increment the number of output characters by N. */
741 format_result& operator+= (unsigned HOST_WIDE_INT);
742
743 /* Add a directive to the sequence of those with potentially aliasing
744 arguments. */
745 void append_alias (const directive &, HOST_WIDE_INT, const result_range &);
746
747 private:
748 /* Not copyable or assignable. */
749 format_result (format_result&);
750 void operator= (format_result&);
751 };
752
753 format_result&
754 format_result::operator+= (unsigned HOST_WIDE_INT n)
755 {
756 gcc_assert (n < HOST_WIDE_INT_MAX);
757
758 if (range.min < HOST_WIDE_INT_MAX)
759 range.min += n;
760
761 if (range.max < HOST_WIDE_INT_MAX)
762 range.max += n;
763
764 if (range.likely < HOST_WIDE_INT_MAX)
765 range.likely += n;
766
767 if (range.unlikely < HOST_WIDE_INT_MAX)
768 range.unlikely += n;
769
770 return *this;
771 }
772
773 void
774 format_result::append_alias (const directive &d, HOST_WIDE_INT off,
775 const result_range &resrng)
776 {
777 unsigned cnt = alias_count + 1;
778 alias_info *ar = XNEWVEC (alias_info, cnt);
779
780 for (unsigned i = 0; i != alias_count; ++i)
781 ar[i] = aliases[i];
782
783 ar[alias_count].dir = d;
784 ar[alias_count].offset = off;
785 ar[alias_count].range = resrng;
786
787 XDELETEVEC (aliases);
788
789 alias_count = cnt;
790 aliases = ar;
791 }
792
793 /* Return the logarithm of X in BASE. */
794
795 static int
796 ilog (unsigned HOST_WIDE_INT x, int base)
797 {
798 int res = 0;
799 do
800 {
801 ++res;
802 x /= base;
803 } while (x);
804 return res;
805 }
806
807 /* Return the number of bytes resulting from converting into a string
808 the INTEGER_CST tree node X in BASE with a minimum of PREC digits.
809 PLUS indicates whether 1 for a plus sign should be added for positive
810 numbers, and PREFIX whether the length of an octal ('O') or hexadecimal
811 ('0x') prefix should be added for nonzero numbers. Return -1 if X cannot
812 be represented. */
813
814 static HOST_WIDE_INT
815 tree_digits (tree x, int base, HOST_WIDE_INT prec, bool plus, bool prefix)
816 {
817 unsigned HOST_WIDE_INT absval;
818
819 HOST_WIDE_INT res;
820
821 if (TYPE_UNSIGNED (TREE_TYPE (x)))
822 {
823 if (tree_fits_uhwi_p (x))
824 {
825 absval = tree_to_uhwi (x);
826 res = plus;
827 }
828 else
829 return -1;
830 }
831 else
832 {
833 if (tree_fits_shwi_p (x))
834 {
835 HOST_WIDE_INT i = tree_to_shwi (x);
836 if (HOST_WIDE_INT_MIN == i)
837 {
838 /* Avoid undefined behavior due to negating a minimum. */
839 absval = HOST_WIDE_INT_MAX;
840 res = 1;
841 }
842 else if (i < 0)
843 {
844 absval = -i;
845 res = 1;
846 }
847 else
848 {
849 absval = i;
850 res = plus;
851 }
852 }
853 else
854 return -1;
855 }
856
857 int ndigs = ilog (absval, base);
858
859 res += prec < ndigs ? ndigs : prec;
860
861 /* Adjust a non-zero value for the base prefix, either hexadecimal,
862 or, unless precision has resulted in a leading zero, also octal. */
863 if (prefix && absval && (base == 16 || prec <= ndigs))
864 {
865 if (base == 8)
866 res += 1;
867 else if (base == 16)
868 res += 2;
869 }
870
871 return res;
872 }
873
874 /* Description of a call to a formatted function. */
875
876 struct call_info
877 {
878 /* Function call statement. */
879 gimple *callstmt;
880
881 /* Function called. */
882 tree func;
883
884 /* Called built-in function code. */
885 built_in_function fncode;
886
887 /* The "origin" of the destination pointer argument, which is either
888 the DECL of the destination buffer being written into or a pointer
889 that points to it, plus some offset. */
890 tree dst_origin;
891
892 /* For a destination pointing to a struct array member, the offset of
893 the member. */
894 HOST_WIDE_INT dst_field;
895
896 /* The offset into the destination buffer. */
897 HOST_WIDE_INT dst_offset;
898
899 /* Format argument and format string extracted from it. */
900 tree format;
901 const char *fmtstr;
902
903 /* The location of the format argument. */
904 location_t fmtloc;
905
906 /* The destination object size for __builtin___xxx_chk functions
907 typically determined by __builtin_object_size, or -1 if unknown. */
908 unsigned HOST_WIDE_INT objsize;
909
910 /* Number of the first variable argument. */
911 unsigned HOST_WIDE_INT argidx;
912
913 /* True for functions like snprintf that specify the size of
914 the destination, false for others like sprintf that don't. */
915 bool bounded;
916
917 /* True for bounded functions like snprintf that specify a zero-size
918 buffer as a request to compute the size of output without actually
919 writing any. NOWRITE is cleared in response to the %n directive
920 which has side-effects similar to writing output. */
921 bool nowrite;
922
923 /* Return true if the called function's return value is used. */
924 bool retval_used () const
925 {
926 return gimple_get_lhs (callstmt);
927 }
928
929 /* Return the warning option corresponding to the called function. */
930 int warnopt () const
931 {
932 return bounded ? OPT_Wformat_truncation_ : OPT_Wformat_overflow_;
933 }
934
935 /* Return true for calls to file formatted functions. */
936 bool is_file_func () const
937 {
938 return (fncode == BUILT_IN_FPRINTF
939 || fncode == BUILT_IN_FPRINTF_CHK
940 || fncode == BUILT_IN_FPRINTF_UNLOCKED
941 || fncode == BUILT_IN_VFPRINTF
942 || fncode == BUILT_IN_VFPRINTF_CHK);
943 }
944
945 /* Return true for calls to string formatted functions. */
946 bool is_string_func () const
947 {
948 return (fncode == BUILT_IN_SPRINTF
949 || fncode == BUILT_IN_SPRINTF_CHK
950 || fncode == BUILT_IN_SNPRINTF
951 || fncode == BUILT_IN_SNPRINTF_CHK
952 || fncode == BUILT_IN_VSPRINTF
953 || fncode == BUILT_IN_VSPRINTF_CHK
954 || fncode == BUILT_IN_VSNPRINTF
955 || fncode == BUILT_IN_VSNPRINTF_CHK);
956 }
957 };
958
959 /* Return the result of formatting a no-op directive (such as '%n'). */
960
961 static fmtresult
962 format_none (const directive &, tree, const vr_values *)
963 {
964 fmtresult res (0);
965 return res;
966 }
967
968 /* Return the result of formatting the '%%' directive. */
969
970 static fmtresult
971 format_percent (const directive &, tree, const vr_values *)
972 {
973 fmtresult res (1);
974 return res;
975 }
976
977
978 /* Compute intmax_type_node and uintmax_type_node similarly to how
979 tree.c builds size_type_node. */
980
981 static void
982 build_intmax_type_nodes (tree *pintmax, tree *puintmax)
983 {
984 if (strcmp (UINTMAX_TYPE, "unsigned int") == 0)
985 {
986 *pintmax = integer_type_node;
987 *puintmax = unsigned_type_node;
988 }
989 else if (strcmp (UINTMAX_TYPE, "long unsigned int") == 0)
990 {
991 *pintmax = long_integer_type_node;
992 *puintmax = long_unsigned_type_node;
993 }
994 else if (strcmp (UINTMAX_TYPE, "long long unsigned int") == 0)
995 {
996 *pintmax = long_long_integer_type_node;
997 *puintmax = long_long_unsigned_type_node;
998 }
999 else
1000 {
1001 for (int i = 0; i < NUM_INT_N_ENTS; i++)
1002 if (int_n_enabled_p[i])
1003 {
1004 char name[50], altname[50];
1005 sprintf (name, "__int%d unsigned", int_n_data[i].bitsize);
1006 sprintf (altname, "__int%d__ unsigned", int_n_data[i].bitsize);
1007
1008 if (strcmp (name, UINTMAX_TYPE) == 0
1009 || strcmp (altname, UINTMAX_TYPE) == 0)
1010 {
1011 *pintmax = int_n_trees[i].signed_type;
1012 *puintmax = int_n_trees[i].unsigned_type;
1013 return;
1014 }
1015 }
1016 gcc_unreachable ();
1017 }
1018 }
1019
1020 /* Determine the range [*PMIN, *PMAX] that the expression ARG is
1021 in and that is representable in type int.
1022 Return true when the range is a subrange of that of int.
1023 When ARG is null it is as if it had the full range of int.
1024 When ABSOLUTE is true the range reflects the absolute value of
1025 the argument. When ABSOLUTE is false, negative bounds of
1026 the determined range are replaced with NEGBOUND. */
1027
1028 static bool
1029 get_int_range (tree arg, HOST_WIDE_INT *pmin, HOST_WIDE_INT *pmax,
1030 bool absolute, HOST_WIDE_INT negbound,
1031 const class vr_values *vr_values)
1032 {
1033 /* The type of the result. */
1034 const_tree type = integer_type_node;
1035
1036 bool knownrange = false;
1037
1038 if (!arg)
1039 {
1040 *pmin = tree_to_shwi (TYPE_MIN_VALUE (type));
1041 *pmax = tree_to_shwi (TYPE_MAX_VALUE (type));
1042 }
1043 else if (TREE_CODE (arg) == INTEGER_CST
1044 && TYPE_PRECISION (TREE_TYPE (arg)) <= TYPE_PRECISION (type))
1045 {
1046 /* For a constant argument return its value adjusted as specified
1047 by NEGATIVE and NEGBOUND and return true to indicate that the
1048 result is known. */
1049 *pmin = tree_fits_shwi_p (arg) ? tree_to_shwi (arg) : tree_to_uhwi (arg);
1050 *pmax = *pmin;
1051 knownrange = true;
1052 }
1053 else
1054 {
1055 /* True if the argument's range cannot be determined. */
1056 bool unknown = true;
1057
1058 tree argtype = TREE_TYPE (arg);
1059
1060 /* Ignore invalid arguments with greater precision that that
1061 of the expected type (e.g., in sprintf("%*i", 12LL, i)).
1062 They will have been detected and diagnosed by -Wformat and
1063 so it's not important to complicate this code to try to deal
1064 with them again. */
1065 if (TREE_CODE (arg) == SSA_NAME
1066 && INTEGRAL_TYPE_P (argtype)
1067 && TYPE_PRECISION (argtype) <= TYPE_PRECISION (type))
1068 {
1069 /* Try to determine the range of values of the integer argument. */
1070 const value_range_equiv *vr
1071 = CONST_CAST (class vr_values *, vr_values)->get_value_range (arg);
1072
1073 if (range_int_cst_p (vr))
1074 {
1075 HOST_WIDE_INT type_min
1076 = (TYPE_UNSIGNED (argtype)
1077 ? tree_to_uhwi (TYPE_MIN_VALUE (argtype))
1078 : tree_to_shwi (TYPE_MIN_VALUE (argtype)));
1079
1080 HOST_WIDE_INT type_max = tree_to_uhwi (TYPE_MAX_VALUE (argtype));
1081
1082 *pmin = TREE_INT_CST_LOW (vr->min ());
1083 *pmax = TREE_INT_CST_LOW (vr->max ());
1084
1085 if (*pmin < *pmax)
1086 {
1087 /* Return true if the adjusted range is a subrange of
1088 the full range of the argument's type. *PMAX may
1089 be less than *PMIN when the argument is unsigned
1090 and its upper bound is in excess of TYPE_MAX. In
1091 that (invalid) case disregard the range and use that
1092 of the expected type instead. */
1093 knownrange = type_min < *pmin || *pmax < type_max;
1094
1095 unknown = false;
1096 }
1097 }
1098 }
1099
1100 /* Handle an argument with an unknown range as if none had been
1101 provided. */
1102 if (unknown)
1103 return get_int_range (NULL_TREE, pmin, pmax, absolute,
1104 negbound, vr_values);
1105 }
1106
1107 /* Adjust each bound as specified by ABSOLUTE and NEGBOUND. */
1108 if (absolute)
1109 {
1110 if (*pmin < 0)
1111 {
1112 if (*pmin == *pmax)
1113 *pmin = *pmax = -*pmin;
1114 else
1115 {
1116 /* Make sure signed overlow is avoided. */
1117 gcc_assert (*pmin != HOST_WIDE_INT_MIN);
1118
1119 HOST_WIDE_INT tmp = -*pmin;
1120 *pmin = 0;
1121 if (*pmax < tmp)
1122 *pmax = tmp;
1123 }
1124 }
1125 }
1126 else if (*pmin < negbound)
1127 *pmin = negbound;
1128
1129 return knownrange;
1130 }
1131
1132 /* With the range [*ARGMIN, *ARGMAX] of an integer directive's actual
1133 argument, due to the conversion from either *ARGMIN or *ARGMAX to
1134 the type of the directive's formal argument it's possible for both
1135 to result in the same number of bytes or a range of bytes that's
1136 less than the number of bytes that would result from formatting
1137 some other value in the range [*ARGMIN, *ARGMAX]. This can be
1138 determined by checking for the actual argument being in the range
1139 of the type of the directive. If it isn't it must be assumed to
1140 take on the full range of the directive's type.
1141 Return true when the range has been adjusted to the full range
1142 of DIRTYPE, and false otherwise. */
1143
1144 static bool
1145 adjust_range_for_overflow (tree dirtype, tree *argmin, tree *argmax)
1146 {
1147 tree argtype = TREE_TYPE (*argmin);
1148 unsigned argprec = TYPE_PRECISION (argtype);
1149 unsigned dirprec = TYPE_PRECISION (dirtype);
1150
1151 /* If the actual argument and the directive's argument have the same
1152 precision and sign there can be no overflow and so there is nothing
1153 to adjust. */
1154 if (argprec == dirprec && TYPE_SIGN (argtype) == TYPE_SIGN (dirtype))
1155 return false;
1156
1157 /* The logic below was inspired/lifted from the CONVERT_EXPR_CODE_P
1158 branch in the extract_range_from_unary_expr function in tree-vrp.c. */
1159
1160 if (TREE_CODE (*argmin) == INTEGER_CST
1161 && TREE_CODE (*argmax) == INTEGER_CST
1162 && (dirprec >= argprec
1163 || integer_zerop (int_const_binop (RSHIFT_EXPR,
1164 int_const_binop (MINUS_EXPR,
1165 *argmax,
1166 *argmin),
1167 size_int (dirprec)))))
1168 {
1169 *argmin = force_fit_type (dirtype, wi::to_widest (*argmin), 0, false);
1170 *argmax = force_fit_type (dirtype, wi::to_widest (*argmax), 0, false);
1171
1172 /* If *ARGMIN is still less than *ARGMAX the conversion above
1173 is safe. Otherwise, it has overflowed and would be unsafe. */
1174 if (tree_int_cst_le (*argmin, *argmax))
1175 return false;
1176 }
1177
1178 *argmin = TYPE_MIN_VALUE (dirtype);
1179 *argmax = TYPE_MAX_VALUE (dirtype);
1180 return true;
1181 }
1182
1183 /* Return a range representing the minimum and maximum number of bytes
1184 that the format directive DIR will output for any argument given
1185 the WIDTH and PRECISION (extracted from DIR). This function is
1186 used when the directive argument or its value isn't known. */
1187
1188 static fmtresult
1189 format_integer (const directive &dir, tree arg, const vr_values *vr_values)
1190 {
1191 tree intmax_type_node;
1192 tree uintmax_type_node;
1193
1194 /* Base to format the number in. */
1195 int base;
1196
1197 /* True when a conversion is preceded by a prefix indicating the base
1198 of the argument (octal or hexadecimal). */
1199 bool maybebase = dir.get_flag ('#');
1200
1201 /* True when a signed conversion is preceded by a sign or space. */
1202 bool maybesign = false;
1203
1204 /* True for signed conversions (i.e., 'd' and 'i'). */
1205 bool sign = false;
1206
1207 switch (dir.specifier)
1208 {
1209 case 'd':
1210 case 'i':
1211 /* Space and '+' are only meaningful for signed conversions. */
1212 maybesign = dir.get_flag (' ') | dir.get_flag ('+');
1213 sign = true;
1214 base = 10;
1215 break;
1216 case 'u':
1217 base = 10;
1218 break;
1219 case 'o':
1220 base = 8;
1221 break;
1222 case 'X':
1223 case 'x':
1224 base = 16;
1225 break;
1226 default:
1227 gcc_unreachable ();
1228 }
1229
1230 /* The type of the "formal" argument expected by the directive. */
1231 tree dirtype = NULL_TREE;
1232
1233 /* Determine the expected type of the argument from the length
1234 modifier. */
1235 switch (dir.modifier)
1236 {
1237 case FMT_LEN_none:
1238 if (dir.specifier == 'p')
1239 dirtype = ptr_type_node;
1240 else
1241 dirtype = sign ? integer_type_node : unsigned_type_node;
1242 break;
1243
1244 case FMT_LEN_h:
1245 dirtype = sign ? short_integer_type_node : short_unsigned_type_node;
1246 break;
1247
1248 case FMT_LEN_hh:
1249 dirtype = sign ? signed_char_type_node : unsigned_char_type_node;
1250 break;
1251
1252 case FMT_LEN_l:
1253 dirtype = sign ? long_integer_type_node : long_unsigned_type_node;
1254 break;
1255
1256 case FMT_LEN_L:
1257 case FMT_LEN_ll:
1258 dirtype = (sign
1259 ? long_long_integer_type_node
1260 : long_long_unsigned_type_node);
1261 break;
1262
1263 case FMT_LEN_z:
1264 dirtype = signed_or_unsigned_type_for (!sign, size_type_node);
1265 break;
1266
1267 case FMT_LEN_t:
1268 dirtype = signed_or_unsigned_type_for (!sign, ptrdiff_type_node);
1269 break;
1270
1271 case FMT_LEN_j:
1272 build_intmax_type_nodes (&intmax_type_node, &uintmax_type_node);
1273 dirtype = sign ? intmax_type_node : uintmax_type_node;
1274 break;
1275
1276 default:
1277 return fmtresult ();
1278 }
1279
1280 /* The type of the argument to the directive, either deduced from
1281 the actual non-constant argument if one is known, or from
1282 the directive itself when none has been provided because it's
1283 a va_list. */
1284 tree argtype = NULL_TREE;
1285
1286 if (!arg)
1287 {
1288 /* When the argument has not been provided, use the type of
1289 the directive's argument as an approximation. This will
1290 result in false positives for directives like %i with
1291 arguments with smaller precision (such as short or char). */
1292 argtype = dirtype;
1293 }
1294 else if (TREE_CODE (arg) == INTEGER_CST)
1295 {
1296 /* When a constant argument has been provided use its value
1297 rather than type to determine the length of the output. */
1298 fmtresult res;
1299
1300 if ((dir.prec[0] <= 0 && dir.prec[1] >= 0) && integer_zerop (arg))
1301 {
1302 /* As a special case, a precision of zero with a zero argument
1303 results in zero bytes except in base 8 when the '#' flag is
1304 specified, and for signed conversions in base 8 and 10 when
1305 either the space or '+' flag has been specified and it results
1306 in just one byte (with width having the normal effect). This
1307 must extend to the case of a specified precision with
1308 an unknown value because it can be zero. */
1309 res.range.min = ((base == 8 && dir.get_flag ('#')) || maybesign);
1310 if (res.range.min == 0 && dir.prec[0] != dir.prec[1])
1311 {
1312 res.range.max = 1;
1313 res.range.likely = 1;
1314 }
1315 else
1316 {
1317 res.range.max = res.range.min;
1318 res.range.likely = res.range.min;
1319 }
1320 }
1321 else
1322 {
1323 /* Convert the argument to the type of the directive. */
1324 arg = fold_convert (dirtype, arg);
1325
1326 res.range.min = tree_digits (arg, base, dir.prec[0],
1327 maybesign, maybebase);
1328 if (dir.prec[0] == dir.prec[1])
1329 res.range.max = res.range.min;
1330 else
1331 res.range.max = tree_digits (arg, base, dir.prec[1],
1332 maybesign, maybebase);
1333 res.range.likely = res.range.min;
1334 res.knownrange = true;
1335 }
1336
1337 res.range.unlikely = res.range.max;
1338
1339 /* Bump up the counters if WIDTH is greater than LEN. */
1340 res.adjust_for_width_or_precision (dir.width, dirtype, base,
1341 (sign | maybebase) + (base == 16));
1342 /* Bump up the counters again if PRECision is greater still. */
1343 res.adjust_for_width_or_precision (dir.prec, dirtype, base,
1344 (sign | maybebase) + (base == 16));
1345
1346 return res;
1347 }
1348 else if (INTEGRAL_TYPE_P (TREE_TYPE (arg))
1349 || TREE_CODE (TREE_TYPE (arg)) == POINTER_TYPE)
1350 /* Determine the type of the provided non-constant argument. */
1351 argtype = TREE_TYPE (arg);
1352 else
1353 /* Don't bother with invalid arguments since they likely would
1354 have already been diagnosed, and disable any further checking
1355 of the format string by returning [-1, -1]. */
1356 return fmtresult ();
1357
1358 fmtresult res;
1359
1360 /* Using either the range the non-constant argument is in, or its
1361 type (either "formal" or actual), create a range of values that
1362 constrain the length of output given the warning level. */
1363 tree argmin = NULL_TREE;
1364 tree argmax = NULL_TREE;
1365
1366 if (arg
1367 && TREE_CODE (arg) == SSA_NAME
1368 && INTEGRAL_TYPE_P (argtype))
1369 {
1370 /* Try to determine the range of values of the integer argument
1371 (range information is not available for pointers). */
1372 const value_range_equiv *vr
1373 = CONST_CAST (class vr_values *, vr_values)->get_value_range (arg);
1374
1375 if (range_int_cst_p (vr))
1376 {
1377 argmin = vr->min ();
1378 argmax = vr->max ();
1379
1380 /* Set KNOWNRANGE if the argument is in a known subrange
1381 of the directive's type and neither width nor precision
1382 is unknown. (KNOWNRANGE may be reset below). */
1383 res.knownrange
1384 = ((!tree_int_cst_equal (TYPE_MIN_VALUE (dirtype), argmin)
1385 || !tree_int_cst_equal (TYPE_MAX_VALUE (dirtype), argmax))
1386 && dir.known_width_and_precision ());
1387
1388 res.argmin = argmin;
1389 res.argmax = argmax;
1390 }
1391 else if (vr->kind () == VR_ANTI_RANGE)
1392 {
1393 /* Handle anti-ranges if/when bug 71690 is resolved. */
1394 }
1395 else if (vr->varying_p () || vr->undefined_p ())
1396 {
1397 /* The argument here may be the result of promoting the actual
1398 argument to int. Try to determine the type of the actual
1399 argument before promotion and narrow down its range that
1400 way. */
1401 gimple *def = SSA_NAME_DEF_STMT (arg);
1402 if (is_gimple_assign (def))
1403 {
1404 tree_code code = gimple_assign_rhs_code (def);
1405 if (code == INTEGER_CST)
1406 {
1407 arg = gimple_assign_rhs1 (def);
1408 return format_integer (dir, arg, vr_values);
1409 }
1410
1411 if (code == NOP_EXPR)
1412 {
1413 tree type = TREE_TYPE (gimple_assign_rhs1 (def));
1414 if (INTEGRAL_TYPE_P (type)
1415 || TREE_CODE (type) == POINTER_TYPE)
1416 argtype = type;
1417 }
1418 }
1419 }
1420 }
1421
1422 if (!argmin)
1423 {
1424 if (TREE_CODE (argtype) == POINTER_TYPE)
1425 {
1426 argmin = build_int_cst (pointer_sized_int_node, 0);
1427 argmax = build_all_ones_cst (pointer_sized_int_node);
1428 }
1429 else
1430 {
1431 argmin = TYPE_MIN_VALUE (argtype);
1432 argmax = TYPE_MAX_VALUE (argtype);
1433 }
1434 }
1435
1436 /* Clear KNOWNRANGE if the range has been adjusted to the maximum
1437 of the directive. If it has been cleared then since ARGMIN and/or
1438 ARGMAX have been adjusted also adjust the corresponding ARGMIN and
1439 ARGMAX in the result to include in diagnostics. */
1440 if (adjust_range_for_overflow (dirtype, &argmin, &argmax))
1441 {
1442 res.knownrange = false;
1443 res.argmin = argmin;
1444 res.argmax = argmax;
1445 }
1446
1447 /* Recursively compute the minimum and maximum from the known range. */
1448 if (TYPE_UNSIGNED (dirtype) || tree_int_cst_sgn (argmin) >= 0)
1449 {
1450 /* For unsigned conversions/directives or signed when
1451 the minimum is positive, use the minimum and maximum to compute
1452 the shortest and longest output, respectively. */
1453 res.range.min = format_integer (dir, argmin, vr_values).range.min;
1454 res.range.max = format_integer (dir, argmax, vr_values).range.max;
1455 }
1456 else if (tree_int_cst_sgn (argmax) < 0)
1457 {
1458 /* For signed conversions/directives if maximum is negative,
1459 use the minimum as the longest output and maximum as the
1460 shortest output. */
1461 res.range.min = format_integer (dir, argmax, vr_values).range.min;
1462 res.range.max = format_integer (dir, argmin, vr_values).range.max;
1463 }
1464 else
1465 {
1466 /* Otherwise, 0 is inside of the range and minimum negative. Use 0
1467 as the shortest output and for the longest output compute the
1468 length of the output of both minimum and maximum and pick the
1469 longer. */
1470 unsigned HOST_WIDE_INT max1
1471 = format_integer (dir, argmin, vr_values).range.max;
1472 unsigned HOST_WIDE_INT max2
1473 = format_integer (dir, argmax, vr_values).range.max;
1474 res.range.min
1475 = format_integer (dir, integer_zero_node, vr_values).range.min;
1476 res.range.max = MAX (max1, max2);
1477 }
1478
1479 /* If the range is known, use the maximum as the likely length. */
1480 if (res.knownrange)
1481 res.range.likely = res.range.max;
1482 else
1483 {
1484 /* Otherwise, use the minimum. Except for the case where for %#x or
1485 %#o the minimum is just for a single value in the range (0) and
1486 for all other values it is something longer, like 0x1 or 01.
1487 Use the length for value 1 in that case instead as the likely
1488 length. */
1489 res.range.likely = res.range.min;
1490 if (maybebase
1491 && base != 10
1492 && (tree_int_cst_sgn (argmin) < 0 || tree_int_cst_sgn (argmax) > 0))
1493 {
1494 if (res.range.min == 1)
1495 res.range.likely += base == 8 ? 1 : 2;
1496 else if (res.range.min == 2
1497 && base == 16
1498 && (dir.width[0] == 2 || dir.prec[0] == 2))
1499 ++res.range.likely;
1500 }
1501 }
1502
1503 res.range.unlikely = res.range.max;
1504 res.adjust_for_width_or_precision (dir.width, dirtype, base,
1505 (sign | maybebase) + (base == 16));
1506 res.adjust_for_width_or_precision (dir.prec, dirtype, base,
1507 (sign | maybebase) + (base == 16));
1508
1509 return res;
1510 }
1511
1512 /* Return the number of bytes that a format directive consisting of FLAGS,
1513 PRECision, format SPECification, and MPFR rounding specifier RNDSPEC,
1514 would result for argument X under ideal conditions (i.e., if PREC
1515 weren't excessive). MPFR 3.1 allocates large amounts of memory for
1516 values of PREC with large magnitude and can fail (see MPFR bug #21056).
1517 This function works around those problems. */
1518
1519 static unsigned HOST_WIDE_INT
1520 get_mpfr_format_length (mpfr_ptr x, const char *flags, HOST_WIDE_INT prec,
1521 char spec, char rndspec)
1522 {
1523 char fmtstr[40];
1524
1525 HOST_WIDE_INT len = strlen (flags);
1526
1527 fmtstr[0] = '%';
1528 memcpy (fmtstr + 1, flags, len);
1529 memcpy (fmtstr + 1 + len, ".*R", 3);
1530 fmtstr[len + 4] = rndspec;
1531 fmtstr[len + 5] = spec;
1532 fmtstr[len + 6] = '\0';
1533
1534 spec = TOUPPER (spec);
1535 if (spec == 'E' || spec == 'F')
1536 {
1537 /* For %e, specify the precision explicitly since mpfr_sprintf
1538 does its own thing just to be different (see MPFR bug 21088). */
1539 if (prec < 0)
1540 prec = 6;
1541 }
1542 else
1543 {
1544 /* Avoid passing negative precisions with larger magnitude to MPFR
1545 to avoid exposing its bugs. (A negative precision is supposed
1546 to be ignored.) */
1547 if (prec < 0)
1548 prec = -1;
1549 }
1550
1551 HOST_WIDE_INT p = prec;
1552
1553 if (spec == 'G' && !strchr (flags, '#'))
1554 {
1555 /* For G/g without the pound flag, precision gives the maximum number
1556 of significant digits which is bounded by LDBL_MAX_10_EXP, or, for
1557 a 128 bit IEEE extended precision, 4932. Using twice as much here
1558 should be more than sufficient for any real format. */
1559 if ((IEEE_MAX_10_EXP * 2) < prec)
1560 prec = IEEE_MAX_10_EXP * 2;
1561 p = prec;
1562 }
1563 else
1564 {
1565 /* Cap precision arbitrarily at 1KB and add the difference
1566 (if any) to the MPFR result. */
1567 if (prec > 1024)
1568 p = 1024;
1569 }
1570
1571 len = mpfr_snprintf (NULL, 0, fmtstr, (int)p, x);
1572
1573 /* Handle the unlikely (impossible?) error by returning more than
1574 the maximum dictated by the function's return type. */
1575 if (len < 0)
1576 return target_dir_max () + 1;
1577
1578 /* Adjust the return value by the difference. */
1579 if (p < prec)
1580 len += prec - p;
1581
1582 return len;
1583 }
1584
1585 /* Return the number of bytes to format using the format specifier
1586 SPEC and the precision PREC the largest value in the real floating
1587 TYPE. */
1588
1589 static unsigned HOST_WIDE_INT
1590 format_floating_max (tree type, char spec, HOST_WIDE_INT prec)
1591 {
1592 machine_mode mode = TYPE_MODE (type);
1593
1594 /* IBM Extended mode. */
1595 if (MODE_COMPOSITE_P (mode))
1596 mode = DFmode;
1597
1598 /* Get the real type format desription for the target. */
1599 const real_format *rfmt = REAL_MODE_FORMAT (mode);
1600 REAL_VALUE_TYPE rv;
1601
1602 real_maxval (&rv, 0, mode);
1603
1604 /* Convert the GCC real value representation with the precision
1605 of the real type to the mpfr_t format with the GCC default
1606 round-to-nearest mode. */
1607 mpfr_t x;
1608 mpfr_init2 (x, rfmt->p);
1609 mpfr_from_real (x, &rv, MPFR_RNDN);
1610
1611 /* Return a value one greater to account for the leading minus sign. */
1612 unsigned HOST_WIDE_INT r
1613 = 1 + get_mpfr_format_length (x, "", prec, spec, 'D');
1614 mpfr_clear (x);
1615 return r;
1616 }
1617
1618 /* Return a range representing the minimum and maximum number of bytes
1619 that the directive DIR will output for any argument. PREC gives
1620 the adjusted precision range to account for negative precisions
1621 meaning the default 6. This function is used when the directive
1622 argument or its value isn't known. */
1623
1624 static fmtresult
1625 format_floating (const directive &dir, const HOST_WIDE_INT prec[2])
1626 {
1627 tree type;
1628
1629 switch (dir.modifier)
1630 {
1631 case FMT_LEN_l:
1632 case FMT_LEN_none:
1633 type = double_type_node;
1634 break;
1635
1636 case FMT_LEN_L:
1637 type = long_double_type_node;
1638 break;
1639
1640 case FMT_LEN_ll:
1641 type = long_double_type_node;
1642 break;
1643
1644 default:
1645 return fmtresult ();
1646 }
1647
1648 /* The minimum and maximum number of bytes produced by the directive. */
1649 fmtresult res;
1650
1651 /* The minimum output as determined by flags. It's always at least 1.
1652 When plus or space are set the output is preceded by either a sign
1653 or a space. */
1654 unsigned flagmin = (1 /* for the first digit */
1655 + (dir.get_flag ('+') | dir.get_flag (' ')));
1656
1657 /* The minimum is 3 for "inf" and "nan" for all specifiers, plus 1
1658 for the plus sign/space with the '+' and ' ' flags, respectively,
1659 unless reduced below. */
1660 res.range.min = 2 + flagmin;
1661
1662 /* When the pound flag is set the decimal point is included in output
1663 regardless of precision. Whether or not a decimal point is included
1664 otherwise depends on the specification and precision. */
1665 bool radix = dir.get_flag ('#');
1666
1667 switch (dir.specifier)
1668 {
1669 case 'A':
1670 case 'a':
1671 {
1672 HOST_WIDE_INT minprec = 6 + !radix /* decimal point */;
1673 if (dir.prec[0] <= 0)
1674 minprec = 0;
1675 else if (dir.prec[0] > 0)
1676 minprec = dir.prec[0] + !radix /* decimal point */;
1677
1678 res.range.likely = (2 /* 0x */
1679 + flagmin
1680 + radix
1681 + minprec
1682 + 3 /* p+0 */);
1683
1684 res.range.max = format_floating_max (type, 'a', prec[1]);
1685
1686 /* The unlikely maximum accounts for the longest multibyte
1687 decimal point character. */
1688 res.range.unlikely = res.range.max;
1689 if (dir.prec[1] > 0)
1690 res.range.unlikely += target_mb_len_max () - 1;
1691
1692 break;
1693 }
1694
1695 case 'E':
1696 case 'e':
1697 {
1698 /* Minimum output attributable to precision and, when it's
1699 non-zero, decimal point. */
1700 HOST_WIDE_INT minprec = prec[0] ? prec[0] + !radix : 0;
1701
1702 /* The likely minimum output is "[-+]1.234567e+00" regardless
1703 of the value of the actual argument. */
1704 res.range.likely = (flagmin
1705 + radix
1706 + minprec
1707 + 2 /* e+ */ + 2);
1708
1709 res.range.max = format_floating_max (type, 'e', prec[1]);
1710
1711 /* The unlikely maximum accounts for the longest multibyte
1712 decimal point character. */
1713 if (dir.prec[0] != dir.prec[1]
1714 || dir.prec[0] == -1 || dir.prec[0] > 0)
1715 res.range.unlikely = res.range.max + target_mb_len_max () -1;
1716 else
1717 res.range.unlikely = res.range.max;
1718 break;
1719 }
1720
1721 case 'F':
1722 case 'f':
1723 {
1724 /* Minimum output attributable to precision and, when it's non-zero,
1725 decimal point. */
1726 HOST_WIDE_INT minprec = prec[0] ? prec[0] + !radix : 0;
1727
1728 /* For finite numbers (i.e., not infinity or NaN) the lower bound
1729 when precision isn't specified is 8 bytes ("1.23456" since
1730 precision is taken to be 6). When precision is zero, the lower
1731 bound is 1 byte (e.g., "1"). Otherwise, when precision is greater
1732 than zero, then the lower bound is 2 plus precision (plus flags).
1733 But in all cases, the lower bound is no greater than 3. */
1734 unsigned HOST_WIDE_INT min = flagmin + radix + minprec;
1735 if (min < res.range.min)
1736 res.range.min = min;
1737
1738 /* Compute the upper bound for -TYPE_MAX. */
1739 res.range.max = format_floating_max (type, 'f', prec[1]);
1740
1741 /* The minimum output with unknown precision is a single byte
1742 (e.g., "0") but the more likely output is 3 bytes ("0.0"). */
1743 if (dir.prec[0] < 0 && dir.prec[1] > 0)
1744 res.range.likely = 3;
1745 else
1746 res.range.likely = min;
1747
1748 /* The unlikely maximum accounts for the longest multibyte
1749 decimal point character. */
1750 if (dir.prec[0] != dir.prec[1]
1751 || dir.prec[0] == -1 || dir.prec[0] > 0)
1752 res.range.unlikely = res.range.max + target_mb_len_max () - 1;
1753 break;
1754 }
1755
1756 case 'G':
1757 case 'g':
1758 {
1759 /* The %g output depends on precision and the exponent of
1760 the argument. Since the value of the argument isn't known
1761 the lower bound on the range of bytes (not counting flags
1762 or width) is 1 plus radix (i.e., either "0" or "0." for
1763 "%g" and "%#g", respectively, with a zero argument). */
1764 unsigned HOST_WIDE_INT min = flagmin + radix;
1765 if (min < res.range.min)
1766 res.range.min = min;
1767
1768 char spec = 'g';
1769 HOST_WIDE_INT maxprec = dir.prec[1];
1770 if (radix && maxprec)
1771 {
1772 /* When the pound flag (radix) is set, trailing zeros aren't
1773 trimmed and so the longest output is the same as for %e,
1774 except with precision minus 1 (as specified in C11). */
1775 spec = 'e';
1776 if (maxprec > 0)
1777 --maxprec;
1778 else if (maxprec < 0)
1779 maxprec = 5;
1780 }
1781 else
1782 maxprec = prec[1];
1783
1784 res.range.max = format_floating_max (type, spec, maxprec);
1785
1786 /* The likely output is either the maximum computed above
1787 minus 1 (assuming the maximum is positive) when precision
1788 is known (or unspecified), or the same minimum as for %e
1789 (which is computed for a non-negative argument). Unlike
1790 for the other specifiers above the likely output isn't
1791 the minimum because for %g that's 1 which is unlikely. */
1792 if (dir.prec[1] < 0
1793 || (unsigned HOST_WIDE_INT)dir.prec[1] < target_int_max ())
1794 res.range.likely = res.range.max - 1;
1795 else
1796 {
1797 HOST_WIDE_INT minprec = 6 + !radix /* decimal point */;
1798 res.range.likely = (flagmin
1799 + radix
1800 + minprec
1801 + 2 /* e+ */ + 2);
1802 }
1803
1804 /* The unlikely maximum accounts for the longest multibyte
1805 decimal point character. */
1806 res.range.unlikely = res.range.max + target_mb_len_max () - 1;
1807 break;
1808 }
1809
1810 default:
1811 return fmtresult ();
1812 }
1813
1814 /* Bump up the byte counters if WIDTH is greater. */
1815 res.adjust_for_width_or_precision (dir.width);
1816 return res;
1817 }
1818
1819 /* Return a range representing the minimum and maximum number of bytes
1820 that the directive DIR will write on output for the floating argument
1821 ARG. */
1822
1823 static fmtresult
1824 format_floating (const directive &dir, tree arg, const vr_values *)
1825 {
1826 HOST_WIDE_INT prec[] = { dir.prec[0], dir.prec[1] };
1827 tree type = (dir.modifier == FMT_LEN_L || dir.modifier == FMT_LEN_ll
1828 ? long_double_type_node : double_type_node);
1829
1830 /* For an indeterminate precision the lower bound must be assumed
1831 to be zero. */
1832 if (TOUPPER (dir.specifier) == 'A')
1833 {
1834 /* Get the number of fractional decimal digits needed to represent
1835 the argument without a loss of accuracy. */
1836 unsigned fmtprec
1837 = REAL_MODE_FORMAT (TYPE_MODE (type))->p;
1838
1839 /* The precision of the IEEE 754 double format is 53.
1840 The precision of all other GCC binary double formats
1841 is 56 or less. */
1842 unsigned maxprec = fmtprec <= 56 ? 13 : 15;
1843
1844 /* For %a, leave the minimum precision unspecified to let
1845 MFPR trim trailing zeros (as it and many other systems
1846 including Glibc happen to do) and set the maximum
1847 precision to reflect what it would be with trailing zeros
1848 present (as Solaris and derived systems do). */
1849 if (dir.prec[1] < 0)
1850 {
1851 /* Both bounds are negative implies that precision has
1852 not been specified. */
1853 prec[0] = maxprec;
1854 prec[1] = -1;
1855 }
1856 else if (dir.prec[0] < 0)
1857 {
1858 /* With a negative lower bound and a non-negative upper
1859 bound set the minimum precision to zero and the maximum
1860 to the greater of the maximum precision (i.e., with
1861 trailing zeros present) and the specified upper bound. */
1862 prec[0] = 0;
1863 prec[1] = dir.prec[1] < maxprec ? maxprec : dir.prec[1];
1864 }
1865 }
1866 else if (dir.prec[0] < 0)
1867 {
1868 if (dir.prec[1] < 0)
1869 {
1870 /* A precision in a strictly negative range is ignored and
1871 the default of 6 is used instead. */
1872 prec[0] = prec[1] = 6;
1873 }
1874 else
1875 {
1876 /* For a precision in a partly negative range, the lower bound
1877 must be assumed to be zero and the new upper bound is the
1878 greater of 6 (the default precision used when the specified
1879 precision is negative) and the upper bound of the specified
1880 range. */
1881 prec[0] = 0;
1882 prec[1] = dir.prec[1] < 6 ? 6 : dir.prec[1];
1883 }
1884 }
1885
1886 if (!arg
1887 || TREE_CODE (arg) != REAL_CST
1888 || !useless_type_conversion_p (type, TREE_TYPE (arg)))
1889 return format_floating (dir, prec);
1890
1891 /* The minimum and maximum number of bytes produced by the directive. */
1892 fmtresult res;
1893
1894 /* Get the real type format desription for the target. */
1895 const REAL_VALUE_TYPE *rvp = TREE_REAL_CST_PTR (arg);
1896 const real_format *rfmt = REAL_MODE_FORMAT (TYPE_MODE (TREE_TYPE (arg)));
1897
1898 if (!real_isfinite (rvp))
1899 {
1900 /* The format for Infinity and NaN is "[-]inf"/"[-]infinity"
1901 and "[-]nan" with the choice being implementation-defined
1902 but not locale dependent. */
1903 bool sign = dir.get_flag ('+') || real_isneg (rvp);
1904 res.range.min = 3 + sign;
1905
1906 res.range.likely = res.range.min;
1907 res.range.max = res.range.min;
1908 /* The unlikely maximum is "[-/+]infinity" or "[-/+][qs]nan".
1909 For NaN, the C/POSIX standards specify two formats:
1910 "[-/+]nan"
1911 and
1912 "[-/+]nan(n-char-sequence)"
1913 No known printf implementation outputs the latter format but AIX
1914 outputs QNaN and SNaN for quiet and signalling NaN, respectively,
1915 so the unlikely maximum reflects that. */
1916 res.range.unlikely = sign + (real_isinf (rvp) ? 8 : 4);
1917
1918 /* The range for infinity and NaN is known unless either width
1919 or precision is unknown. Width has the same effect regardless
1920 of whether the argument is finite. Precision is either ignored
1921 (e.g., Glibc) or can have an effect on the short vs long format
1922 such as inf/infinity (e.g., Solaris). */
1923 res.knownrange = dir.known_width_and_precision ();
1924
1925 /* Adjust the range for width but ignore precision. */
1926 res.adjust_for_width_or_precision (dir.width);
1927
1928 return res;
1929 }
1930
1931 char fmtstr [40];
1932 char *pfmt = fmtstr;
1933
1934 /* Append flags. */
1935 for (const char *pf = "-+ #0"; *pf; ++pf)
1936 if (dir.get_flag (*pf))
1937 *pfmt++ = *pf;
1938
1939 *pfmt = '\0';
1940
1941 {
1942 /* Set up an array to easily iterate over. */
1943 unsigned HOST_WIDE_INT* const minmax[] = {
1944 &res.range.min, &res.range.max
1945 };
1946
1947 for (int i = 0; i != sizeof minmax / sizeof *minmax; ++i)
1948 {
1949 /* Convert the GCC real value representation with the precision
1950 of the real type to the mpfr_t format rounding down in the
1951 first iteration that computes the minimm and up in the second
1952 that computes the maximum. This order is arbibtrary because
1953 rounding in either direction can result in longer output. */
1954 mpfr_t mpfrval;
1955 mpfr_init2 (mpfrval, rfmt->p);
1956 mpfr_from_real (mpfrval, rvp, i ? MPFR_RNDU : MPFR_RNDD);
1957
1958 /* Use the MPFR rounding specifier to round down in the first
1959 iteration and then up. In most but not all cases this will
1960 result in the same number of bytes. */
1961 char rndspec = "DU"[i];
1962
1963 /* Format it and store the result in the corresponding member
1964 of the result struct. */
1965 *minmax[i] = get_mpfr_format_length (mpfrval, fmtstr, prec[i],
1966 dir.specifier, rndspec);
1967 mpfr_clear (mpfrval);
1968 }
1969 }
1970
1971 /* Make sure the minimum is less than the maximum (MPFR rounding
1972 in the call to mpfr_snprintf can result in the reverse. */
1973 if (res.range.max < res.range.min)
1974 {
1975 unsigned HOST_WIDE_INT tmp = res.range.min;
1976 res.range.min = res.range.max;
1977 res.range.max = tmp;
1978 }
1979
1980 /* The range is known unless either width or precision is unknown. */
1981 res.knownrange = dir.known_width_and_precision ();
1982
1983 /* For the same floating point constant, unless width or precision
1984 is unknown, use the longer output as the likely maximum since
1985 with round to nearest either is equally likely. Otheriwse, when
1986 precision is unknown, use the greater of the minimum and 3 as
1987 the likely output (for "0.0" since zero precision is unlikely). */
1988 if (res.knownrange)
1989 res.range.likely = res.range.max;
1990 else if (res.range.min < 3
1991 && dir.prec[0] < 0
1992 && (unsigned HOST_WIDE_INT)dir.prec[1] == target_int_max ())
1993 res.range.likely = 3;
1994 else
1995 res.range.likely = res.range.min;
1996
1997 res.range.unlikely = res.range.max;
1998
1999 if (res.range.max > 2 && (prec[0] != 0 || prec[1] != 0))
2000 {
2001 /* Unless the precision is zero output longer than 2 bytes may
2002 include the decimal point which must be a single character
2003 up to MB_LEN_MAX in length. This is overly conservative
2004 since in some conversions some constants result in no decimal
2005 point (e.g., in %g). */
2006 res.range.unlikely += target_mb_len_max () - 1;
2007 }
2008
2009 res.adjust_for_width_or_precision (dir.width);
2010 return res;
2011 }
2012
2013 /* Return a FMTRESULT struct set to the lengths of the shortest and longest
2014 strings referenced by the expression STR, or (-1, -1) when not known.
2015 Used by the format_string function below. */
2016
2017 static fmtresult
2018 get_string_length (tree str, unsigned eltsize, const vr_values *vr)
2019 {
2020 if (!str)
2021 return fmtresult ();
2022
2023 /* Try to determine the dynamic string length first.
2024 Set MAXBOUND to an arbitrary non-null non-integer node as a request
2025 to have it set to the length of the longest string in a PHI. */
2026 c_strlen_data lendata = { };
2027 lendata.maxbound = str;
2028 if (eltsize == 1)
2029 get_range_strlen_dynamic (str, &lendata, vr);
2030 else
2031 {
2032 /* Determine the length of the shortest and longest string referenced
2033 by STR. Strings of unknown lengths are bounded by the sizes of
2034 arrays that subexpressions of STR may refer to. Pointers that
2035 aren't known to point any such arrays result in LENDATA.MAXLEN
2036 set to SIZE_MAX. */
2037 get_range_strlen (str, &lendata, eltsize);
2038 }
2039
2040 /* If LENDATA.MAXBOUND is not equal to .MINLEN it corresponds to the bound
2041 of the largest array STR refers to, if known, or it's set to SIZE_MAX
2042 otherwise. */
2043
2044 /* Return the default result when nothing is known about the string. */
2045 if ((lendata.maxbound && !tree_fits_uhwi_p (lendata.maxbound))
2046 || !tree_fits_uhwi_p (lendata.maxlen))
2047 {
2048 fmtresult res;
2049 res.nonstr = lendata.decl;
2050 return res;
2051 }
2052
2053 unsigned HOST_WIDE_INT lenmax = tree_to_uhwi (max_object_size ()) - 2;
2054 if (integer_zerop (lendata.minlen)
2055 && (!lendata.maxbound || lenmax <= tree_to_uhwi (lendata.maxbound))
2056 && lenmax <= tree_to_uhwi (lendata.maxlen))
2057 {
2058 fmtresult res;
2059 res.nonstr = lendata.decl;
2060 return res;
2061 }
2062
2063 HOST_WIDE_INT min
2064 = (tree_fits_uhwi_p (lendata.minlen)
2065 ? tree_to_uhwi (lendata.minlen)
2066 : 0);
2067
2068 HOST_WIDE_INT max
2069 = (lendata.maxbound && tree_fits_uhwi_p (lendata.maxbound)
2070 ? tree_to_uhwi (lendata.maxbound)
2071 : HOST_WIDE_INT_M1U);
2072
2073 const bool unbounded = integer_all_onesp (lendata.maxlen);
2074
2075 /* Set the max/likely counters to unbounded when a minimum is known
2076 but the maximum length isn't bounded. This implies that STR is
2077 a conditional expression involving a string of known length and
2078 and an expression of unknown/unbounded length. */
2079 if (min
2080 && (unsigned HOST_WIDE_INT)min < HOST_WIDE_INT_M1U
2081 && unbounded)
2082 max = HOST_WIDE_INT_M1U;
2083
2084 /* get_range_strlen() returns the target value of SIZE_MAX for
2085 strings of unknown length. Bump it up to HOST_WIDE_INT_M1U
2086 which may be bigger. */
2087 if ((unsigned HOST_WIDE_INT)min == target_size_max ())
2088 min = HOST_WIDE_INT_M1U;
2089 if ((unsigned HOST_WIDE_INT)max == target_size_max ())
2090 max = HOST_WIDE_INT_M1U;
2091
2092 fmtresult res (min, max);
2093 res.nonstr = lendata.decl;
2094
2095 /* Set RES.KNOWNRANGE to true if and only if all strings referenced
2096 by STR are known to be bounded (though not necessarily by their
2097 actual length but perhaps by their maximum possible length). */
2098 if (res.range.max < target_int_max ())
2099 {
2100 res.knownrange = true;
2101 /* When the length of the longest string is known and not
2102 excessive use it as the likely length of the string(s). */
2103 res.range.likely = res.range.max;
2104 }
2105 else
2106 {
2107 /* When the upper bound is unknown (it can be zero or excessive)
2108 set the likely length to the greater of 1. If MAXBOUND is
2109 known, also reset the length of the lower bound to zero. */
2110 res.range.likely = res.range.min ? res.range.min : warn_level > 1;
2111 if (lendata.maxbound && !integer_all_onesp (lendata.maxbound))
2112 res.range.min = 0;
2113 }
2114
2115 res.range.unlikely = unbounded ? HOST_WIDE_INT_MAX : res.range.max;
2116
2117 return res;
2118 }
2119
2120 /* Return the minimum and maximum number of characters formatted
2121 by the '%c' format directives and its wide character form for
2122 the argument ARG. ARG can be null (for functions such as
2123 vsprinf). */
2124
2125 static fmtresult
2126 format_character (const directive &dir, tree arg, const vr_values *vr_values)
2127 {
2128 fmtresult res;
2129
2130 res.knownrange = true;
2131
2132 if (dir.specifier == 'C'
2133 || dir.modifier == FMT_LEN_l)
2134 {
2135 /* A wide character can result in as few as zero bytes. */
2136 res.range.min = 0;
2137
2138 HOST_WIDE_INT min, max;
2139 if (get_int_range (arg, &min, &max, false, 0, vr_values))
2140 {
2141 if (min == 0 && max == 0)
2142 {
2143 /* The NUL wide character results in no bytes. */
2144 res.range.max = 0;
2145 res.range.likely = 0;
2146 res.range.unlikely = 0;
2147 }
2148 else if (min >= 0 && min < 128)
2149 {
2150 /* Be conservative if the target execution character set
2151 is not a 1-to-1 mapping to the source character set or
2152 if the source set is not ASCII. */
2153 bool one_2_one_ascii
2154 = (target_to_host_charmap[0] == 1 && target_to_host ('a') == 97);
2155
2156 /* A wide character in the ASCII range most likely results
2157 in a single byte, and only unlikely in up to MB_LEN_MAX. */
2158 res.range.max = one_2_one_ascii ? 1 : target_mb_len_max ();;
2159 res.range.likely = 1;
2160 res.range.unlikely = target_mb_len_max ();
2161 res.mayfail = !one_2_one_ascii;
2162 }
2163 else
2164 {
2165 /* A wide character outside the ASCII range likely results
2166 in up to two bytes, and only unlikely in up to MB_LEN_MAX. */
2167 res.range.max = target_mb_len_max ();
2168 res.range.likely = 2;
2169 res.range.unlikely = res.range.max;
2170 /* Converting such a character may fail. */
2171 res.mayfail = true;
2172 }
2173 }
2174 else
2175 {
2176 /* An unknown wide character is treated the same as a wide
2177 character outside the ASCII range. */
2178 res.range.max = target_mb_len_max ();
2179 res.range.likely = 2;
2180 res.range.unlikely = res.range.max;
2181 res.mayfail = true;
2182 }
2183 }
2184 else
2185 {
2186 /* A plain '%c' directive. Its ouput is exactly 1. */
2187 res.range.min = res.range.max = 1;
2188 res.range.likely = res.range.unlikely = 1;
2189 res.knownrange = true;
2190 }
2191
2192 /* Bump up the byte counters if WIDTH is greater. */
2193 return res.adjust_for_width_or_precision (dir.width);
2194 }
2195
2196 /* Determine the offset *INDEX of the first byte of an array element of
2197 TYPE (possibly recursively) into which the byte offset OFF points.
2198 On success set *INDEX to the offset of the first byte and return type.
2199 Otherwise, if no such element can be found, return null. */
2200
2201 static tree
2202 array_elt_at_offset (tree type, HOST_WIDE_INT off, HOST_WIDE_INT *index)
2203 {
2204 gcc_assert (TREE_CODE (type) == ARRAY_TYPE);
2205
2206 tree eltype = type;
2207 while (TREE_CODE (TREE_TYPE (eltype)) == ARRAY_TYPE)
2208 eltype = TREE_TYPE (eltype);
2209
2210 if (TYPE_MODE (TREE_TYPE (eltype)) != TYPE_MODE (char_type_node))
2211 eltype = TREE_TYPE (eltype);
2212
2213 if (eltype == type)
2214 {
2215 *index = 0;
2216 return type;
2217 }
2218
2219 HOST_WIDE_INT typsz = int_size_in_bytes (type);
2220 HOST_WIDE_INT eltsz = int_size_in_bytes (eltype);
2221 if (off < typsz * eltsz)
2222 {
2223 *index = (off / eltsz) * eltsz;
2224 return TREE_CODE (eltype) == ARRAY_TYPE ? TREE_TYPE (eltype) : eltype;
2225 }
2226
2227 return NULL_TREE;
2228 }
2229
2230 /* Determine the offset *INDEX of the first byte of a struct member of TYPE
2231 (possibly recursively) into which the byte offset OFF points. On success
2232 set *INDEX to the offset of the first byte and return true. Otherwise,
2233 if no such member can be found, return false. */
2234
2235 static bool
2236 field_at_offset (tree type, HOST_WIDE_INT off, HOST_WIDE_INT *index)
2237 {
2238 gcc_assert (RECORD_OR_UNION_TYPE_P (type));
2239
2240 for (tree fld = TYPE_FIELDS (type); fld; fld = TREE_CHAIN (fld))
2241 {
2242 if (TREE_CODE (fld) != FIELD_DECL || DECL_ARTIFICIAL (fld))
2243 continue;
2244
2245 tree fldtype = TREE_TYPE (fld);
2246 HOST_WIDE_INT fldoff = int_byte_position (fld);
2247
2248 /* If the size is not available the field is a flexible array
2249 member. Treat this case as success. */
2250 tree typesize = TYPE_SIZE_UNIT (fldtype);
2251 HOST_WIDE_INT fldsize = (tree_fits_uhwi_p (typesize)
2252 ? tree_to_uhwi (typesize)
2253 : off);
2254
2255 if (fldoff + fldsize < off)
2256 continue;
2257
2258 if (TREE_CODE (fldtype) == ARRAY_TYPE)
2259 {
2260 HOST_WIDE_INT idx = 0;
2261 if (tree ft = array_elt_at_offset (fldtype, off, &idx))
2262 fldtype = ft;
2263 else
2264 break;
2265
2266 *index += idx;
2267 fldoff -= idx;
2268 off -= idx;
2269 }
2270
2271 if (RECORD_OR_UNION_TYPE_P (fldtype))
2272 {
2273 *index += fldoff;
2274 return field_at_offset (fldtype, off - fldoff, index);
2275 }
2276
2277 *index += fldoff;
2278 return true;
2279 }
2280
2281 return false;
2282 }
2283
2284 /* For an expression X of pointer type, recursively try to find the same
2285 origin (object or pointer) as Y it references and return such an X.
2286 When X refers to a struct member, set *FLDOFF to the offset of the
2287 member from the beginning of the "most derived" object. */
2288
2289 static tree
2290 get_origin_and_offset (tree x, HOST_WIDE_INT *fldoff, HOST_WIDE_INT *off)
2291 {
2292 if (!x)
2293 return NULL_TREE;
2294
2295 switch (TREE_CODE (x))
2296 {
2297 case ADDR_EXPR:
2298 x = TREE_OPERAND (x, 0);
2299 return get_origin_and_offset (x, fldoff, off);
2300
2301 case ARRAY_REF:
2302 {
2303 tree offset = TREE_OPERAND (x, 1);
2304 HOST_WIDE_INT idx = (tree_fits_uhwi_p (offset)
2305 ? tree_to_uhwi (offset) : HOST_WIDE_INT_MAX);
2306
2307 tree eltype = TREE_TYPE (x);
2308 if (TREE_CODE (eltype) == INTEGER_TYPE)
2309 {
2310 if (off)
2311 *off = idx;
2312 }
2313 else if (idx < HOST_WIDE_INT_MAX)
2314 *fldoff += idx * int_size_in_bytes (eltype);
2315 else
2316 *fldoff = idx;
2317
2318 x = TREE_OPERAND (x, 0);
2319 return get_origin_and_offset (x, fldoff, NULL);
2320 }
2321
2322 case MEM_REF:
2323 if (off)
2324 {
2325 tree offset = TREE_OPERAND (x, 1);
2326 *off = (tree_fits_uhwi_p (offset)
2327 ? tree_to_uhwi (offset) : HOST_WIDE_INT_MAX);
2328 }
2329
2330 x = TREE_OPERAND (x, 0);
2331
2332 if (off)
2333 {
2334 tree xtype
2335 = (TREE_CODE (x) == ADDR_EXPR
2336 ? TREE_TYPE (TREE_OPERAND (x, 0)) : TREE_TYPE (TREE_TYPE (x)));
2337
2338 /* The byte offset of the most basic struct member the byte
2339 offset *OFF corresponds to, or for a (multidimensional)
2340 array member, the byte offset of the array element. */
2341 HOST_WIDE_INT index = 0;
2342
2343 if ((RECORD_OR_UNION_TYPE_P (xtype)
2344 && field_at_offset (xtype, *off, &index))
2345 || (TREE_CODE (xtype) == ARRAY_TYPE
2346 && TREE_CODE (TREE_TYPE (xtype)) == ARRAY_TYPE
2347 && array_elt_at_offset (xtype, *off, &index)))
2348 {
2349 *fldoff += index;
2350 *off -= index;
2351 }
2352 }
2353
2354 return get_origin_and_offset (x, fldoff, NULL);
2355
2356 case COMPONENT_REF:
2357 {
2358 tree fld = TREE_OPERAND (x, 1);
2359 *fldoff += int_byte_position (fld);
2360
2361 get_origin_and_offset (fld, fldoff, off);
2362 x = TREE_OPERAND (x, 0);
2363 return get_origin_and_offset (x, fldoff, off);
2364 }
2365
2366 case SSA_NAME:
2367 {
2368 gimple *def = SSA_NAME_DEF_STMT (x);
2369 if (is_gimple_assign (def))
2370 {
2371 tree_code code = gimple_assign_rhs_code (def);
2372 if (code == ADDR_EXPR)
2373 {
2374 x = gimple_assign_rhs1 (def);
2375 return get_origin_and_offset (x, fldoff, off);
2376 }
2377
2378 if (code == POINTER_PLUS_EXPR)
2379 {
2380 tree offset = gimple_assign_rhs2 (def);
2381 if (off)
2382 *off = (tree_fits_uhwi_p (offset)
2383 ? tree_to_uhwi (offset) : HOST_WIDE_INT_MAX);
2384
2385 x = gimple_assign_rhs1 (def);
2386 return get_origin_and_offset (x, fldoff, NULL);
2387 }
2388 else if (code == VAR_DECL)
2389 {
2390 x = gimple_assign_rhs1 (def);
2391 return get_origin_and_offset (x, fldoff, off);
2392 }
2393 }
2394 else if (gimple_nop_p (def) && SSA_NAME_VAR (x))
2395 x = SSA_NAME_VAR (x);
2396 }
2397
2398 default:
2399 break;
2400 }
2401
2402 return x;
2403 }
2404
2405 /* If ARG refers to the same (sub)object or array element as described
2406 by DST and DST_FLD, return the byte offset into the struct member or
2407 array element referenced by ARG. Otherwise return HOST_WIDE_INT_MIN
2408 to indicate that ARG and DST do not refer to the same object. */
2409
2410 static HOST_WIDE_INT
2411 alias_offset (tree arg, tree dst, HOST_WIDE_INT dst_fld)
2412 {
2413 /* See if the argument refers to the same base object as the destination
2414 of the formatted function call, and if so, try to determine if they
2415 can alias. */
2416 if (!arg || !dst || !ptr_derefs_may_alias_p (arg, dst))
2417 return HOST_WIDE_INT_MIN;
2418
2419 /* The two arguments may refer to the same object. If they both refer
2420 to a struct member, see if the members are one and the same. */
2421 HOST_WIDE_INT arg_off = 0, arg_fld = 0;
2422
2423 tree arg_orig = get_origin_and_offset (arg, &arg_fld, &arg_off);
2424
2425 if (arg_orig == dst && arg_fld == dst_fld)
2426 return arg_off;
2427
2428 return HOST_WIDE_INT_MIN;
2429 }
2430
2431 /* Return the minimum and maximum number of characters formatted
2432 by the '%s' format directive and its wide character form for
2433 the argument ARG. ARG can be null (for functions such as
2434 vsprinf). */
2435
2436 static fmtresult
2437 format_string (const directive &dir, tree arg, const vr_values *vr_values)
2438 {
2439 fmtresult res;
2440
2441 if (warn_restrict)
2442 {
2443 /* See if ARG might alias the destination of the call with
2444 DST_ORIGIN and DST_FIELD. If so, store the starting offset
2445 so that the overlap can be determined for certain later,
2446 when the amount of output of the call (including subsequent
2447 directives) has been computed. Otherwise, store HWI_MIN. */
2448 res.dst_offset = alias_offset (arg, dir.info->dst_origin,
2449 dir.info->dst_field);
2450 }
2451
2452 /* Compute the range the argument's length can be in. */
2453 int count_by = 1;
2454 if (dir.specifier == 'S' || dir.modifier == FMT_LEN_l)
2455 {
2456 /* Get a node for a C type that will be the same size
2457 as a wchar_t on the target. */
2458 tree node = get_typenode_from_name (MODIFIED_WCHAR_TYPE);
2459
2460 /* Now that we have a suitable node, get the number of
2461 bytes it occupies. */
2462 count_by = int_size_in_bytes (node);
2463 gcc_checking_assert (count_by == 2 || count_by == 4);
2464 }
2465
2466 fmtresult slen = get_string_length (arg, count_by, vr_values);
2467 if (slen.range.min == slen.range.max
2468 && slen.range.min < HOST_WIDE_INT_MAX)
2469 {
2470 /* The argument is either a string constant or it refers
2471 to one of a number of strings of the same length. */
2472
2473 /* A '%s' directive with a string argument with constant length. */
2474 res.range = slen.range;
2475
2476 if (dir.specifier == 'S'
2477 || dir.modifier == FMT_LEN_l)
2478 {
2479 /* In the worst case the length of output of a wide string S
2480 is bounded by MB_LEN_MAX * wcslen (S). */
2481 res.range.max *= target_mb_len_max ();
2482 res.range.unlikely = res.range.max;
2483 /* It's likely that the total length is not more that
2484 2 * wcslen (S).*/
2485 res.range.likely = res.range.min * 2;
2486
2487 if (dir.prec[1] >= 0
2488 && (unsigned HOST_WIDE_INT)dir.prec[1] < res.range.max)
2489 {
2490 res.range.max = dir.prec[1];
2491 res.range.likely = dir.prec[1];
2492 res.range.unlikely = dir.prec[1];
2493 }
2494
2495 if (dir.prec[0] < 0 && dir.prec[1] > -1)
2496 res.range.min = 0;
2497 else if (dir.prec[0] >= 0)
2498 res.range.likely = dir.prec[0];
2499
2500 /* Even a non-empty wide character string need not convert into
2501 any bytes. */
2502 res.range.min = 0;
2503
2504 /* A non-empty wide character conversion may fail. */
2505 if (slen.range.max > 0)
2506 res.mayfail = true;
2507 }
2508 else
2509 {
2510 res.knownrange = true;
2511
2512 if (dir.prec[0] < 0 && dir.prec[1] > -1)
2513 res.range.min = 0;
2514 else if ((unsigned HOST_WIDE_INT)dir.prec[0] < res.range.min)
2515 res.range.min = dir.prec[0];
2516
2517 if ((unsigned HOST_WIDE_INT)dir.prec[1] < res.range.max)
2518 {
2519 res.range.max = dir.prec[1];
2520 res.range.likely = dir.prec[1];
2521 res.range.unlikely = dir.prec[1];
2522 }
2523 }
2524 }
2525 else if (arg && integer_zerop (arg))
2526 {
2527 /* Handle null pointer argument. */
2528
2529 fmtresult res (0);
2530 res.nullp = true;
2531 return res;
2532 }
2533 else
2534 {
2535 /* For a '%s' and '%ls' directive with a non-constant string (either
2536 one of a number of strings of known length or an unknown string)
2537 the minimum number of characters is lesser of PRECISION[0] and
2538 the length of the shortest known string or zero, and the maximum
2539 is the lessser of the length of the longest known string or
2540 PTRDIFF_MAX and PRECISION[1]. The likely length is either
2541 the minimum at level 1 and the greater of the minimum and 1
2542 at level 2. This result is adjust upward for width (if it's
2543 specified). */
2544
2545 if (dir.specifier == 'S'
2546 || dir.modifier == FMT_LEN_l)
2547 {
2548 /* A wide character converts to as few as zero bytes. */
2549 slen.range.min = 0;
2550 if (slen.range.max < target_int_max ())
2551 slen.range.max *= target_mb_len_max ();
2552
2553 if (slen.range.likely < target_int_max ())
2554 slen.range.likely *= 2;
2555
2556 if (slen.range.likely < target_int_max ())
2557 slen.range.unlikely *= target_mb_len_max ();
2558
2559 /* A non-empty wide character conversion may fail. */
2560 if (slen.range.max > 0)
2561 res.mayfail = true;
2562 }
2563
2564 res.range = slen.range;
2565
2566 if (dir.prec[0] >= 0)
2567 {
2568 /* Adjust the minimum to zero if the string length is unknown,
2569 or at most the lower bound of the precision otherwise. */
2570 if (slen.range.min >= target_int_max ())
2571 res.range.min = 0;
2572 else if ((unsigned HOST_WIDE_INT)dir.prec[0] < slen.range.min)
2573 res.range.min = dir.prec[0];
2574
2575 /* Make both maxima no greater than the upper bound of precision. */
2576 if ((unsigned HOST_WIDE_INT)dir.prec[1] < slen.range.max
2577 || slen.range.max >= target_int_max ())
2578 {
2579 res.range.max = dir.prec[1];
2580 res.range.unlikely = dir.prec[1];
2581 }
2582
2583 /* If precision is constant, set the likely counter to the lesser
2584 of it and the maximum string length. Otherwise, if the lower
2585 bound of precision is greater than zero, set the likely counter
2586 to the minimum. Otherwise set it to zero or one based on
2587 the warning level. */
2588 if (dir.prec[0] == dir.prec[1])
2589 res.range.likely
2590 = ((unsigned HOST_WIDE_INT)dir.prec[0] < slen.range.max
2591 ? dir.prec[0] : slen.range.max);
2592 else if (dir.prec[0] > 0)
2593 res.range.likely = res.range.min;
2594 else
2595 res.range.likely = warn_level > 1;
2596 }
2597 else if (dir.prec[1] >= 0)
2598 {
2599 res.range.min = 0;
2600 if ((unsigned HOST_WIDE_INT)dir.prec[1] < slen.range.max)
2601 res.range.max = dir.prec[1];
2602 res.range.likely = dir.prec[1] ? warn_level > 1 : 0;
2603 if ((unsigned HOST_WIDE_INT)dir.prec[1] < slen.range.unlikely)
2604 res.range.unlikely = dir.prec[1];
2605 }
2606 else if (slen.range.min >= target_int_max ())
2607 {
2608 res.range.min = 0;
2609 res.range.max = HOST_WIDE_INT_MAX;
2610 /* At level 1 strings of unknown length are assumed to be
2611 empty, while at level 1 they are assumed to be one byte
2612 long. */
2613 res.range.likely = warn_level > 1;
2614 res.range.unlikely = HOST_WIDE_INT_MAX;
2615 }
2616 else
2617 {
2618 /* A string of unknown length unconstrained by precision is
2619 assumed to be empty at level 1 and just one character long
2620 at higher levels. */
2621 if (res.range.likely >= target_int_max ())
2622 res.range.likely = warn_level > 1;
2623 }
2624 }
2625
2626 /* If the argument isn't a nul-terminated string and the number
2627 of bytes on output isn't bounded by precision, set NONSTR. */
2628 if (slen.nonstr && slen.range.min < (unsigned HOST_WIDE_INT)dir.prec[0])
2629 res.nonstr = slen.nonstr;
2630
2631 /* Bump up the byte counters if WIDTH is greater. */
2632 return res.adjust_for_width_or_precision (dir.width);
2633 }
2634
2635 /* Format plain string (part of the format string itself). */
2636
2637 static fmtresult
2638 format_plain (const directive &dir, tree, const vr_values *)
2639 {
2640 fmtresult res (dir.len);
2641 return res;
2642 }
2643
2644 /* Return true if the RESULT of a directive in a call describe by INFO
2645 should be diagnosed given the AVAILable space in the destination. */
2646
2647 static bool
2648 should_warn_p (const call_info &info,
2649 const result_range &avail, const result_range &result)
2650 {
2651 if (result.max <= avail.min)
2652 {
2653 /* The least amount of space remaining in the destination is big
2654 enough for the longest output. */
2655 return false;
2656 }
2657
2658 if (info.bounded)
2659 {
2660 if (warn_format_trunc == 1 && result.min <= avail.max
2661 && info.retval_used ())
2662 {
2663 /* The likely amount of space remaining in the destination is big
2664 enough for the least output and the return value is used. */
2665 return false;
2666 }
2667
2668 if (warn_format_trunc == 1 && result.likely <= avail.likely
2669 && !info.retval_used ())
2670 {
2671 /* The likely amount of space remaining in the destination is big
2672 enough for the likely output and the return value is unused. */
2673 return false;
2674 }
2675
2676 if (warn_format_trunc == 2
2677 && result.likely <= avail.min
2678 && (result.max <= avail.min
2679 || result.max > HOST_WIDE_INT_MAX))
2680 {
2681 /* The minimum amount of space remaining in the destination is big
2682 enough for the longest output. */
2683 return false;
2684 }
2685 }
2686 else
2687 {
2688 if (warn_level == 1 && result.likely <= avail.likely)
2689 {
2690 /* The likely amount of space remaining in the destination is big
2691 enough for the likely output. */
2692 return false;
2693 }
2694
2695 if (warn_level == 2
2696 && result.likely <= avail.min
2697 && (result.max <= avail.min
2698 || result.max > HOST_WIDE_INT_MAX))
2699 {
2700 /* The minimum amount of space remaining in the destination is big
2701 enough for the longest output. */
2702 return false;
2703 }
2704 }
2705
2706 return true;
2707 }
2708
2709 /* At format string location describe by DIRLOC in a call described
2710 by INFO, issue a warning for a directive DIR whose output may be
2711 in excess of the available space AVAIL_RANGE in the destination
2712 given the formatting result FMTRES. This function does nothing
2713 except decide whether to issue a warning for a possible write
2714 past the end or truncation and, if so, format the warning.
2715 Return true if a warning has been issued. */
2716
2717 static bool
2718 maybe_warn (substring_loc &dirloc, location_t argloc,
2719 const call_info &info,
2720 const result_range &avail_range, const result_range &res,
2721 const directive &dir)
2722 {
2723 if (!should_warn_p (info, avail_range, res))
2724 return false;
2725
2726 /* A warning will definitely be issued below. */
2727
2728 /* The maximum byte count to reference in the warning. Larger counts
2729 imply that the upper bound is unknown (and could be anywhere between
2730 RES.MIN + 1 and SIZE_MAX / 2) are printed as "N or more bytes" rather
2731 than "between N and X" where X is some huge number. */
2732 unsigned HOST_WIDE_INT maxbytes = target_dir_max ();
2733
2734 /* True when there is enough room in the destination for the least
2735 amount of a directive's output but not enough for its likely or
2736 maximum output. */
2737 bool maybe = (res.min <= avail_range.max
2738 && (avail_range.min < res.likely
2739 || (res.max < HOST_WIDE_INT_MAX
2740 && avail_range.min < res.max)));
2741
2742 /* Buffer for the directive in the host character set (used when
2743 the source character set is different). */
2744 char hostdir[32];
2745
2746 if (avail_range.min == avail_range.max)
2747 {
2748 /* The size of the destination region is exact. */
2749 unsigned HOST_WIDE_INT navail = avail_range.max;
2750
2751 if (target_to_host (*dir.beg) != '%')
2752 {
2753 /* For plain character directives (i.e., the format string itself)
2754 but not others, point the caret at the first character that's
2755 past the end of the destination. */
2756 if (navail < dir.len)
2757 dirloc.set_caret_index (dirloc.get_caret_idx () + navail);
2758 }
2759
2760 if (*dir.beg == '\0')
2761 {
2762 /* This is the terminating nul. */
2763 gcc_assert (res.min == 1 && res.min == res.max);
2764
2765 return fmtwarn (dirloc, UNKNOWN_LOCATION, NULL, info.warnopt (),
2766 info.bounded
2767 ? (maybe
2768 ? G_("%qE output may be truncated before the "
2769 "last format character")
2770 : G_("%qE output truncated before the last "
2771 "format character"))
2772 : (maybe
2773 ? G_("%qE may write a terminating nul past the "
2774 "end of the destination")
2775 : G_("%qE writing a terminating nul past the "
2776 "end of the destination")),
2777 info.func);
2778 }
2779
2780 if (res.min == res.max)
2781 {
2782 const char *d = target_to_host (hostdir, sizeof hostdir, dir.beg);
2783 if (!info.bounded)
2784 return fmtwarn_n (dirloc, argloc, NULL, info.warnopt (), res.min,
2785 "%<%.*s%> directive writing %wu byte into a "
2786 "region of size %wu",
2787 "%<%.*s%> directive writing %wu bytes into a "
2788 "region of size %wu",
2789 (int) dir.len, d, res.min, navail);
2790 else if (maybe)
2791 return fmtwarn_n (dirloc, argloc, NULL, info.warnopt (), res.min,
2792 "%<%.*s%> directive output may be truncated "
2793 "writing %wu byte into a region of size %wu",
2794 "%<%.*s%> directive output may be truncated "
2795 "writing %wu bytes into a region of size %wu",
2796 (int) dir.len, d, res.min, navail);
2797 else
2798 return fmtwarn_n (dirloc, argloc, NULL, info.warnopt (), res.min,
2799 "%<%.*s%> directive output truncated writing "
2800 "%wu byte into a region of size %wu",
2801 "%<%.*s%> directive output truncated writing "
2802 "%wu bytes into a region of size %wu",
2803 (int) dir.len, d, res.min, navail);
2804 }
2805 if (res.min == 0 && res.max < maxbytes)
2806 return fmtwarn (dirloc, argloc, NULL,
2807 info.warnopt (),
2808 info.bounded
2809 ? (maybe
2810 ? G_("%<%.*s%> directive output may be truncated "
2811 "writing up to %wu bytes into a region of "
2812 "size %wu")
2813 : G_("%<%.*s%> directive output truncated writing "
2814 "up to %wu bytes into a region of size %wu"))
2815 : G_("%<%.*s%> directive writing up to %wu bytes "
2816 "into a region of size %wu"), (int) dir.len,
2817 target_to_host (hostdir, sizeof hostdir, dir.beg),
2818 res.max, navail);
2819
2820 if (res.min == 0 && maxbytes <= res.max)
2821 /* This is a special case to avoid issuing the potentially
2822 confusing warning:
2823 writing 0 or more bytes into a region of size 0. */
2824 return fmtwarn (dirloc, argloc, NULL, info.warnopt (),
2825 info.bounded
2826 ? (maybe
2827 ? G_("%<%.*s%> directive output may be truncated "
2828 "writing likely %wu or more bytes into a "
2829 "region of size %wu")
2830 : G_("%<%.*s%> directive output truncated writing "
2831 "likely %wu or more bytes into a region of "
2832 "size %wu"))
2833 : G_("%<%.*s%> directive writing likely %wu or more "
2834 "bytes into a region of size %wu"), (int) dir.len,
2835 target_to_host (hostdir, sizeof hostdir, dir.beg),
2836 res.likely, navail);
2837
2838 if (res.max < maxbytes)
2839 return fmtwarn (dirloc, argloc, NULL, info.warnopt (),
2840 info.bounded
2841 ? (maybe
2842 ? G_("%<%.*s%> directive output may be truncated "
2843 "writing between %wu and %wu bytes into a "
2844 "region of size %wu")
2845 : G_("%<%.*s%> directive output truncated "
2846 "writing between %wu and %wu bytes into a "
2847 "region of size %wu"))
2848 : G_("%<%.*s%> directive writing between %wu and "
2849 "%wu bytes into a region of size %wu"),
2850 (int) dir.len,
2851 target_to_host (hostdir, sizeof hostdir, dir.beg),
2852 res.min, res.max, navail);
2853
2854 return fmtwarn (dirloc, argloc, NULL, info.warnopt (),
2855 info.bounded
2856 ? (maybe
2857 ? G_("%<%.*s%> directive output may be truncated "
2858 "writing %wu or more bytes into a region of "
2859 "size %wu")
2860 : G_("%<%.*s%> directive output truncated writing "
2861 "%wu or more bytes into a region of size %wu"))
2862 : G_("%<%.*s%> directive writing %wu or more bytes "
2863 "into a region of size %wu"), (int) dir.len,
2864 target_to_host (hostdir, sizeof hostdir, dir.beg),
2865 res.min, navail);
2866 }
2867
2868 /* The size of the destination region is a range. */
2869
2870 if (target_to_host (*dir.beg) != '%')
2871 {
2872 unsigned HOST_WIDE_INT navail = avail_range.max;
2873
2874 /* For plain character directives (i.e., the format string itself)
2875 but not others, point the caret at the first character that's
2876 past the end of the destination. */
2877 if (navail < dir.len)
2878 dirloc.set_caret_index (dirloc.get_caret_idx () + navail);
2879 }
2880
2881 if (*dir.beg == '\0')
2882 {
2883 gcc_assert (res.min == 1 && res.min == res.max);
2884
2885 return fmtwarn (dirloc, UNKNOWN_LOCATION, NULL, info.warnopt (),
2886 info.bounded
2887 ? (maybe
2888 ? G_("%qE output may be truncated before the last "
2889 "format character")
2890 : G_("%qE output truncated before the last format "
2891 "character"))
2892 : (maybe
2893 ? G_("%qE may write a terminating nul past the end "
2894 "of the destination")
2895 : G_("%qE writing a terminating nul past the end "
2896 "of the destination")), info.func);
2897 }
2898
2899 if (res.min == res.max)
2900 {
2901 const char *d = target_to_host (hostdir, sizeof hostdir, dir.beg);
2902 if (!info.bounded)
2903 return fmtwarn_n (dirloc, argloc, NULL, info.warnopt (), res.min,
2904 "%<%.*s%> directive writing %wu byte into a region "
2905 "of size between %wu and %wu",
2906 "%<%.*s%> directive writing %wu bytes into a region "
2907 "of size between %wu and %wu", (int) dir.len, d,
2908 res.min, avail_range.min, avail_range.max);
2909 else if (maybe)
2910 return fmtwarn_n (dirloc, argloc, NULL, info.warnopt (), res.min,
2911 "%<%.*s%> directive output may be truncated writing "
2912 "%wu byte into a region of size between %wu and %wu",
2913 "%<%.*s%> directive output may be truncated writing "
2914 "%wu bytes into a region of size between %wu and "
2915 "%wu", (int) dir.len, d, res.min, avail_range.min,
2916 avail_range.max);
2917 else
2918 return fmtwarn_n (dirloc, argloc, NULL, info.warnopt (), res.min,
2919 "%<%.*s%> directive output truncated writing %wu "
2920 "byte into a region of size between %wu and %wu",
2921 "%<%.*s%> directive output truncated writing %wu "
2922 "bytes into a region of size between %wu and %wu",
2923 (int) dir.len, d, res.min, avail_range.min,
2924 avail_range.max);
2925 }
2926
2927 if (res.min == 0 && res.max < maxbytes)
2928 return fmtwarn (dirloc, argloc, NULL, info.warnopt (),
2929 info.bounded
2930 ? (maybe
2931 ? G_("%<%.*s%> directive output may be truncated "
2932 "writing up to %wu bytes into a region of size "
2933 "between %wu and %wu")
2934 : G_("%<%.*s%> directive output truncated writing "
2935 "up to %wu bytes into a region of size between "
2936 "%wu and %wu"))
2937 : G_("%<%.*s%> directive writing up to %wu bytes "
2938 "into a region of size between %wu and %wu"),
2939 (int) dir.len,
2940 target_to_host (hostdir, sizeof hostdir, dir.beg),
2941 res.max, avail_range.min, avail_range.max);
2942
2943 if (res.min == 0 && maxbytes <= res.max)
2944 /* This is a special case to avoid issuing the potentially confusing
2945 warning:
2946 writing 0 or more bytes into a region of size between 0 and N. */
2947 return fmtwarn (dirloc, argloc, NULL, info.warnopt (),
2948 info.bounded
2949 ? (maybe
2950 ? G_("%<%.*s%> directive output may be truncated "
2951 "writing likely %wu or more bytes into a region "
2952 "of size between %wu and %wu")
2953 : G_("%<%.*s%> directive output truncated writing "
2954 "likely %wu or more bytes into a region of size "
2955 "between %wu and %wu"))
2956 : G_("%<%.*s%> directive writing likely %wu or more bytes "
2957 "into a region of size between %wu and %wu"),
2958 (int) dir.len,
2959 target_to_host (hostdir, sizeof hostdir, dir.beg),
2960 res.likely, avail_range.min, avail_range.max);
2961
2962 if (res.max < maxbytes)
2963 return fmtwarn (dirloc, argloc, NULL, info.warnopt (),
2964 info.bounded
2965 ? (maybe
2966 ? G_("%<%.*s%> directive output may be truncated "
2967 "writing between %wu and %wu bytes into a region "
2968 "of size between %wu and %wu")
2969 : G_("%<%.*s%> directive output truncated writing "
2970 "between %wu and %wu bytes into a region of size "
2971 "between %wu and %wu"))
2972 : G_("%<%.*s%> directive writing between %wu and "
2973 "%wu bytes into a region of size between %wu and "
2974 "%wu"), (int) dir.len,
2975 target_to_host (hostdir, sizeof hostdir, dir.beg),
2976 res.min, res.max, avail_range.min, avail_range.max);
2977
2978 return fmtwarn (dirloc, argloc, NULL, info.warnopt (),
2979 info.bounded
2980 ? (maybe
2981 ? G_("%<%.*s%> directive output may be truncated writing "
2982 "%wu or more bytes into a region of size between "
2983 "%wu and %wu")
2984 : G_("%<%.*s%> directive output truncated writing "
2985 "%wu or more bytes into a region of size between "
2986 "%wu and %wu"))
2987 : G_("%<%.*s%> directive writing %wu or more bytes "
2988 "into a region of size between %wu and %wu"),
2989 (int) dir.len,
2990 target_to_host (hostdir, sizeof hostdir, dir.beg),
2991 res.min, avail_range.min, avail_range.max);
2992 }
2993
2994 /* Given the formatting result described by RES and NAVAIL, the number
2995 of available in the destination, return the range of bytes remaining
2996 in the destination. */
2997
2998 static inline result_range
2999 bytes_remaining (unsigned HOST_WIDE_INT navail, const format_result &res)
3000 {
3001 result_range range;
3002
3003 if (HOST_WIDE_INT_MAX <= navail)
3004 {
3005 range.min = range.max = range.likely = range.unlikely = navail;
3006 return range;
3007 }
3008
3009 /* The lower bound of the available range is the available size
3010 minus the maximum output size, and the upper bound is the size
3011 minus the minimum. */
3012 range.max = res.range.min < navail ? navail - res.range.min : 0;
3013
3014 range.likely = res.range.likely < navail ? navail - res.range.likely : 0;
3015
3016 if (res.range.max < HOST_WIDE_INT_MAX)
3017 range.min = res.range.max < navail ? navail - res.range.max : 0;
3018 else
3019 range.min = range.likely;
3020
3021 range.unlikely = (res.range.unlikely < navail
3022 ? navail - res.range.unlikely : 0);
3023
3024 return range;
3025 }
3026
3027 /* Compute the length of the output resulting from the directive DIR
3028 in a call described by INFO and update the overall result of the call
3029 in *RES. Return true if the directive has been handled. */
3030
3031 static bool
3032 format_directive (const call_info &info,
3033 format_result *res, const directive &dir,
3034 const class vr_values *vr_values)
3035 {
3036 /* Offset of the beginning of the directive from the beginning
3037 of the format string. */
3038 size_t offset = dir.beg - info.fmtstr;
3039 size_t start = offset;
3040 size_t length = offset + dir.len - !!dir.len;
3041
3042 /* Create a location for the whole directive from the % to the format
3043 specifier. */
3044 substring_loc dirloc (info.fmtloc, TREE_TYPE (info.format),
3045 offset, start, length);
3046
3047 /* Also get the location of the argument if possible.
3048 This doesn't work for integer literals or function calls. */
3049 location_t argloc = UNKNOWN_LOCATION;
3050 if (dir.arg)
3051 argloc = EXPR_LOCATION (dir.arg);
3052
3053 /* Bail when there is no function to compute the output length,
3054 or when minimum length checking has been disabled. */
3055 if (!dir.fmtfunc || res->range.min >= HOST_WIDE_INT_MAX)
3056 return false;
3057
3058 /* Compute the range of lengths of the formatted output. */
3059 fmtresult fmtres = dir.fmtfunc (dir, dir.arg, vr_values);
3060
3061 /* Record whether the output of all directives is known to be
3062 bounded by some maximum, implying that their arguments are
3063 either known exactly or determined to be in a known range
3064 or, for strings, limited by the upper bounds of the arrays
3065 they refer to. */
3066 res->knownrange &= fmtres.knownrange;
3067
3068 if (!fmtres.knownrange)
3069 {
3070 /* Only when the range is known, check it against the host value
3071 of INT_MAX + (the number of bytes of the "%.*Lf" directive with
3072 INT_MAX precision, which is the longest possible output of any
3073 single directive). That's the largest valid byte count (though
3074 not valid call to a printf-like function because it can never
3075 return such a count). Otherwise, the range doesn't correspond
3076 to known values of the argument. */
3077 if (fmtres.range.max > target_dir_max ())
3078 {
3079 /* Normalize the MAX counter to avoid having to deal with it
3080 later. The counter can be less than HOST_WIDE_INT_M1U
3081 when compiling for an ILP32 target on an LP64 host. */
3082 fmtres.range.max = HOST_WIDE_INT_M1U;
3083 /* Disable exact and maximum length checking after a failure
3084 to determine the maximum number of characters (for example
3085 for wide characters or wide character strings) but continue
3086 tracking the minimum number of characters. */
3087 res->range.max = HOST_WIDE_INT_M1U;
3088 }
3089
3090 if (fmtres.range.min > target_dir_max ())
3091 {
3092 /* Disable exact length checking after a failure to determine
3093 even the minimum number of characters (it shouldn't happen
3094 except in an error) but keep tracking the minimum and maximum
3095 number of characters. */
3096 return true;
3097 }
3098 }
3099
3100 /* Buffer for the directive in the host character set (used when
3101 the source character set is different). */
3102 char hostdir[32];
3103
3104 int dirlen = dir.len;
3105
3106 if (fmtres.nullp)
3107 {
3108 fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3109 "%G%<%.*s%> directive argument is null",
3110 info.callstmt, dirlen,
3111 target_to_host (hostdir, sizeof hostdir, dir.beg));
3112
3113 /* Don't bother processing the rest of the format string. */
3114 res->warned = true;
3115 res->range.min = HOST_WIDE_INT_M1U;
3116 res->range.max = HOST_WIDE_INT_M1U;
3117 return false;
3118 }
3119
3120 /* Compute the number of available bytes in the destination. There
3121 must always be at least one byte of space for the terminating
3122 NUL that's appended after the format string has been processed. */
3123 result_range avail_range = bytes_remaining (info.objsize, *res);
3124
3125 /* If the argument aliases a part of the destination of the formatted
3126 call at offset FMTRES.DST_OFFSET append the directive and its result
3127 to the set of aliases for later processing. */
3128 if (fmtres.dst_offset != HOST_WIDE_INT_MIN)
3129 res->append_alias (dir, fmtres.dst_offset, fmtres.range);
3130
3131 bool warned = res->warned;
3132
3133 if (!warned)
3134 warned = maybe_warn (dirloc, argloc, info, avail_range,
3135 fmtres.range, dir);
3136
3137 /* Bump up the total maximum if it isn't too big. */
3138 if (res->range.max < HOST_WIDE_INT_MAX
3139 && fmtres.range.max < HOST_WIDE_INT_MAX)
3140 res->range.max += fmtres.range.max;
3141
3142 /* Raise the total unlikely maximum by the larger of the maximum
3143 and the unlikely maximum. */
3144 unsigned HOST_WIDE_INT save = res->range.unlikely;
3145 if (fmtres.range.max < fmtres.range.unlikely)
3146 res->range.unlikely += fmtres.range.unlikely;
3147 else
3148 res->range.unlikely += fmtres.range.max;
3149
3150 if (res->range.unlikely < save)
3151 res->range.unlikely = HOST_WIDE_INT_M1U;
3152
3153 res->range.min += fmtres.range.min;
3154 res->range.likely += fmtres.range.likely;
3155
3156 /* Has the minimum directive output length exceeded the maximum
3157 of 4095 bytes required to be supported? */
3158 bool minunder4k = fmtres.range.min < 4096;
3159 bool maxunder4k = fmtres.range.max < 4096;
3160 /* Clear POSUNDER4K in the overall result if the maximum has exceeded
3161 the 4k (this is necessary to avoid the return value optimization
3162 that may not be safe in the maximum case). */
3163 if (!maxunder4k)
3164 res->posunder4k = false;
3165 /* Also clear POSUNDER4K if the directive may fail. */
3166 if (fmtres.mayfail)
3167 res->posunder4k = false;
3168
3169 if (!warned
3170 /* Only warn at level 2. */
3171 && warn_level > 1
3172 /* Only warn for string functions. */
3173 && info.is_string_func ()
3174 && (!minunder4k
3175 || (!maxunder4k && fmtres.range.max < HOST_WIDE_INT_MAX)))
3176 {
3177 /* The directive output may be longer than the maximum required
3178 to be handled by an implementation according to 7.21.6.1, p15
3179 of C11. Warn on this only at level 2 but remember this and
3180 prevent folding the return value when done. This allows for
3181 the possibility of the actual libc call failing due to ENOMEM
3182 (like Glibc does with very large precision or width).
3183 Issue the "may exceed" warning only for string functions and
3184 not for fprintf or printf. */
3185
3186 if (fmtres.range.min == fmtres.range.max)
3187 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3188 "%<%.*s%> directive output of %wu bytes exceeds "
3189 "minimum required size of 4095", dirlen,
3190 target_to_host (hostdir, sizeof hostdir, dir.beg),
3191 fmtres.range.min);
3192 else if (!minunder4k)
3193 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3194 "%<%.*s%> directive output between %wu and %wu "
3195 "bytes exceeds minimum required size of 4095",
3196 dirlen,
3197 target_to_host (hostdir, sizeof hostdir, dir.beg),
3198 fmtres.range.min, fmtres.range.max);
3199 else if (!info.retval_used () && info.is_string_func ())
3200 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3201 "%<%.*s%> directive output between %wu and %wu "
3202 "bytes may exceed minimum required size of "
3203 "4095",
3204 dirlen,
3205 target_to_host (hostdir, sizeof hostdir, dir.beg),
3206 fmtres.range.min, fmtres.range.max);
3207 }
3208
3209 /* Has the likely and maximum directive output exceeded INT_MAX? */
3210 bool likelyximax = *dir.beg && res->range.likely > target_int_max ();
3211 /* Don't consider the maximum to be in excess when it's the result
3212 of a string of unknown length (i.e., whose maximum has been set
3213 to be greater than or equal to HOST_WIDE_INT_MAX. */
3214 bool maxximax = (*dir.beg
3215 && res->range.max > target_int_max ()
3216 && res->range.max < HOST_WIDE_INT_MAX);
3217
3218 if (!warned
3219 /* Warn for the likely output size at level 1. */
3220 && (likelyximax
3221 /* But only warn for the maximum at level 2. */
3222 || (warn_level > 1
3223 && maxximax
3224 && fmtres.range.max < HOST_WIDE_INT_MAX)))
3225 {
3226 if (fmtres.range.min > target_int_max ())
3227 {
3228 /* The directive output exceeds INT_MAX bytes. */
3229 if (fmtres.range.min == fmtres.range.max)
3230 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3231 "%<%.*s%> directive output of %wu bytes exceeds "
3232 "%<INT_MAX%>", dirlen,
3233 target_to_host (hostdir, sizeof hostdir, dir.beg),
3234 fmtres.range.min);
3235 else
3236 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3237 "%<%.*s%> directive output between %wu and "
3238 "%wu bytes exceeds %<INT_MAX%>", dirlen,
3239 target_to_host (hostdir, sizeof hostdir, dir.beg),
3240 fmtres.range.min, fmtres.range.max);
3241 }
3242 else if (res->range.min > target_int_max ())
3243 {
3244 /* The directive output is under INT_MAX but causes the result
3245 to exceed INT_MAX bytes. */
3246 if (fmtres.range.min == fmtres.range.max)
3247 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3248 "%<%.*s%> directive output of %wu bytes causes "
3249 "result to exceed %<INT_MAX%>", dirlen,
3250 target_to_host (hostdir, sizeof hostdir, dir.beg),
3251 fmtres.range.min);
3252 else
3253 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3254 "%<%.*s%> directive output between %wu and "
3255 "%wu bytes causes result to exceed %<INT_MAX%>",
3256 dirlen,
3257 target_to_host (hostdir, sizeof hostdir, dir.beg),
3258 fmtres.range.min, fmtres.range.max);
3259 }
3260 else if ((!info.retval_used () || !info.bounded)
3261 && (info.is_string_func ()))
3262 /* Warn for calls to string functions that either aren't bounded
3263 (sprintf) or whose return value isn't used. */
3264 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3265 "%<%.*s%> directive output between %wu and "
3266 "%wu bytes may cause result to exceed "
3267 "%<INT_MAX%>", dirlen,
3268 target_to_host (hostdir, sizeof hostdir, dir.beg),
3269 fmtres.range.min, fmtres.range.max);
3270 }
3271
3272 if (!warned && fmtres.nonstr)
3273 {
3274 warned = fmtwarn (dirloc, argloc, NULL, info.warnopt (),
3275 "%<%.*s%> directive argument is not a nul-terminated "
3276 "string",
3277 dirlen,
3278 target_to_host (hostdir, sizeof hostdir, dir.beg));
3279 if (warned && DECL_P (fmtres.nonstr))
3280 inform (DECL_SOURCE_LOCATION (fmtres.nonstr),
3281 "referenced argument declared here");
3282 return false;
3283 }
3284
3285 if (warned && fmtres.range.min < fmtres.range.likely
3286 && fmtres.range.likely < fmtres.range.max)
3287 inform_n (info.fmtloc, fmtres.range.likely,
3288 "assuming directive output of %wu byte",
3289 "assuming directive output of %wu bytes",
3290 fmtres.range.likely);
3291
3292 if (warned && fmtres.argmin)
3293 {
3294 if (fmtres.argmin == fmtres.argmax)
3295 inform (info.fmtloc, "directive argument %qE", fmtres.argmin);
3296 else if (fmtres.knownrange)
3297 inform (info.fmtloc, "directive argument in the range [%E, %E]",
3298 fmtres.argmin, fmtres.argmax);
3299 else
3300 inform (info.fmtloc,
3301 "using the range [%E, %E] for directive argument",
3302 fmtres.argmin, fmtres.argmax);
3303 }
3304
3305 res->warned |= warned;
3306
3307 if (!dir.beg[0] && res->warned)
3308 {
3309 location_t callloc = gimple_location (info.callstmt);
3310
3311 unsigned HOST_WIDE_INT min = res->range.min;
3312 unsigned HOST_WIDE_INT max = res->range.max;
3313
3314 if (info.objsize < HOST_WIDE_INT_MAX)
3315 {
3316 /* If a warning has been issued for buffer overflow or truncation
3317 help the user figure out how big a buffer they need. */
3318
3319 if (min == max)
3320 inform_n (callloc, min,
3321 "%qE output %wu byte into a destination of size %wu",
3322 "%qE output %wu bytes into a destination of size %wu",
3323 info.func, min, info.objsize);
3324 else if (max < HOST_WIDE_INT_MAX)
3325 inform (callloc,
3326 "%qE output between %wu and %wu bytes into "
3327 "a destination of size %wu",
3328 info.func, min, max, info.objsize);
3329 else if (min < res->range.likely && res->range.likely < max)
3330 inform (callloc,
3331 "%qE output %wu or more bytes (assuming %wu) into "
3332 "a destination of size %wu",
3333 info.func, min, res->range.likely, info.objsize);
3334 else
3335 inform (callloc,
3336 "%qE output %wu or more bytes into a destination of size "
3337 "%wu",
3338 info.func, min, info.objsize);
3339 }
3340 else if (!info.is_string_func ())
3341 {
3342 /* If the warning is for a file function like fprintf
3343 of printf with no destination size just print the computed
3344 result. */
3345 if (min == max)
3346 inform_n (callloc, min,
3347 "%qE output %wu byte", "%qE output %wu bytes",
3348 info.func, min);
3349 else if (max < HOST_WIDE_INT_MAX)
3350 inform (callloc,
3351 "%qE output between %wu and %wu bytes",
3352 info.func, min, max);
3353 else if (min < res->range.likely && res->range.likely < max)
3354 inform (callloc,
3355 "%qE output %wu or more bytes (assuming %wu)",
3356 info.func, min, res->range.likely);
3357 else
3358 inform (callloc,
3359 "%qE output %wu or more bytes",
3360 info.func, min);
3361 }
3362 }
3363
3364 if (dump_file && *dir.beg)
3365 {
3366 fprintf (dump_file,
3367 " Result: "
3368 HOST_WIDE_INT_PRINT_DEC ", " HOST_WIDE_INT_PRINT_DEC ", "
3369 HOST_WIDE_INT_PRINT_DEC ", " HOST_WIDE_INT_PRINT_DEC " ("
3370 HOST_WIDE_INT_PRINT_DEC ", " HOST_WIDE_INT_PRINT_DEC ", "
3371 HOST_WIDE_INT_PRINT_DEC ", " HOST_WIDE_INT_PRINT_DEC ")\n",
3372 fmtres.range.min, fmtres.range.likely,
3373 fmtres.range.max, fmtres.range.unlikely,
3374 res->range.min, res->range.likely,
3375 res->range.max, res->range.unlikely);
3376 }
3377
3378 return true;
3379 }
3380
3381 /* Parse a format directive in function call described by INFO starting
3382 at STR and populate DIR structure. Bump up *ARGNO by the number of
3383 arguments extracted for the directive. Return the length of
3384 the directive. */
3385
3386 static size_t
3387 parse_directive (call_info &info,
3388 directive &dir, format_result *res,
3389 const char *str, unsigned *argno,
3390 const vr_values *vr_values)
3391 {
3392 const char *pcnt = strchr (str, target_percent);
3393 dir.beg = str;
3394
3395 if (size_t len = pcnt ? pcnt - str : *str ? strlen (str) : 1)
3396 {
3397 /* This directive is either a plain string or the terminating nul
3398 (which isn't really a directive but it simplifies things to
3399 handle it as if it were). */
3400 dir.len = len;
3401 dir.fmtfunc = format_plain;
3402
3403 if (dump_file)
3404 {
3405 fprintf (dump_file, " Directive %u at offset "
3406 HOST_WIDE_INT_PRINT_UNSIGNED ": \"%.*s\", "
3407 "length = " HOST_WIDE_INT_PRINT_UNSIGNED "\n",
3408 dir.dirno,
3409 (unsigned HOST_WIDE_INT)(size_t)(dir.beg - info.fmtstr),
3410 (int)dir.len, dir.beg, (unsigned HOST_WIDE_INT) dir.len);
3411 }
3412
3413 return len - !*str;
3414 }
3415
3416 /* Set the directive argument's number to correspond to its position
3417 in the formatted function call's argument list. */
3418 dir.argno = *argno;
3419
3420 const char *pf = pcnt + 1;
3421
3422 /* POSIX numbered argument index or zero when none. */
3423 HOST_WIDE_INT dollar = 0;
3424
3425 /* With and precision. -1 when not specified, HOST_WIDE_INT_MIN
3426 when given by a va_list argument, and a non-negative value
3427 when specified in the format string itself. */
3428 HOST_WIDE_INT width = -1;
3429 HOST_WIDE_INT precision = -1;
3430
3431 /* Pointers to the beginning of the width and precision decimal
3432 string (if any) within the directive. */
3433 const char *pwidth = 0;
3434 const char *pprec = 0;
3435
3436 /* When the value of the decimal string that specifies width or
3437 precision is out of range, points to the digit that causes
3438 the value to exceed the limit. */
3439 const char *werange = NULL;
3440 const char *perange = NULL;
3441
3442 /* Width specified via the asterisk. Need not be INTEGER_CST.
3443 For vararg functions set to void_node. */
3444 tree star_width = NULL_TREE;
3445
3446 /* Width specified via the asterisk. Need not be INTEGER_CST.
3447 For vararg functions set to void_node. */
3448 tree star_precision = NULL_TREE;
3449
3450 if (ISDIGIT (target_to_host (*pf)))
3451 {
3452 /* This could be either a POSIX positional argument, the '0'
3453 flag, or a width, depending on what follows. Store it as
3454 width and sort it out later after the next character has
3455 been seen. */
3456 pwidth = pf;
3457 width = target_strtowi (&pf, &werange);
3458 }
3459 else if (target_to_host (*pf) == '*')
3460 {
3461 /* Similarly to the block above, this could be either a POSIX
3462 positional argument or a width, depending on what follows. */
3463 if (*argno < gimple_call_num_args (info.callstmt))
3464 star_width = gimple_call_arg (info.callstmt, (*argno)++);
3465 else
3466 star_width = void_node;
3467 ++pf;
3468 }
3469
3470 if (target_to_host (*pf) == '$')
3471 {
3472 /* Handle the POSIX dollar sign which references the 1-based
3473 positional argument number. */
3474 if (width != -1)
3475 dollar = width + info.argidx;
3476 else if (star_width
3477 && TREE_CODE (star_width) == INTEGER_CST
3478 && (TYPE_PRECISION (TREE_TYPE (star_width))
3479 <= TYPE_PRECISION (integer_type_node)))
3480 dollar = width + tree_to_shwi (star_width);
3481
3482 /* Bail when the numbered argument is out of range (it will
3483 have already been diagnosed by -Wformat). */
3484 if (dollar == 0
3485 || dollar == (int)info.argidx
3486 || dollar > gimple_call_num_args (info.callstmt))
3487 return false;
3488
3489 --dollar;
3490
3491 star_width = NULL_TREE;
3492 width = -1;
3493 ++pf;
3494 }
3495
3496 if (dollar || !star_width)
3497 {
3498 if (width != -1)
3499 {
3500 if (width == 0)
3501 {
3502 /* The '0' that has been interpreted as a width above is
3503 actually a flag. Reset HAVE_WIDTH, set the '0' flag,
3504 and continue processing other flags. */
3505 width = -1;
3506 dir.set_flag ('0');
3507 }
3508 else if (!dollar)
3509 {
3510 /* (Non-zero) width has been seen. The next character
3511 is either a period or a digit. */
3512 goto start_precision;
3513 }
3514 }
3515 /* When either '$' has been seen, or width has not been seen,
3516 the next field is the optional flags followed by an optional
3517 width. */
3518 for ( ; ; ) {
3519 switch (target_to_host (*pf))
3520 {
3521 case ' ':
3522 case '0':
3523 case '+':
3524 case '-':
3525 case '#':
3526 dir.set_flag (target_to_host (*pf++));
3527 break;
3528
3529 default:
3530 goto start_width;
3531 }
3532 }
3533
3534 start_width:
3535 if (ISDIGIT (target_to_host (*pf)))
3536 {
3537 werange = 0;
3538 pwidth = pf;
3539 width = target_strtowi (&pf, &werange);
3540 }
3541 else if (target_to_host (*pf) == '*')
3542 {
3543 if (*argno < gimple_call_num_args (info.callstmt))
3544 star_width = gimple_call_arg (info.callstmt, (*argno)++);
3545 else
3546 {
3547 /* This is (likely) a va_list. It could also be an invalid
3548 call with insufficient arguments. */
3549 star_width = void_node;
3550 }
3551 ++pf;
3552 }
3553 else if (target_to_host (*pf) == '\'')
3554 {
3555 /* The POSIX apostrophe indicating a numeric grouping
3556 in the current locale. Even though it's possible to
3557 estimate the upper bound on the size of the output
3558 based on the number of digits it probably isn't worth
3559 continuing. */
3560 return 0;
3561 }
3562 }
3563
3564 start_precision:
3565 if (target_to_host (*pf) == '.')
3566 {
3567 ++pf;
3568
3569 if (ISDIGIT (target_to_host (*pf)))
3570 {
3571 pprec = pf;
3572 precision = target_strtowi (&pf, &perange);
3573 }
3574 else if (target_to_host (*pf) == '*')
3575 {
3576 if (*argno < gimple_call_num_args (info.callstmt))
3577 star_precision = gimple_call_arg (info.callstmt, (*argno)++);
3578 else
3579 {
3580 /* This is (likely) a va_list. It could also be an invalid
3581 call with insufficient arguments. */
3582 star_precision = void_node;
3583 }
3584 ++pf;
3585 }
3586 else
3587 {
3588 /* The decimal precision or the asterisk are optional.
3589 When neither is dirified it's taken to be zero. */
3590 precision = 0;
3591 }
3592 }
3593
3594 switch (target_to_host (*pf))
3595 {
3596 case 'h':
3597 if (target_to_host (pf[1]) == 'h')
3598 {
3599 ++pf;
3600 dir.modifier = FMT_LEN_hh;
3601 }
3602 else
3603 dir.modifier = FMT_LEN_h;
3604 ++pf;
3605 break;
3606
3607 case 'j':
3608 dir.modifier = FMT_LEN_j;
3609 ++pf;
3610 break;
3611
3612 case 'L':
3613 dir.modifier = FMT_LEN_L;
3614 ++pf;
3615 break;
3616
3617 case 'l':
3618 if (target_to_host (pf[1]) == 'l')
3619 {
3620 ++pf;
3621 dir.modifier = FMT_LEN_ll;
3622 }
3623 else
3624 dir.modifier = FMT_LEN_l;
3625 ++pf;
3626 break;
3627
3628 case 't':
3629 dir.modifier = FMT_LEN_t;
3630 ++pf;
3631 break;
3632
3633 case 'z':
3634 dir.modifier = FMT_LEN_z;
3635 ++pf;
3636 break;
3637 }
3638
3639 switch (target_to_host (*pf))
3640 {
3641 /* Handle a sole '%' character the same as "%%" but since it's
3642 undefined prevent the result from being folded. */
3643 case '\0':
3644 --pf;
3645 res->range.min = res->range.max = HOST_WIDE_INT_M1U;
3646 /* FALLTHRU */
3647 case '%':
3648 dir.fmtfunc = format_percent;
3649 break;
3650
3651 case 'a':
3652 case 'A':
3653 case 'e':
3654 case 'E':
3655 case 'f':
3656 case 'F':
3657 case 'g':
3658 case 'G':
3659 res->floating = true;
3660 dir.fmtfunc = format_floating;
3661 break;
3662
3663 case 'd':
3664 case 'i':
3665 case 'o':
3666 case 'u':
3667 case 'x':
3668 case 'X':
3669 dir.fmtfunc = format_integer;
3670 break;
3671
3672 case 'p':
3673 /* The %p output is implementation-defined. It's possible
3674 to determine this format but due to extensions (edirially
3675 those of the Linux kernel -- see bug 78512) the first %p
3676 in the format string disables any further processing. */
3677 return false;
3678
3679 case 'n':
3680 /* %n has side-effects even when nothing is actually printed to
3681 any buffer. */
3682 info.nowrite = false;
3683 dir.fmtfunc = format_none;
3684 break;
3685
3686 case 'C':
3687 case 'c':
3688 /* POSIX wide character and C/POSIX narrow character. */
3689 dir.fmtfunc = format_character;
3690 break;
3691
3692 case 'S':
3693 case 's':
3694 /* POSIX wide string and C/POSIX narrow character string. */
3695 dir.fmtfunc = format_string;
3696 break;
3697
3698 default:
3699 /* Unknown conversion specification. */
3700 return 0;
3701 }
3702
3703 dir.specifier = target_to_host (*pf++);
3704
3705 /* Store the length of the format directive. */
3706 dir.len = pf - pcnt;
3707
3708 /* Buffer for the directive in the host character set (used when
3709 the source character set is different). */
3710 char hostdir[32];
3711
3712 if (star_width)
3713 {
3714 if (INTEGRAL_TYPE_P (TREE_TYPE (star_width)))
3715 dir.set_width (star_width, vr_values);
3716 else
3717 {
3718 /* Width specified by a va_list takes on the range [0, -INT_MIN]
3719 (width is the absolute value of that specified). */
3720 dir.width[0] = 0;
3721 dir.width[1] = target_int_max () + 1;
3722 }
3723 }
3724 else
3725 {
3726 if (width == HOST_WIDE_INT_MAX && werange)
3727 {
3728 size_t begin = dir.beg - info.fmtstr + (pwidth - pcnt);
3729 size_t caret = begin + (werange - pcnt);
3730 size_t end = pf - info.fmtstr - 1;
3731
3732 /* Create a location for the width part of the directive,
3733 pointing the caret at the first out-of-range digit. */
3734 substring_loc dirloc (info.fmtloc, TREE_TYPE (info.format),
3735 caret, begin, end);
3736
3737 fmtwarn (dirloc, UNKNOWN_LOCATION, NULL, info.warnopt (),
3738 "%<%.*s%> directive width out of range", (int) dir.len,
3739 target_to_host (hostdir, sizeof hostdir, dir.beg));
3740 }
3741
3742 dir.set_width (width);
3743 }
3744
3745 if (star_precision)
3746 {
3747 if (INTEGRAL_TYPE_P (TREE_TYPE (star_precision)))
3748 dir.set_precision (star_precision, vr_values);
3749 else
3750 {
3751 /* Precision specified by a va_list takes on the range [-1, INT_MAX]
3752 (unlike width, negative precision is ignored). */
3753 dir.prec[0] = -1;
3754 dir.prec[1] = target_int_max ();
3755 }
3756 }
3757 else
3758 {
3759 if (precision == HOST_WIDE_INT_MAX && perange)
3760 {
3761 size_t begin = dir.beg - info.fmtstr + (pprec - pcnt) - 1;
3762 size_t caret = dir.beg - info.fmtstr + (perange - pcnt) - 1;
3763 size_t end = pf - info.fmtstr - 2;
3764
3765 /* Create a location for the precision part of the directive,
3766 including the leading period, pointing the caret at the first
3767 out-of-range digit . */
3768 substring_loc dirloc (info.fmtloc, TREE_TYPE (info.format),
3769 caret, begin, end);
3770
3771 fmtwarn (dirloc, UNKNOWN_LOCATION, NULL, info.warnopt (),
3772 "%<%.*s%> directive precision out of range", (int) dir.len,
3773 target_to_host (hostdir, sizeof hostdir, dir.beg));
3774 }
3775
3776 dir.set_precision (precision);
3777 }
3778
3779 /* Extract the argument if the directive takes one and if it's
3780 available (e.g., the function doesn't take a va_list). Treat
3781 missing arguments the same as va_list, even though they will
3782 have likely already been diagnosed by -Wformat. */
3783 if (dir.specifier != '%'
3784 && *argno < gimple_call_num_args (info.callstmt))
3785 dir.arg = gimple_call_arg (info.callstmt, dollar ? dollar : (*argno)++);
3786
3787 if (dump_file)
3788 {
3789 fprintf (dump_file,
3790 " Directive %u at offset " HOST_WIDE_INT_PRINT_UNSIGNED
3791 ": \"%.*s\"",
3792 dir.dirno,
3793 (unsigned HOST_WIDE_INT)(size_t)(dir.beg - info.fmtstr),
3794 (int)dir.len, dir.beg);
3795 if (star_width)
3796 {
3797 if (dir.width[0] == dir.width[1])
3798 fprintf (dump_file, ", width = " HOST_WIDE_INT_PRINT_DEC,
3799 dir.width[0]);
3800 else
3801 fprintf (dump_file,
3802 ", width in range [" HOST_WIDE_INT_PRINT_DEC
3803 ", " HOST_WIDE_INT_PRINT_DEC "]",
3804 dir.width[0], dir.width[1]);
3805 }
3806
3807 if (star_precision)
3808 {
3809 if (dir.prec[0] == dir.prec[1])
3810 fprintf (dump_file, ", precision = " HOST_WIDE_INT_PRINT_DEC,
3811 dir.prec[0]);
3812 else
3813 fprintf (dump_file,
3814 ", precision in range [" HOST_WIDE_INT_PRINT_DEC
3815 HOST_WIDE_INT_PRINT_DEC "]",
3816 dir.prec[0], dir.prec[1]);
3817 }
3818 fputc ('\n', dump_file);
3819 }
3820
3821 return dir.len;
3822 }
3823
3824 /* Diagnose overlap between destination and %s directive arguments. */
3825
3826 static void
3827 maybe_warn_overlap (call_info &info, format_result *res)
3828 {
3829 /* Two vectors of 1-based indices corresponding to either certainly
3830 or possibly aliasing arguments. */
3831 auto_vec<int, 16> aliasarg[2];
3832
3833 /* Go through the array of potentially aliasing directives and collect
3834 argument numbers of those that do or may overlap the destination
3835 object given the full result. */
3836 for (unsigned i = 0; i != res->alias_count; ++i)
3837 {
3838 const format_result::alias_info &alias = res->aliases[i];
3839
3840 enum { possible = -1, none = 0, certain = 1 } overlap = none;
3841
3842 /* If the precision is zero there is no overlap. (This only
3843 considers %s directives and ignores %n.) */
3844 if (alias.dir.prec[0] == 0 && alias.dir.prec[1] == 0)
3845 continue;
3846
3847 if (alias.offset == HOST_WIDE_INT_MAX
3848 || info.dst_offset == HOST_WIDE_INT_MAX)
3849 overlap = possible;
3850 else if (alias.offset == info.dst_offset)
3851 overlap = alias.dir.prec[0] == 0 ? possible : certain;
3852 else
3853 {
3854 /* Determine overlap from the range of output and offsets
3855 into the same destination as the source, and rule out
3856 impossible overlap. */
3857 unsigned HOST_WIDE_INT albeg = alias.offset;
3858 unsigned HOST_WIDE_INT dstbeg = info.dst_offset;
3859
3860 unsigned HOST_WIDE_INT alend = albeg + alias.range.min;
3861 unsigned HOST_WIDE_INT dstend = dstbeg + res->range.min - 1;
3862
3863 if ((albeg <= dstbeg && alend > dstbeg)
3864 || (albeg >= dstbeg && albeg < dstend))
3865 overlap = certain;
3866 else
3867 {
3868 alend = albeg + alias.range.max;
3869 if (alend < albeg)
3870 alend = HOST_WIDE_INT_M1U;
3871
3872 dstend = dstbeg + res->range.max - 1;
3873 if (dstend < dstbeg)
3874 dstend = HOST_WIDE_INT_M1U;
3875
3876 if ((albeg >= dstbeg && albeg <= dstend)
3877 || (alend >= dstbeg && alend <= dstend))
3878 overlap = possible;
3879 }
3880 }
3881
3882 if (overlap == none)
3883 continue;
3884
3885 /* Append the 1-based argument number. */
3886 aliasarg[overlap != certain].safe_push (alias.dir.argno + 1);
3887
3888 /* Disable any kind of optimization. */
3889 res->range.unlikely = HOST_WIDE_INT_M1U;
3890 }
3891
3892 tree arg0 = gimple_call_arg (info.callstmt, 0);
3893 location_t loc = gimple_location (info.callstmt);
3894
3895 bool aliaswarn = false;
3896
3897 unsigned ncertain = aliasarg[0].length ();
3898 unsigned npossible = aliasarg[1].length ();
3899 if (ncertain && npossible)
3900 {
3901 /* If there are multiple arguments that overlap, some certainly
3902 and some possibly, handle both sets in a single diagnostic. */
3903 aliaswarn
3904 = warning_at (loc, OPT_Wrestrict,
3905 "%qE arguments %Z and maybe %Z overlap destination "
3906 "object %qE",
3907 info.func, aliasarg[0].address (), ncertain,
3908 aliasarg[1].address (), npossible,
3909 info.dst_origin);
3910 }
3911 else if (ncertain)
3912 {
3913 /* There is only one set of two or more arguments and they all
3914 certainly overlap the destination. */
3915 aliaswarn
3916 = warning_n (loc, OPT_Wrestrict, ncertain,
3917 "%qE argument %Z overlaps destination object %qE",
3918 "%qE arguments %Z overlap destination object %qE",
3919 info.func, aliasarg[0].address (), ncertain,
3920 info.dst_origin);
3921 }
3922 else if (npossible)
3923 {
3924 /* There is only one set of two or more arguments and they all
3925 may overlap (but need not). */
3926 aliaswarn
3927 = warning_n (loc, OPT_Wrestrict, npossible,
3928 "%qE argument %Z may overlap destination object %qE",
3929 "%qE arguments %Z may overlap destination object %qE",
3930 info.func, aliasarg[1].address (), npossible,
3931 info.dst_origin);
3932 }
3933
3934 if (aliaswarn)
3935 {
3936 res->warned = true;
3937
3938 if (info.dst_origin != arg0)
3939 {
3940 /* If its location is different from the first argument of the call
3941 point either at the destination object itself or at the expression
3942 that was used to determine the overlap. */
3943 loc = (DECL_P (info.dst_origin)
3944 ? DECL_SOURCE_LOCATION (info.dst_origin)
3945 : EXPR_LOCATION (info.dst_origin));
3946 if (loc != UNKNOWN_LOCATION)
3947 inform (loc,
3948 "destination object referenced by %<restrict%>-qualified "
3949 "argument 1 was declared here");
3950 }
3951 }
3952 }
3953
3954 /* Compute the length of the output resulting from the call to a formatted
3955 output function described by INFO and store the result of the call in
3956 *RES. Issue warnings for detected past the end writes. Return true
3957 if the complete format string has been processed and *RES can be relied
3958 on, false otherwise (e.g., when a unknown or unhandled directive was seen
3959 that caused the processing to be terminated early). */
3960
3961 static bool
3962 compute_format_length (call_info &info, format_result *res, const vr_values *vr)
3963 {
3964 if (dump_file)
3965 {
3966 location_t callloc = gimple_location (info.callstmt);
3967 fprintf (dump_file, "%s:%i: ",
3968 LOCATION_FILE (callloc), LOCATION_LINE (callloc));
3969 print_generic_expr (dump_file, info.func, dump_flags);
3970
3971 fprintf (dump_file,
3972 ": objsize = " HOST_WIDE_INT_PRINT_UNSIGNED
3973 ", fmtstr = \"%s\"\n",
3974 info.objsize, info.fmtstr);
3975 }
3976
3977 /* Reset the minimum and maximum byte counters. */
3978 res->range.min = res->range.max = 0;
3979
3980 /* No directive has been seen yet so the length of output is bounded
3981 by the known range [0, 0] (with no conversion resulting in a failure
3982 or producing more than 4K bytes) until determined otherwise. */
3983 res->knownrange = true;
3984 res->floating = false;
3985 res->warned = false;
3986
3987 /* 1-based directive counter. */
3988 unsigned dirno = 1;
3989
3990 /* The variadic argument counter. */
3991 unsigned argno = info.argidx;
3992
3993 bool success = true;
3994
3995 for (const char *pf = info.fmtstr; ; ++dirno)
3996 {
3997 directive dir (&info, dirno);
3998
3999 size_t n = parse_directive (info, dir, res, pf, &argno, vr);
4000
4001 /* Return failure if the format function fails. */
4002 if (!format_directive (info, res, dir, vr))
4003 return false;
4004
4005 /* Return success when the directive is zero bytes long and it's
4006 the last thing in the format string (i.e., it's the terminating
4007 nul, which isn't really a directive but handling it as one makes
4008 things simpler). */
4009 if (!n)
4010 {
4011 success = *pf == '\0';
4012 break;
4013 }
4014
4015 pf += n;
4016 }
4017
4018 maybe_warn_overlap (info, res);
4019
4020 /* The complete format string was processed (with or without warnings). */
4021 return success;
4022 }
4023
4024 /* Return the size of the object referenced by the expression DEST if
4025 available, or the maximum possible size otherwise. */
4026
4027 static unsigned HOST_WIDE_INT
4028 get_destination_size (tree dest)
4029 {
4030 /* When there is no destination return the maximum. */
4031 if (!dest)
4032 return HOST_WIDE_INT_MAX;
4033
4034 /* Initialize object size info before trying to compute it. */
4035 init_object_sizes ();
4036
4037 /* Use __builtin_object_size to determine the size of the destination
4038 object. When optimizing, determine the smallest object (such as
4039 a member array as opposed to the whole enclosing object), otherwise
4040 use type-zero object size to determine the size of the enclosing
4041 object (the function fails without optimization in this type). */
4042 int ost = optimize > 0;
4043 unsigned HOST_WIDE_INT size;
4044 if (compute_builtin_object_size (dest, ost, &size))
4045 return size;
4046
4047 return HOST_WIDE_INT_MAX;
4048 }
4049
4050 /* Return true if the call described by INFO with result RES safe to
4051 optimize (i.e., no undefined behavior), and set RETVAL to the range
4052 of its return values. */
4053
4054 static bool
4055 is_call_safe (const call_info &info,
4056 const format_result &res, bool under4k,
4057 unsigned HOST_WIDE_INT retval[2])
4058 {
4059 if (under4k && !res.posunder4k)
4060 return false;
4061
4062 /* The minimum return value. */
4063 retval[0] = res.range.min;
4064
4065 /* The maximum return value is in most cases bounded by RES.RANGE.MAX
4066 but in cases involving multibyte characters could be as large as
4067 RES.RANGE.UNLIKELY. */
4068 retval[1]
4069 = res.range.unlikely < res.range.max ? res.range.max : res.range.unlikely;
4070
4071 /* Adjust the number of bytes which includes the terminating nul
4072 to reflect the return value of the function which does not.
4073 Because the valid range of the function is [INT_MIN, INT_MAX],
4074 a valid range before the adjustment below is [0, INT_MAX + 1]
4075 (the functions only return negative values on error or undefined
4076 behavior). */
4077 if (retval[0] <= target_int_max () + 1)
4078 --retval[0];
4079 if (retval[1] <= target_int_max () + 1)
4080 --retval[1];
4081
4082 /* Avoid the return value optimization when the behavior of the call
4083 is undefined either because any directive may have produced 4K or
4084 more of output, or the return value exceeds INT_MAX, or because
4085 the output overflows the destination object (but leave it enabled
4086 when the function is bounded because then the behavior is well-
4087 defined). */
4088 if (retval[0] == retval[1]
4089 && (info.bounded || retval[0] < info.objsize)
4090 && retval[0] <= target_int_max ())
4091 return true;
4092
4093 if ((info.bounded || retval[1] < info.objsize)
4094 && (retval[0] < target_int_max ()
4095 && retval[1] < target_int_max ()))
4096 return true;
4097
4098 if (!under4k && (info.bounded || retval[0] < info.objsize))
4099 return true;
4100
4101 return false;
4102 }
4103
4104 /* Given a suitable result RES of a call to a formatted output function
4105 described by INFO, substitute the result for the return value of
4106 the call. The result is suitable if the number of bytes it represents
4107 is known and exact. A result that isn't suitable for substitution may
4108 have its range set to the range of return values, if that is known.
4109 Return true if the call is removed and gsi_next should not be performed
4110 in the caller. */
4111
4112 static bool
4113 try_substitute_return_value (gimple_stmt_iterator *gsi,
4114 const call_info &info,
4115 const format_result &res)
4116 {
4117 tree lhs = gimple_get_lhs (info.callstmt);
4118
4119 /* Set to true when the entire call has been removed. */
4120 bool removed = false;
4121
4122 /* The minimum and maximum return value. */
4123 unsigned HOST_WIDE_INT retval[2] = {0};
4124 bool safe = is_call_safe (info, res, true, retval);
4125
4126 if (safe
4127 && retval[0] == retval[1]
4128 /* Not prepared to handle possibly throwing calls here; they shouldn't
4129 appear in non-artificial testcases, except when the __*_chk routines
4130 are badly declared. */
4131 && !stmt_ends_bb_p (info.callstmt))
4132 {
4133 tree cst = build_int_cst (lhs ? TREE_TYPE (lhs) : integer_type_node,
4134 retval[0]);
4135
4136 if (lhs == NULL_TREE && info.nowrite)
4137 {
4138 /* Remove the call to the bounded function with a zero size
4139 (e.g., snprintf(0, 0, "%i", 123)) if there is no lhs. */
4140 unlink_stmt_vdef (info.callstmt);
4141 gsi_remove (gsi, true);
4142 removed = true;
4143 }
4144 else if (info.nowrite)
4145 {
4146 /* Replace the call to the bounded function with a zero size
4147 (e.g., snprintf(0, 0, "%i", 123) with the constant result
4148 of the function. */
4149 if (!update_call_from_tree (gsi, cst))
4150 gimplify_and_update_call_from_tree (gsi, cst);
4151 gimple *callstmt = gsi_stmt (*gsi);
4152 update_stmt (callstmt);
4153 }
4154 else if (lhs)
4155 {
4156 /* Replace the left-hand side of the call with the constant
4157 result of the formatted function. */
4158 gimple_call_set_lhs (info.callstmt, NULL_TREE);
4159 gimple *g = gimple_build_assign (lhs, cst);
4160 gsi_insert_after (gsi, g, GSI_NEW_STMT);
4161 update_stmt (info.callstmt);
4162 }
4163
4164 if (dump_file)
4165 {
4166 if (removed)
4167 fprintf (dump_file, " Removing call statement.");
4168 else
4169 {
4170 fprintf (dump_file, " Substituting ");
4171 print_generic_expr (dump_file, cst, dump_flags);
4172 fprintf (dump_file, " for %s.\n",
4173 info.nowrite ? "statement" : "return value");
4174 }
4175 }
4176 }
4177 else if (lhs && types_compatible_p (TREE_TYPE (lhs), integer_type_node))
4178 {
4179 bool setrange = false;
4180
4181 if (safe
4182 && (info.bounded || retval[1] < info.objsize)
4183 && (retval[0] < target_int_max ()
4184 && retval[1] < target_int_max ()))
4185 {
4186 /* If the result is in a valid range bounded by the size of
4187 the destination set it so that it can be used for subsequent
4188 optimizations. */
4189 int prec = TYPE_PRECISION (integer_type_node);
4190
4191 wide_int min = wi::shwi (retval[0], prec);
4192 wide_int max = wi::shwi (retval[1], prec);
4193 set_range_info (lhs, VR_RANGE, min, max);
4194
4195 setrange = true;
4196 }
4197
4198 if (dump_file)
4199 {
4200 const char *inbounds
4201 = (retval[0] < info.objsize
4202 ? (retval[1] < info.objsize
4203 ? "in" : "potentially out-of")
4204 : "out-of");
4205
4206 const char *what = setrange ? "Setting" : "Discarding";
4207 if (retval[0] != retval[1])
4208 fprintf (dump_file,
4209 " %s %s-bounds return value range ["
4210 HOST_WIDE_INT_PRINT_UNSIGNED ", "
4211 HOST_WIDE_INT_PRINT_UNSIGNED "].\n",
4212 what, inbounds, retval[0], retval[1]);
4213 else
4214 fprintf (dump_file, " %s %s-bounds return value "
4215 HOST_WIDE_INT_PRINT_UNSIGNED ".\n",
4216 what, inbounds, retval[0]);
4217 }
4218 }
4219
4220 if (dump_file)
4221 fputc ('\n', dump_file);
4222
4223 return removed;
4224 }
4225
4226 /* Try to simplify a s{,n}printf call described by INFO with result
4227 RES by replacing it with a simpler and presumably more efficient
4228 call (such as strcpy). */
4229
4230 static bool
4231 try_simplify_call (gimple_stmt_iterator *gsi,
4232 const call_info &info,
4233 const format_result &res)
4234 {
4235 unsigned HOST_WIDE_INT dummy[2];
4236 if (!is_call_safe (info, res, info.retval_used (), dummy))
4237 return false;
4238
4239 switch (info.fncode)
4240 {
4241 case BUILT_IN_SNPRINTF:
4242 return gimple_fold_builtin_snprintf (gsi);
4243
4244 case BUILT_IN_SPRINTF:
4245 return gimple_fold_builtin_sprintf (gsi);
4246
4247 default:
4248 ;
4249 }
4250
4251 return false;
4252 }
4253
4254 /* Return the zero-based index of the format string argument of a printf
4255 like function and set *IDX_ARGS to the first format argument. When
4256 no such index exists return UINT_MAX. */
4257
4258 static unsigned
4259 get_user_idx_format (tree fndecl, unsigned *idx_args)
4260 {
4261 tree attrs = lookup_attribute ("format", DECL_ATTRIBUTES (fndecl));
4262 if (!attrs)
4263 attrs = lookup_attribute ("format", TYPE_ATTRIBUTES (TREE_TYPE (fndecl)));
4264
4265 if (!attrs)
4266 return UINT_MAX;
4267
4268 attrs = TREE_VALUE (attrs);
4269
4270 tree archetype = TREE_VALUE (attrs);
4271 if (strcmp ("printf", IDENTIFIER_POINTER (archetype)))
4272 return UINT_MAX;
4273
4274 attrs = TREE_CHAIN (attrs);
4275 tree fmtarg = TREE_VALUE (attrs);
4276
4277 attrs = TREE_CHAIN (attrs);
4278 tree elliparg = TREE_VALUE (attrs);
4279
4280 /* Attribute argument indices are 1-based but we use zero-based. */
4281 *idx_args = tree_to_uhwi (elliparg) - 1;
4282 return tree_to_uhwi (fmtarg) - 1;
4283 }
4284
4285 } /* Unnamed namespace. */
4286
4287 /* Determine if a GIMPLE call at *GSI is to one of the sprintf-like built-in
4288 functions and if so, handle it. Return true if the call is removed and
4289 gsi_next should not be performed in the caller. */
4290
4291 bool
4292 handle_printf_call (gimple_stmt_iterator *gsi, const vr_values *vr_values)
4293 {
4294 init_target_to_host_charmap ();
4295
4296 call_info info = call_info ();
4297
4298 info.callstmt = gsi_stmt (*gsi);
4299 info.func = gimple_call_fndecl (info.callstmt);
4300 if (!info.func)
4301 return false;
4302
4303 /* Format string argument number (valid for all functions). */
4304 unsigned idx_format = UINT_MAX;
4305 if (gimple_call_builtin_p (info.callstmt, BUILT_IN_NORMAL))
4306 info.fncode = DECL_FUNCTION_CODE (info.func);
4307 else
4308 {
4309 unsigned idx_args;
4310 idx_format = get_user_idx_format (info.func, &idx_args);
4311 if (idx_format == UINT_MAX
4312 || idx_format >= gimple_call_num_args (info.callstmt)
4313 || idx_args > gimple_call_num_args (info.callstmt)
4314 || !POINTER_TYPE_P (TREE_TYPE (gimple_call_arg (info.callstmt,
4315 idx_format))))
4316 return false;
4317 info.fncode = BUILT_IN_NONE;
4318 info.argidx = idx_args;
4319 }
4320
4321 /* The size of the destination as in snprintf(dest, size, ...). */
4322 unsigned HOST_WIDE_INT dstsize = HOST_WIDE_INT_M1U;
4323
4324 /* The size of the destination determined by __builtin_object_size. */
4325 unsigned HOST_WIDE_INT objsize = HOST_WIDE_INT_M1U;
4326
4327 /* Zero-based buffer size argument number (snprintf and vsnprintf). */
4328 unsigned idx_dstsize = UINT_MAX;
4329
4330 /* Object size argument number (snprintf_chk and vsnprintf_chk). */
4331 unsigned idx_objsize = UINT_MAX;
4332
4333 /* Destinaton argument number (valid for sprintf functions only). */
4334 unsigned idx_dstptr = 0;
4335
4336 switch (info.fncode)
4337 {
4338 case BUILT_IN_NONE:
4339 // User-defined function with attribute format (printf).
4340 idx_dstptr = -1;
4341 break;
4342
4343 case BUILT_IN_FPRINTF:
4344 // Signature:
4345 // __builtin_fprintf (FILE*, format, ...)
4346 idx_format = 1;
4347 info.argidx = 2;
4348 idx_dstptr = -1;
4349 break;
4350
4351 case BUILT_IN_FPRINTF_CHK:
4352 // Signature:
4353 // __builtin_fprintf_chk (FILE*, ost, format, ...)
4354 idx_format = 2;
4355 info.argidx = 3;
4356 idx_dstptr = -1;
4357 break;
4358
4359 case BUILT_IN_FPRINTF_UNLOCKED:
4360 // Signature:
4361 // __builtin_fprintf_unnlocked (FILE*, format, ...)
4362 idx_format = 1;
4363 info.argidx = 2;
4364 idx_dstptr = -1;
4365 break;
4366
4367 case BUILT_IN_PRINTF:
4368 // Signature:
4369 // __builtin_printf (format, ...)
4370 idx_format = 0;
4371 info.argidx = 1;
4372 idx_dstptr = -1;
4373 break;
4374
4375 case BUILT_IN_PRINTF_CHK:
4376 // Signature:
4377 // __builtin_printf_chk (ost, format, ...)
4378 idx_format = 1;
4379 info.argidx = 2;
4380 idx_dstptr = -1;
4381 break;
4382
4383 case BUILT_IN_PRINTF_UNLOCKED:
4384 // Signature:
4385 // __builtin_printf (format, ...)
4386 idx_format = 0;
4387 info.argidx = 1;
4388 idx_dstptr = -1;
4389 break;
4390
4391 case BUILT_IN_SPRINTF:
4392 // Signature:
4393 // __builtin_sprintf (dst, format, ...)
4394 idx_format = 1;
4395 info.argidx = 2;
4396 break;
4397
4398 case BUILT_IN_SPRINTF_CHK:
4399 // Signature:
4400 // __builtin___sprintf_chk (dst, ost, objsize, format, ...)
4401 idx_objsize = 2;
4402 idx_format = 3;
4403 info.argidx = 4;
4404 break;
4405
4406 case BUILT_IN_SNPRINTF:
4407 // Signature:
4408 // __builtin_snprintf (dst, size, format, ...)
4409 idx_dstsize = 1;
4410 idx_format = 2;
4411 info.argidx = 3;
4412 info.bounded = true;
4413 break;
4414
4415 case BUILT_IN_SNPRINTF_CHK:
4416 // Signature:
4417 // __builtin___snprintf_chk (dst, size, ost, objsize, format, ...)
4418 idx_dstsize = 1;
4419 idx_objsize = 3;
4420 idx_format = 4;
4421 info.argidx = 5;
4422 info.bounded = true;
4423 break;
4424
4425 case BUILT_IN_VFPRINTF:
4426 // Signature:
4427 // __builtin_vprintf (FILE*, format, va_list)
4428 idx_format = 1;
4429 info.argidx = -1;
4430 idx_dstptr = -1;
4431 break;
4432
4433 case BUILT_IN_VFPRINTF_CHK:
4434 // Signature:
4435 // __builtin___vfprintf_chk (FILE*, ost, format, va_list)
4436 idx_format = 2;
4437 info.argidx = -1;
4438 idx_dstptr = -1;
4439 break;
4440
4441 case BUILT_IN_VPRINTF:
4442 // Signature:
4443 // __builtin_vprintf (format, va_list)
4444 idx_format = 0;
4445 info.argidx = -1;
4446 idx_dstptr = -1;
4447 break;
4448
4449 case BUILT_IN_VPRINTF_CHK:
4450 // Signature:
4451 // __builtin___vprintf_chk (ost, format, va_list)
4452 idx_format = 1;
4453 info.argidx = -1;
4454 idx_dstptr = -1;
4455 break;
4456
4457 case BUILT_IN_VSNPRINTF:
4458 // Signature:
4459 // __builtin_vsprintf (dst, size, format, va)
4460 idx_dstsize = 1;
4461 idx_format = 2;
4462 info.argidx = -1;
4463 info.bounded = true;
4464 break;
4465
4466 case BUILT_IN_VSNPRINTF_CHK:
4467 // Signature:
4468 // __builtin___vsnprintf_chk (dst, size, ost, objsize, format, va)
4469 idx_dstsize = 1;
4470 idx_objsize = 3;
4471 idx_format = 4;
4472 info.argidx = -1;
4473 info.bounded = true;
4474 break;
4475
4476 case BUILT_IN_VSPRINTF:
4477 // Signature:
4478 // __builtin_vsprintf (dst, format, va)
4479 idx_format = 1;
4480 info.argidx = -1;
4481 break;
4482
4483 case BUILT_IN_VSPRINTF_CHK:
4484 // Signature:
4485 // __builtin___vsprintf_chk (dst, ost, objsize, format, va)
4486 idx_format = 3;
4487 idx_objsize = 2;
4488 info.argidx = -1;
4489 break;
4490
4491 default:
4492 return false;
4493 }
4494
4495 /* Set the global warning level for this function. */
4496 warn_level = info.bounded ? warn_format_trunc : warn_format_overflow;
4497
4498 /* For all string functions the first argument is a pointer to
4499 the destination. */
4500 tree dstptr = (idx_dstptr < gimple_call_num_args (info.callstmt)
4501 ? gimple_call_arg (info.callstmt, 0) : NULL_TREE);
4502
4503 info.format = gimple_call_arg (info.callstmt, idx_format);
4504
4505 /* True when the destination size is constant as opposed to the lower
4506 or upper bound of a range. */
4507 bool dstsize_cst_p = true;
4508 bool posunder4k = true;
4509
4510 if (idx_dstsize == UINT_MAX)
4511 {
4512 /* For non-bounded functions like sprintf, determine the size
4513 of the destination from the object or pointer passed to it
4514 as the first argument. */
4515 dstsize = get_destination_size (dstptr);
4516 }
4517 else if (tree size = gimple_call_arg (info.callstmt, idx_dstsize))
4518 {
4519 /* For bounded functions try to get the size argument. */
4520
4521 if (TREE_CODE (size) == INTEGER_CST)
4522 {
4523 dstsize = tree_to_uhwi (size);
4524 /* No object can be larger than SIZE_MAX bytes (half the address
4525 space) on the target.
4526 The functions are defined only for output of at most INT_MAX
4527 bytes. Specifying a bound in excess of that limit effectively
4528 defeats the bounds checking (and on some implementations such
4529 as Solaris cause the function to fail with EINVAL). */
4530 if (dstsize > target_size_max () / 2)
4531 {
4532 /* Avoid warning if -Wstringop-overflow is specified since
4533 it also warns for the same thing though only for the
4534 checking built-ins. */
4535 if ((idx_objsize == UINT_MAX
4536 || !warn_stringop_overflow))
4537 warning_at (gimple_location (info.callstmt), info.warnopt (),
4538 "specified bound %wu exceeds maximum object size "
4539 "%wu",
4540 dstsize, target_size_max () / 2);
4541 /* POSIX requires snprintf to fail if DSTSIZE is greater
4542 than INT_MAX. Even though not all POSIX implementations
4543 conform to the requirement, avoid folding in this case. */
4544 posunder4k = false;
4545 }
4546 else if (dstsize > target_int_max ())
4547 {
4548 warning_at (gimple_location (info.callstmt), info.warnopt (),
4549 "specified bound %wu exceeds %<INT_MAX%>",
4550 dstsize);
4551 /* POSIX requires snprintf to fail if DSTSIZE is greater
4552 than INT_MAX. Avoid folding in that case. */
4553 posunder4k = false;
4554 }
4555 }
4556 else if (TREE_CODE (size) == SSA_NAME)
4557 {
4558 /* Try to determine the range of values of the argument
4559 and use the greater of the two at level 1 and the smaller
4560 of them at level 2. */
4561 const value_range_equiv *vr
4562 = CONST_CAST (class vr_values *, vr_values)->get_value_range (size);
4563
4564 if (range_int_cst_p (vr))
4565 {
4566 unsigned HOST_WIDE_INT minsize = TREE_INT_CST_LOW (vr->min ());
4567 unsigned HOST_WIDE_INT maxsize = TREE_INT_CST_LOW (vr->max ());
4568 dstsize = warn_level < 2 ? maxsize : minsize;
4569
4570 if (minsize > target_int_max ())
4571 warning_at (gimple_location (info.callstmt), info.warnopt (),
4572 "specified bound range [%wu, %wu] exceeds "
4573 "%<INT_MAX%>",
4574 minsize, maxsize);
4575
4576 /* POSIX requires snprintf to fail if DSTSIZE is greater
4577 than INT_MAX. Avoid folding if that's possible. */
4578 if (maxsize > target_int_max ())
4579 posunder4k = false;
4580 }
4581 else if (vr->varying_p ())
4582 {
4583 /* POSIX requires snprintf to fail if DSTSIZE is greater
4584 than INT_MAX. Since SIZE's range is unknown, avoid
4585 folding. */
4586 posunder4k = false;
4587 }
4588
4589 /* The destination size is not constant. If the function is
4590 bounded (e.g., snprintf) a lower bound of zero doesn't
4591 necessarily imply it can be eliminated. */
4592 dstsize_cst_p = false;
4593 }
4594 }
4595
4596 if (idx_objsize != UINT_MAX)
4597 if (tree size = gimple_call_arg (info.callstmt, idx_objsize))
4598 if (tree_fits_uhwi_p (size))
4599 objsize = tree_to_uhwi (size);
4600
4601 if (info.bounded && !dstsize)
4602 {
4603 /* As a special case, when the explicitly specified destination
4604 size argument (to a bounded function like snprintf) is zero
4605 it is a request to determine the number of bytes on output
4606 without actually producing any. Pretend the size is
4607 unlimited in this case. */
4608 info.objsize = HOST_WIDE_INT_MAX;
4609 info.nowrite = dstsize_cst_p;
4610 }
4611 else
4612 {
4613 /* For calls to non-bounded functions or to those of bounded
4614 functions with a non-zero size, warn if the destination
4615 pointer is null. */
4616 if (dstptr && integer_zerop (dstptr))
4617 {
4618 /* This is diagnosed with -Wformat only when the null is a constant
4619 pointer. The warning here diagnoses instances where the pointer
4620 is not constant. */
4621 location_t loc = gimple_location (info.callstmt);
4622 warning_at (EXPR_LOC_OR_LOC (dstptr, loc),
4623 info.warnopt (), "%Gnull destination pointer",
4624 info.callstmt);
4625 return false;
4626 }
4627
4628 /* Set the object size to the smaller of the two arguments
4629 of both have been specified and they're not equal. */
4630 info.objsize = dstsize < objsize ? dstsize : objsize;
4631
4632 if (info.bounded
4633 && dstsize < target_size_max () / 2 && objsize < dstsize
4634 /* Avoid warning if -Wstringop-overflow is specified since
4635 it also warns for the same thing though only for the
4636 checking built-ins. */
4637 && (idx_objsize == UINT_MAX
4638 || !warn_stringop_overflow))
4639 {
4640 warning_at (gimple_location (info.callstmt), info.warnopt (),
4641 "specified bound %wu exceeds the size %wu "
4642 "of the destination object", dstsize, objsize);
4643 }
4644 }
4645
4646 /* Determine if the format argument may be null and warn if not
4647 and if the argument is null. */
4648 if (integer_zerop (info.format)
4649 && gimple_call_builtin_p (info.callstmt, BUILT_IN_NORMAL))
4650 {
4651 location_t loc = gimple_location (info.callstmt);
4652 warning_at (EXPR_LOC_OR_LOC (info.format, loc),
4653 info.warnopt (), "%Gnull format string",
4654 info.callstmt);
4655 return false;
4656 }
4657
4658 info.fmtstr = get_format_string (info.format, &info.fmtloc);
4659 if (!info.fmtstr)
4660 return false;
4661
4662 if (warn_restrict)
4663 {
4664 /* Compute the origin of the destination pointer and its offset
4665 from the base object/pointer if possible. */
4666 info.dst_offset = 0;
4667 info.dst_origin = get_origin_and_offset (dstptr, &info.dst_field,
4668 &info.dst_offset);
4669 }
4670
4671 /* The result is the number of bytes output by the formatted function,
4672 including the terminating NUL. */
4673 format_result res;
4674
4675 /* I/O functions with no destination argument (i.e., all forms of fprintf
4676 and printf) may fail under any conditions. Others (i.e., all forms of
4677 sprintf) may only fail under specific conditions determined for each
4678 directive. Clear POSUNDER4K for the former set of functions and set
4679 it to true for the latter (it can only be cleared later, but it is
4680 never set to true again). */
4681 res.posunder4k = posunder4k && dstptr;
4682
4683 bool success = compute_format_length (info, &res, vr_values);
4684 if (res.warned)
4685 gimple_set_no_warning (info.callstmt, true);
4686
4687 /* When optimizing and the printf return value optimization is enabled,
4688 attempt to substitute the computed result for the return value of
4689 the call. Avoid this optimization when -frounding-math is in effect
4690 and the format string contains a floating point directive. */
4691 bool call_removed = false;
4692 if (success && optimize > 0)
4693 {
4694 /* Save a copy of the iterator pointing at the call. The iterator
4695 may change to point past the call in try_substitute_return_value
4696 but the original value is needed in try_simplify_call. */
4697 gimple_stmt_iterator gsi_call = *gsi;
4698
4699 if (flag_printf_return_value
4700 && (!flag_rounding_math || !res.floating))
4701 call_removed = try_substitute_return_value (gsi, info, res);
4702
4703 if (!call_removed)
4704 try_simplify_call (&gsi_call, info, res);
4705 }
4706
4707 return call_removed;
4708 }