//== PrintfFormatString.cpp - Analysis of printf format strings --*- C++ -*-==//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// Handling of format strings in printf and friends.  The structure of format
// strings for fprintf() is described in C99 7.19.6.1.
//
//===----------------------------------------------------------------------===//
13
Tim Northover314fbfa2018-11-02 13:14:11 +000014#include "clang/AST/FormatString.h"
15#include "clang/AST/OSLog.h"
Ted Kremenek02087932010-07-16 02:11:22 +000016#include "FormatStringParsing.h"
Chandler Carruth3a022472012-12-04 09:13:33 +000017#include "clang/Basic/TargetInfo.h"
Ted Kremeneka2e77b42010-01-27 23:43:25 +000018
Hans Wennborgc3b3da02012-08-07 08:11:26 +000019using clang::analyze_format_string::ArgType;
Ted Kremenek02087932010-07-16 02:11:22 +000020using clang::analyze_format_string::FormatStringHandler;
21using clang::analyze_format_string::LengthModifier;
22using clang::analyze_format_string::OptionalAmount;
Ted Kremenekf03e6d852010-07-20 20:04:27 +000023using clang::analyze_format_string::ConversionSpecifier;
Ted Kremenek02087932010-07-16 02:11:22 +000024using clang::analyze_printf::PrintfSpecifier;
Ted Kremenekd1668192010-02-27 01:41:03 +000025
Ted Kremenekc22f78d2010-01-29 03:16:21 +000026using namespace clang;
Ted Kremeneka2e77b42010-01-27 23:43:25 +000027
Ted Kremenek02087932010-07-16 02:11:22 +000028typedef clang::analyze_format_string::SpecifierResult<PrintfSpecifier>
29 PrintfSpecifierResult;
Ted Kremenekc8b188d2010-02-16 01:46:59 +000030
31//===----------------------------------------------------------------------===//
32// Methods for parsing format strings.
33//===----------------------------------------------------------------------===//
Ted Kremeneka2e77b42010-01-27 23:43:25 +000034
Ted Kremenek02087932010-07-16 02:11:22 +000035using analyze_format_string::ParseNonPositionAmount;
Ted Kremenekc8b188d2010-02-16 01:46:59 +000036
Ted Kremenek02087932010-07-16 02:11:22 +000037static bool ParsePrecision(FormatStringHandler &H, PrintfSpecifier &FS,
Ted Kremenekd1668192010-02-27 01:41:03 +000038 const char *Start, const char *&Beg, const char *E,
39 unsigned *argIndex) {
40 if (argIndex) {
41 FS.setPrecision(ParseNonPositionAmount(Beg, E, *argIndex));
Chad Rosier6fdf38b2011-08-17 23:08:45 +000042 } else {
Ted Kremenekd1668192010-02-27 01:41:03 +000043 const OptionalAmount Amt = ParsePositionAmount(H, Start, Beg, E,
Ted Kremenek02087932010-07-16 02:11:22 +000044 analyze_format_string::PrecisionPos);
Ted Kremenekd1668192010-02-27 01:41:03 +000045 if (Amt.isInvalid())
46 return true;
47 FS.setPrecision(Amt);
48 }
49 return false;
50}
51
Ted Kremenek2b417712015-07-02 05:39:16 +000052static bool ParseObjCFlags(FormatStringHandler &H, PrintfSpecifier &FS,
53 const char *FlagBeg, const char *E, bool Warn) {
54 StringRef Flag(FlagBeg, E - FlagBeg);
55 // Currently there is only one flag.
56 if (Flag == "tt") {
57 FS.setHasObjCTechnicalTerm(FlagBeg);
58 return false;
59 }
60 // Handle either the case of no flag or an invalid flag.
61 if (Warn) {
62 if (Flag == "")
63 H.HandleEmptyObjCModifierFlag(FlagBeg, E - FlagBeg);
64 else
65 H.HandleInvalidObjCModifierFlag(FlagBeg, E - FlagBeg);
66 }
67 return true;
68}
69
Ted Kremenek02087932010-07-16 02:11:22 +000070static PrintfSpecifierResult ParsePrintfSpecifier(FormatStringHandler &H,
Ted Kremenek1de17072010-02-04 20:46:58 +000071 const char *&Beg,
Ted Kremenek4a49d982010-02-26 19:18:41 +000072 const char *E,
Hans Wennborg23926bd2011-12-15 10:25:47 +000073 unsigned &argIndex,
Jordan Rose510260c2012-09-13 02:11:03 +000074 const LangOptions &LO,
Fariborz Jahanian6485fe42014-09-09 23:10:54 +000075 const TargetInfo &Target,
Dimitry Andric6b5ed342015-02-19 22:32:33 +000076 bool Warn,
77 bool isFreeBSDKPrintf) {
Ted Kremenekc8b188d2010-02-16 01:46:59 +000078
Ted Kremenekf03e6d852010-07-20 20:04:27 +000079 using namespace clang::analyze_format_string;
Ted Kremenek176f7d62010-01-29 02:13:53 +000080 using namespace clang::analyze_printf;
Ted Kremenekc8b188d2010-02-16 01:46:59 +000081
Ted Kremeneka2e77b42010-01-27 23:43:25 +000082 const char *I = Beg;
Craig Topper25542942014-05-20 04:30:07 +000083 const char *Start = nullptr;
Ted Kremeneka2e77b42010-01-27 23:43:25 +000084 UpdateOnReturn <const char*> UpdateBeg(Beg, I);
85
86 // Look for a '%' character that indicates the start of a format specifier.
Ted Kremenekb5c98ef2010-01-28 23:56:52 +000087 for ( ; I != E ; ++I) {
Ted Kremeneka2e77b42010-01-27 23:43:25 +000088 char c = *I;
Ted Kremeneka2e77b42010-01-27 23:43:25 +000089 if (c == '\0') {
90 // Detect spurious null characters, which are likely errors.
91 H.HandleNullChar(I);
92 return true;
93 }
94 if (c == '%') {
Ted Kremenekb5c98ef2010-01-28 23:56:52 +000095 Start = I++; // Record the start of the format specifier.
Ted Kremeneka2e77b42010-01-27 23:43:25 +000096 break;
97 }
98 }
Ted Kremenekc8b188d2010-02-16 01:46:59 +000099
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000100 // No format specifier found?
101 if (!Start)
102 return false;
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000103
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000104 if (I == E) {
105 // No more characters left?
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000106 if (Warn)
107 H.HandleIncompleteSpecifier(Start, E - Start);
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000108 return true;
109 }
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000110
Ted Kremenek02087932010-07-16 02:11:22 +0000111 PrintfSpecifier FS;
Ted Kremenekd1668192010-02-27 01:41:03 +0000112 if (ParseArgPosition(H, FS, Start, I, E))
113 return true;
114
115 if (I == E) {
116 // No more characters left?
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000117 if (Warn)
118 H.HandleIncompleteSpecifier(Start, E - Start);
Ted Kremenekd1668192010-02-27 01:41:03 +0000119 return true;
120 }
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000121
Mehdi Amini06d367c2016-10-24 20:39:34 +0000122 if (*I == '{') {
Akira Hatanaka189359d2018-07-10 00:50:25 +0000123 ++I;
124 unsigned char PrivacyFlags = 0;
125 StringRef MatchedStr;
Mehdi Amini06d367c2016-10-24 20:39:34 +0000126
Akira Hatanaka189359d2018-07-10 00:50:25 +0000127 do {
128 StringRef Str(I, E - I);
Akira Hatanakad572cf42018-11-06 07:05:14 +0000129 std::string Match = "^[[:space:]]*"
130 "(private|public|sensitive|mask\\.[^[:space:],}]*)"
Akira Hatanakafb1e4462018-11-06 06:26:17 +0000131 "[[:space:]]*(,|})";
Akira Hatanaka189359d2018-07-10 00:50:25 +0000132 llvm::Regex R(Match);
133 SmallVector<StringRef, 2> Matches;
134
135 if (R.match(Str, &Matches)) {
136 MatchedStr = Matches[1];
137 I += Matches[0].size();
138
Akira Hatanakae18c2d22018-07-11 22:19:14 +0000139 // Set the privacy flag if the privacy annotation in the
140 // comma-delimited segment is at least as strict as the privacy
141 // annotations in previous comma-delimited segments.
Akira Hatanakad572cf42018-11-06 07:05:14 +0000142 if (MatchedStr.startswith("mask")) {
143 StringRef MaskType = MatchedStr.substr(sizeof("mask.") - 1);
144 unsigned Size = MaskType.size();
145 if (Warn && (Size == 0 || Size > 8))
146 H.handleInvalidMaskType(MaskType);
147 FS.setMaskType(MaskType);
148 } else if (MatchedStr.equals("sensitive"))
Akira Hatanakafb1e4462018-11-06 06:26:17 +0000149 PrivacyFlags = clang::analyze_os_log::OSLogBufferItem::IsSensitive;
150 else if (PrivacyFlags !=
151 clang::analyze_os_log::OSLogBufferItem::IsSensitive &&
152 MatchedStr.equals("private"))
Akira Hatanaka189359d2018-07-10 00:50:25 +0000153 PrivacyFlags = clang::analyze_os_log::OSLogBufferItem::IsPrivate;
Akira Hatanakae18c2d22018-07-11 22:19:14 +0000154 else if (PrivacyFlags == 0 && MatchedStr.equals("public"))
Akira Hatanaka189359d2018-07-10 00:50:25 +0000155 PrivacyFlags = clang::analyze_os_log::OSLogBufferItem::IsPublic;
156 } else {
157 size_t CommaOrBracePos =
158 Str.find_if([](char c) { return c == ',' || c == '}'; });
Akira Hatanaka189359d2018-07-10 00:50:25 +0000159
160 if (CommaOrBracePos == StringRef::npos) {
161 // Neither a comma nor the closing brace was found.
162 if (Warn)
163 H.HandleIncompleteSpecifier(Start, E - Start);
164 return true;
165 }
Akira Hatanakae18c2d22018-07-11 22:19:14 +0000166
167 I += CommaOrBracePos + 1;
Akira Hatanaka189359d2018-07-10 00:50:25 +0000168 }
169 // Continue until the closing brace is found.
170 } while (*(I - 1) == ',');
171
172 // Set the privacy flag.
173 switch (PrivacyFlags) {
174 case 0:
175 break;
176 case clang::analyze_os_log::OSLogBufferItem::IsPrivate:
177 FS.setIsPrivate(MatchedStr.data());
178 break;
179 case clang::analyze_os_log::OSLogBufferItem::IsPublic:
180 FS.setIsPublic(MatchedStr.data());
181 break;
Akira Hatanakafb1e4462018-11-06 06:26:17 +0000182 case clang::analyze_os_log::OSLogBufferItem::IsSensitive:
183 FS.setIsSensitive(MatchedStr.data());
184 break;
Akira Hatanaka189359d2018-07-10 00:50:25 +0000185 default:
186 llvm_unreachable("Unexpected privacy flag value");
Mehdi Amini06d367c2016-10-24 20:39:34 +0000187 }
188 }
189
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000190 // Look for flags (if any).
191 bool hasMore = true;
192 for ( ; I != E; ++I) {
193 switch (*I) {
194 default: hasMore = false; break;
NAKAMURA Takumif9cbcc42011-01-27 07:10:08 +0000195 case '\'':
Ted Kremeneka322cae2011-01-08 05:28:38 +0000196 // FIXME: POSIX specific. Always accept?
197 FS.setHasThousandsGrouping(I);
198 break;
Tom Careb49ec692010-06-17 19:00:27 +0000199 case '-': FS.setIsLeftJustified(I); break;
200 case '+': FS.setHasPlusPrefix(I); break;
201 case ' ': FS.setHasSpacePrefix(I); break;
202 case '#': FS.setHasAlternativeForm(I); break;
203 case '0': FS.setHasLeadingZeros(I); break;
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000204 }
205 if (!hasMore)
206 break;
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000207 }
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000208
209 if (I == E) {
210 // No more characters left?
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000211 if (Warn)
212 H.HandleIncompleteSpecifier(Start, E - Start);
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000213 return true;
214 }
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000215
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000216 // Look for the field width (if any).
Ted Kremenekd1668192010-02-27 01:41:03 +0000217 if (ParseFieldWidth(H, FS, Start, I, E,
Craig Topper25542942014-05-20 04:30:07 +0000218 FS.usesPositionalArg() ? nullptr : &argIndex))
Ted Kremenekd1668192010-02-27 01:41:03 +0000219 return true;
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000220
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000221 if (I == E) {
222 // No more characters left?
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000223 if (Warn)
224 H.HandleIncompleteSpecifier(Start, E - Start);
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000225 return true;
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000226 }
227
228 // Look for the precision (if any).
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000229 if (*I == '.') {
Ted Kremenekc22f78d2010-01-29 03:16:21 +0000230 ++I;
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000231 if (I == E) {
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000232 if (Warn)
233 H.HandleIncompleteSpecifier(Start, E - Start);
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000234 return true;
235 }
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000236
Ted Kremenekd1668192010-02-27 01:41:03 +0000237 if (ParsePrecision(H, FS, Start, I, E,
Craig Topper25542942014-05-20 04:30:07 +0000238 FS.usesPositionalArg() ? nullptr : &argIndex))
Ted Kremenekd1668192010-02-27 01:41:03 +0000239 return true;
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000240
241 if (I == E) {
242 // No more characters left?
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000243 if (Warn)
244 H.HandleIncompleteSpecifier(Start, E - Start);
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000245 return true;
246 }
247 }
248
Matt Arsenault0ff50d42018-12-01 22:16:27 +0000249 if (ParseVectorModifier(H, FS, I, E, LO))
250 return true;
251
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000252 // Look for the length modifier.
Hans Wennborg23926bd2011-12-15 10:25:47 +0000253 if (ParseLengthModifier(FS, I, E, LO) && I == E) {
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000254 // No more characters left?
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000255 if (Warn)
256 H.HandleIncompleteSpecifier(Start, E - Start);
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000257 return true;
258 }
Ted Kremenek2a0cd592010-02-09 00:04:09 +0000259
Ted Kremenek2b417712015-07-02 05:39:16 +0000260 // Look for the Objective-C modifier flags, if any.
261 // We parse these here, even if they don't apply to
262 // the conversion specifier, and then emit an error
263 // later if the conversion specifier isn't '@'. This
264 // enables better recovery, and we don't know if
265 // these flags are applicable until later.
266 const char *ObjCModifierFlagsStart = nullptr,
267 *ObjCModifierFlagsEnd = nullptr;
268 if (*I == '[') {
269 ObjCModifierFlagsStart = I;
270 ++I;
271 auto flagStart = I;
272 for (;; ++I) {
273 ObjCModifierFlagsEnd = I;
274 if (I == E) {
275 if (Warn)
276 H.HandleIncompleteSpecifier(Start, E - Start);
277 return true;
278 }
279 // Did we find the closing ']'?
280 if (*I == ']') {
281 if (ParseObjCFlags(H, FS, flagStart, I, Warn))
282 return true;
283 ++I;
284 break;
285 }
286 // There are no separators defined yet for multiple
287 // Objective-C modifier flags. When those are
288 // defined, this is the place to check.
289 }
290 }
291
Ted Kremenek23a71a12010-01-29 20:29:53 +0000292 if (*I == '\0') {
Ted Kremenek2a0cd592010-02-09 00:04:09 +0000293 // Detect spurious null characters, which are likely errors.
294 H.HandleNullChar(I);
295 return true;
Ted Kremenek23a71a12010-01-29 20:29:53 +0000296 }
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000297
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000298 // Finally, look for the conversion specifier.
Ted Kremenekfee0e962010-01-28 02:46:17 +0000299 const char *conversionPosition = I++;
Ted Kremenek94af5752010-01-29 02:40:24 +0000300 ConversionSpecifier::Kind k = ConversionSpecifier::InvalidSpecifier;
Ted Kremenekfee0e962010-01-28 02:46:17 +0000301 switch (*conversionPosition) {
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000302 default:
Ted Kremenek94af5752010-01-29 02:40:24 +0000303 break;
Ted Kremenekc06ead62010-01-28 00:55:28 +0000304 // C99: 7.19.6.1 (section 8).
Ted Kremenek74a4ce72010-02-24 00:05:54 +0000305 case '%': k = ConversionSpecifier::PercentArg; break;
306 case 'A': k = ConversionSpecifier::AArg; break;
307 case 'E': k = ConversionSpecifier::EArg; break;
308 case 'F': k = ConversionSpecifier::FArg; break;
309 case 'G': k = ConversionSpecifier::GArg; break;
310 case 'X': k = ConversionSpecifier::XArg; break;
311 case 'a': k = ConversionSpecifier::aArg; break;
Ted Kremenekab0fe8a2010-07-20 20:03:49 +0000312 case 'c': k = ConversionSpecifier::cArg; break;
Ted Kremenekfee0e962010-01-28 02:46:17 +0000313 case 'd': k = ConversionSpecifier::dArg; break;
Ted Kremenek74a4ce72010-02-24 00:05:54 +0000314 case 'e': k = ConversionSpecifier::eArg; break;
315 case 'f': k = ConversionSpecifier::fArg; break;
316 case 'g': k = ConversionSpecifier::gArg; break;
Ted Kremenekfee0e962010-01-28 02:46:17 +0000317 case 'i': k = ConversionSpecifier::iArg; break;
Matt Arsenault58fc8082019-01-29 20:49:54 +0000318 case 'n':
319 // Not handled, but reserved in OpenCL.
320 if (!LO.OpenCL)
321 k = ConversionSpecifier::nArg;
322 break;
Ted Kremenekfee0e962010-01-28 02:46:17 +0000323 case 'o': k = ConversionSpecifier::oArg; break;
David Majnemer3cba4952013-08-21 21:54:46 +0000324 case 'p': k = ConversionSpecifier::pArg; break;
325 case 's': k = ConversionSpecifier::sArg; break;
Ted Kremenekfee0e962010-01-28 02:46:17 +0000326 case 'u': k = ConversionSpecifier::uArg; break;
327 case 'x': k = ConversionSpecifier::xArg; break;
Ted Kremeneka322cae2011-01-08 05:28:38 +0000328 // POSIX specific.
Ted Kremenek74a4ce72010-02-24 00:05:54 +0000329 case 'C': k = ConversionSpecifier::CArg; break;
Ted Kremenek348d1492010-07-20 20:04:15 +0000330 case 'S': k = ConversionSpecifier::SArg; break;
Mehdi Amini06d367c2016-10-24 20:39:34 +0000331 // Apple extension for os_log
332 case 'P':
333 k = ConversionSpecifier::PArg;
334 break;
Ted Kremenekc06ead62010-01-28 00:55:28 +0000335 // Objective-C.
Ted Kremenek23a71a12010-01-29 20:29:53 +0000336 case '@': k = ConversionSpecifier::ObjCObjArg; break;
Ted Kremenek2a0cd592010-02-09 00:04:09 +0000337 // Glibc specific.
Ted Kremenek23a71a12010-01-29 20:29:53 +0000338 case 'm': k = ConversionSpecifier::PrintErrno; break;
Dimitry Andric6b5ed342015-02-19 22:32:33 +0000339 // FreeBSD kernel specific.
340 case 'b':
341 if (isFreeBSDKPrintf)
342 k = ConversionSpecifier::FreeBSDbArg; // int followed by char *
343 break;
344 case 'r':
345 if (isFreeBSDKPrintf)
346 k = ConversionSpecifier::FreeBSDrArg; // int
347 break;
348 case 'y':
349 if (isFreeBSDKPrintf)
350 k = ConversionSpecifier::FreeBSDyArg; // int
351 break;
Hans Wennborgc597b4c2014-09-07 03:03:51 +0000352 // Apple-specific.
Jordan Rose510260c2012-09-13 02:11:03 +0000353 case 'D':
Dimitry Andric6b5ed342015-02-19 22:32:33 +0000354 if (isFreeBSDKPrintf)
355 k = ConversionSpecifier::FreeBSDDArg; // void * followed by char *
356 else if (Target.getTriple().isOSDarwin())
Jordan Rose510260c2012-09-13 02:11:03 +0000357 k = ConversionSpecifier::DArg;
358 break;
359 case 'O':
360 if (Target.getTriple().isOSDarwin())
361 k = ConversionSpecifier::OArg;
362 break;
363 case 'U':
364 if (Target.getTriple().isOSDarwin())
365 k = ConversionSpecifier::UArg;
366 break;
Hans Wennborgc597b4c2014-09-07 03:03:51 +0000367 // MS specific.
368 case 'Z':
369 if (Target.getTriple().isOSMSVCRT())
370 k = ConversionSpecifier::ZArg;
Matt Arsenaulte19dc612018-11-13 22:30:35 +0000371 break;
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000372 }
Fangrui Song6907ce22018-07-30 19:24:48 +0000373
Ted Kremenek2b417712015-07-02 05:39:16 +0000374 // Check to see if we used the Objective-C modifier flags with
375 // a conversion specifier other than '@'.
376 if (k != ConversionSpecifier::ObjCObjArg &&
377 k != ConversionSpecifier::InvalidSpecifier &&
378 ObjCModifierFlagsStart) {
379 H.HandleObjCFlagsWithNonObjCConversion(ObjCModifierFlagsStart,
380 ObjCModifierFlagsEnd + 1,
381 conversionPosition);
382 return true;
383 }
Mehdi Amini06d367c2016-10-24 20:39:34 +0000384
Ted Kremenekf03e6d852010-07-20 20:04:27 +0000385 PrintfConversionSpecifier CS(conversionPosition, k);
Ted Kremenek4a49d982010-02-26 19:18:41 +0000386 FS.setConversionSpecifier(CS);
Ted Kremenekd1668192010-02-27 01:41:03 +0000387 if (CS.consumesDataArgument() && !FS.usesPositionalArg())
Ted Kremenek4a49d982010-02-26 19:18:41 +0000388 FS.setArgIndex(argIndex++);
Dimitry Andric6b5ed342015-02-19 22:32:33 +0000389 // FreeBSD kernel specific.
390 if (k == ConversionSpecifier::FreeBSDbArg ||
391 k == ConversionSpecifier::FreeBSDDArg)
392 argIndex++;
Ted Kremenek94af5752010-01-29 02:40:24 +0000393
394 if (k == ConversionSpecifier::InvalidSpecifier) {
Bruno Cardoso Lopes0c18d032016-03-29 17:35:02 +0000395 unsigned Len = I - Start;
396 if (ParseUTF8InvalidSpecifier(Start, E, Len)) {
397 CS.setEndScanList(Start + Len);
398 FS.setConversionSpecifier(CS);
399 }
Ted Kremenek4a49d982010-02-26 19:18:41 +0000400 // Assume the conversion takes one argument.
Bruno Cardoso Lopes0c18d032016-03-29 17:35:02 +0000401 return !H.HandleInvalidPrintfConversionSpecifier(FS, Start, Len);
Ted Kremenek94af5752010-01-29 02:40:24 +0000402 }
Ted Kremenek02087932010-07-16 02:11:22 +0000403 return PrintfSpecifierResult(Start, FS);
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000404}
405
Ted Kremenek02087932010-07-16 02:11:22 +0000406bool clang::analyze_format_string::ParsePrintfString(FormatStringHandler &H,
407 const char *I,
Hans Wennborg23926bd2011-12-15 10:25:47 +0000408 const char *E,
Jordan Rose510260c2012-09-13 02:11:03 +0000409 const LangOptions &LO,
Dimitry Andric6b5ed342015-02-19 22:32:33 +0000410 const TargetInfo &Target,
411 bool isFreeBSDKPrintf) {
Ted Kremenek4a49d982010-02-26 19:18:41 +0000412
413 unsigned argIndex = 0;
414
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000415 // Keep looking for a format specifier until we have exhausted the string.
416 while (I != E) {
Hans Wennborg23926bd2011-12-15 10:25:47 +0000417 const PrintfSpecifierResult &FSR = ParsePrintfSpecifier(H, I, E, argIndex,
Dimitry Andric6b5ed342015-02-19 22:32:33 +0000418 LO, Target, true,
419 isFreeBSDKPrintf);
Ted Kremenek94af5752010-01-29 02:40:24 +0000420 // Did a fail-stop error of any kind occur when parsing the specifier?
421 // If so, don't do any more processing.
422 if (FSR.shouldStop())
Dmitri Gribenko76bb5cabfa2012-09-10 21:20:09 +0000423 return true;
Ted Kremenek94af5752010-01-29 02:40:24 +0000424 // Did we exhaust the string or encounter an error that
425 // we can recover from?
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000426 if (!FSR.hasValue())
Ted Kremenek94af5752010-01-29 02:40:24 +0000427 continue;
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000428 // We have a format specifier. Pass it to the callback.
Ted Kremenek02087932010-07-16 02:11:22 +0000429 if (!H.HandlePrintfSpecifier(FSR.getValue(), FSR.getStart(),
Ted Kremenekfee0e962010-01-28 02:46:17 +0000430 I - FSR.getStart()))
Ted Kremenek23a71a12010-01-29 20:29:53 +0000431 return true;
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000432 }
433 assert(I == E && "Format string not exhausted");
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000434 return false;
435}
Ted Kremeneka2e77b42010-01-27 23:43:25 +0000436
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000437bool clang::analyze_format_string::ParseFormatStringHasSArg(const char *I,
438 const char *E,
439 const LangOptions &LO,
440 const TargetInfo &Target) {
Fangrui Song6907ce22018-07-30 19:24:48 +0000441
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000442 unsigned argIndex = 0;
Fangrui Song6907ce22018-07-30 19:24:48 +0000443
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000444 // Keep looking for a %s format specifier until we have exhausted the string.
445 FormatStringHandler H;
446 while (I != E) {
447 const PrintfSpecifierResult &FSR = ParsePrintfSpecifier(H, I, E, argIndex,
Dimitry Andric6b5ed342015-02-19 22:32:33 +0000448 LO, Target, false,
449 false);
Fariborz Jahanian6485fe42014-09-09 23:10:54 +0000450 // Did a fail-stop error of any kind occur when parsing the specifier?
451 // If so, don't do any more processing.
452 if (FSR.shouldStop())
453 return false;
454 // Did we exhaust the string or encounter an error that
455 // we can recover from?
456 if (!FSR.hasValue())
457 continue;
458 const analyze_printf::PrintfSpecifier &FS = FSR.getValue();
459 // Return true if this a %s format specifier.
460 if (FS.getConversionSpecifier().getKind() == ConversionSpecifier::Kind::sArg)
461 return true;
462 }
463 return false;
464}
465
Erik Pilkingtonaa385562019-08-14 16:57:11 +0000466bool clang::analyze_format_string::parseFormatStringHasFormattingSpecifiers(
467 const char *Begin, const char *End, const LangOptions &LO,
468 const TargetInfo &Target) {
469 unsigned ArgIndex = 0;
470 // Keep looking for a formatting specifier until we have exhausted the string.
471 FormatStringHandler H;
472 while (Begin != End) {
473 const PrintfSpecifierResult &FSR =
474 ParsePrintfSpecifier(H, Begin, End, ArgIndex, LO, Target, false, false);
475 if (FSR.shouldStop())
476 break;
477 if (FSR.hasValue())
478 return true;
479 }
480 return false;
481}
482
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000483//===----------------------------------------------------------------------===//
Ted Kremenek02087932010-07-16 02:11:22 +0000484// Methods on PrintfSpecifier.
Tom Careb7042702010-06-09 04:11:11 +0000485//===----------------------------------------------------------------------===//
486
Matt Arsenault0ff50d42018-12-01 22:16:27 +0000487ArgType PrintfSpecifier::getScalarArgType(ASTContext &Ctx,
488 bool IsObjCLiteral) const {
Ted Kremenek5f0c0662010-08-24 22:24:51 +0000489 if (CS.getKind() == ConversionSpecifier::cArg)
490 switch (LM.getKind()) {
Hans Wennborg1b231582014-09-04 21:39:52 +0000491 case LengthModifier::None:
492 return Ctx.IntTy;
Hans Wennborga5b1aa92011-12-09 12:22:12 +0000493 case LengthModifier::AsLong:
Hans Wennborg68f42b92014-09-04 21:39:46 +0000494 case LengthModifier::AsWide:
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000495 return ArgType(ArgType::WIntTy, "wint_t");
Hans Wennborg1b231582014-09-04 21:39:52 +0000496 case LengthModifier::AsShort:
497 if (Ctx.getTargetInfo().getTriple().isOSMSVCRT())
498 return Ctx.IntTy;
Galina Kistanovade7e2212017-06-03 06:23:51 +0000499 LLVM_FALLTHROUGH;
Ted Kremenek5f0c0662010-08-24 22:24:51 +0000500 default:
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000501 return ArgType::Invalid();
Ted Kremenek5f0c0662010-08-24 22:24:51 +0000502 }
NAKAMURA Takumif9cbcc42011-01-27 07:10:08 +0000503
Ted Kremenek79db7b72010-01-29 22:59:32 +0000504 if (CS.isIntArg())
Tom Careb7042702010-06-09 04:11:11 +0000505 switch (LM.getKind()) {
506 case LengthModifier::AsLongDouble:
Ted Kremenek6fa57272012-01-24 21:29:54 +0000507 // GNU extension.
508 return Ctx.LongLongTy;
David Majnemer3cba4952013-08-21 21:54:46 +0000509 case LengthModifier::None:
Matt Arsenault58fc8082019-01-29 20:49:54 +0000510 case LengthModifier::AsShortLong:
David Majnemer3cba4952013-08-21 21:54:46 +0000511 return Ctx.IntTy;
512 case LengthModifier::AsInt32:
513 return ArgType(Ctx.IntTy, "__int32");
Matt Arsenault58fc8082019-01-29 20:49:54 +0000514 case LengthModifier::AsChar:
515 return ArgType::AnyCharTy;
Tom Careb7042702010-06-09 04:11:11 +0000516 case LengthModifier::AsShort: return Ctx.ShortTy;
517 case LengthModifier::AsLong: return Ctx.LongTy;
Hans Wennborg9bc9bcc2012-02-16 16:34:54 +0000518 case LengthModifier::AsLongLong:
519 case LengthModifier::AsQuad:
520 return Ctx.LongLongTy;
David Majnemer3cba4952013-08-21 21:54:46 +0000521 case LengthModifier::AsInt64:
522 return ArgType(Ctx.LongLongTy, "__int64");
Hans Wennborg772e9272011-12-07 10:33:11 +0000523 case LengthModifier::AsIntMax:
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000524 return ArgType(Ctx.getIntMaxType(), "intmax_t");
Hans Wennborg27541db2011-10-27 08:29:09 +0000525 case LengthModifier::AsSizeT:
JF Bastienec7d7f32018-06-22 21:54:40 +0000526 return ArgType::makeSizeT(ArgType(Ctx.getSignedSizeType(), "ssize_t"));
David Majnemer3cba4952013-08-21 21:54:46 +0000527 case LengthModifier::AsInt3264:
David Majnemera39da8e2013-08-22 07:53:21 +0000528 return Ctx.getTargetInfo().getTriple().isArch64Bit()
529 ? ArgType(Ctx.LongLongTy, "__int64")
530 : ArgType(Ctx.IntTy, "__int32");
Hans Wennborg772e9272011-12-07 10:33:11 +0000531 case LengthModifier::AsPtrDiff:
Alex Lorenzb2043ac2018-07-05 22:51:11 +0000532 return ArgType::makePtrdiffT(
533 ArgType(Ctx.getPointerDiffType(), "ptrdiff_t"));
Hans Wennborg23926bd2011-12-15 10:25:47 +0000534 case LengthModifier::AsAllocate:
Hans Wennborg6073e312012-01-12 17:11:12 +0000535 case LengthModifier::AsMAllocate:
Hans Wennborg68f42b92014-09-04 21:39:46 +0000536 case LengthModifier::AsWide:
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000537 return ArgType::Invalid();
Ted Kremenek79db7b72010-01-29 22:59:32 +0000538 }
539
540 if (CS.isUIntArg())
Tom Careb7042702010-06-09 04:11:11 +0000541 switch (LM.getKind()) {
542 case LengthModifier::AsLongDouble:
Ted Kremenek6fa57272012-01-24 21:29:54 +0000543 // GNU extension.
544 return Ctx.UnsignedLongLongTy;
David Majnemer3cba4952013-08-21 21:54:46 +0000545 case LengthModifier::None:
Matt Arsenault58fc8082019-01-29 20:49:54 +0000546 case LengthModifier::AsShortLong:
David Majnemer3cba4952013-08-21 21:54:46 +0000547 return Ctx.UnsignedIntTy;
548 case LengthModifier::AsInt32:
549 return ArgType(Ctx.UnsignedIntTy, "unsigned __int32");
Tom Careb7042702010-06-09 04:11:11 +0000550 case LengthModifier::AsChar: return Ctx.UnsignedCharTy;
551 case LengthModifier::AsShort: return Ctx.UnsignedShortTy;
552 case LengthModifier::AsLong: return Ctx.UnsignedLongTy;
Hans Wennborg9bc9bcc2012-02-16 16:34:54 +0000553 case LengthModifier::AsLongLong:
554 case LengthModifier::AsQuad:
555 return Ctx.UnsignedLongLongTy;
David Majnemer3cba4952013-08-21 21:54:46 +0000556 case LengthModifier::AsInt64:
557 return ArgType(Ctx.UnsignedLongLongTy, "unsigned __int64");
Hans Wennborg772e9272011-12-07 10:33:11 +0000558 case LengthModifier::AsIntMax:
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000559 return ArgType(Ctx.getUIntMaxType(), "uintmax_t");
Tom Careb7042702010-06-09 04:11:11 +0000560 case LengthModifier::AsSizeT:
JF Bastienec7d7f32018-06-22 21:54:40 +0000561 return ArgType::makeSizeT(ArgType(Ctx.getSizeType(), "size_t"));
David Majnemer3cba4952013-08-21 21:54:46 +0000562 case LengthModifier::AsInt3264:
563 return Ctx.getTargetInfo().getTriple().isArch64Bit()
David Majnemera39da8e2013-08-22 07:53:21 +0000564 ? ArgType(Ctx.UnsignedLongLongTy, "unsigned __int64")
565 : ArgType(Ctx.UnsignedIntTy, "unsigned __int32");
Tom Careb7042702010-06-09 04:11:11 +0000566 case LengthModifier::AsPtrDiff:
Alex Lorenzb2043ac2018-07-05 22:51:11 +0000567 return ArgType::makePtrdiffT(
568 ArgType(Ctx.getUnsignedPointerDiffType(), "unsigned ptrdiff_t"));
Hans Wennborg23926bd2011-12-15 10:25:47 +0000569 case LengthModifier::AsAllocate:
Hans Wennborg6073e312012-01-12 17:11:12 +0000570 case LengthModifier::AsMAllocate:
Hans Wennborg68f42b92014-09-04 21:39:46 +0000571 case LengthModifier::AsWide:
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000572 return ArgType::Invalid();
Ted Kremenek79db7b72010-01-29 22:59:32 +0000573 }
Ted Kremenekc8b188d2010-02-16 01:46:59 +0000574
Ted Kremenek016b6052010-02-01 23:23:50 +0000575 if (CS.isDoubleArg()) {
Matt Arsenault58fc8082019-01-29 20:49:54 +0000576 if (!VectorNumElts.isInvalid()) {
577 switch (LM.getKind()) {
578 case LengthModifier::AsShort:
579 return Ctx.HalfTy;
580 case LengthModifier::AsShortLong:
581 return Ctx.FloatTy;
582 case LengthModifier::AsLong:
583 default:
584 return Ctx.DoubleTy;
585 }
586 }
587
Tom Careb7042702010-06-09 04:11:11 +0000588 if (LM.getKind() == LengthModifier::AsLongDouble)
Ted Kremenek016b6052010-02-01 23:23:50 +0000589 return Ctx.LongDoubleTy;
Ted Kremenek9ff02052010-01-30 01:02:18 +0000590 return Ctx.DoubleTy;
Ted Kremenek016b6052010-02-01 23:23:50 +0000591 }
Ted Kremenek4a49d982010-02-26 19:18:41 +0000592
Hans Wennborgabc1e222012-08-07 09:13:19 +0000593 if (CS.getKind() == ConversionSpecifier::nArg) {
594 switch (LM.getKind()) {
595 case LengthModifier::None:
596 return ArgType::PtrTo(Ctx.IntTy);
597 case LengthModifier::AsChar:
598 return ArgType::PtrTo(Ctx.SignedCharTy);
599 case LengthModifier::AsShort:
600 return ArgType::PtrTo(Ctx.ShortTy);
601 case LengthModifier::AsLong:
602 return ArgType::PtrTo(Ctx.LongTy);
603 case LengthModifier::AsLongLong:
604 case LengthModifier::AsQuad:
605 return ArgType::PtrTo(Ctx.LongLongTy);
606 case LengthModifier::AsIntMax:
607 return ArgType::PtrTo(ArgType(Ctx.getIntMaxType(), "intmax_t"));
608 case LengthModifier::AsSizeT:
Alexander Shaposhnikov441c1d92017-07-14 22:57:00 +0000609 return ArgType::PtrTo(ArgType(Ctx.getSignedSizeType(), "ssize_t"));
Hans Wennborgabc1e222012-08-07 09:13:19 +0000610 case LengthModifier::AsPtrDiff:
611 return ArgType::PtrTo(ArgType(Ctx.getPointerDiffType(), "ptrdiff_t"));
612 case LengthModifier::AsLongDouble:
613 return ArgType(); // FIXME: Is this a known extension?
614 case LengthModifier::AsAllocate:
615 case LengthModifier::AsMAllocate:
David Majnemer3cba4952013-08-21 21:54:46 +0000616 case LengthModifier::AsInt32:
617 case LengthModifier::AsInt3264:
618 case LengthModifier::AsInt64:
Hans Wennborg68f42b92014-09-04 21:39:46 +0000619 case LengthModifier::AsWide:
Hans Wennborgabc1e222012-08-07 09:13:19 +0000620 return ArgType::Invalid();
Matt Arsenault58fc8082019-01-29 20:49:54 +0000621 case LengthModifier::AsShortLong:
622 llvm_unreachable("only used for OpenCL which doesn not handle nArg");
Hans Wennborgabc1e222012-08-07 09:13:19 +0000623 }
624 }
625
Ted Kremenek74a4ce72010-02-24 00:05:54 +0000626 switch (CS.getKind()) {
Hans Wennborg0c353262011-12-09 15:57:33 +0000627 case ConversionSpecifier::sArg:
Nico Weber496cdc22012-01-31 01:43:25 +0000628 if (LM.getKind() == LengthModifier::AsWideChar) {
629 if (IsObjCLiteral)
Jordan Rose0e5badd2012-12-05 18:44:49 +0000630 return ArgType(Ctx.getPointerType(Ctx.UnsignedShortTy.withConst()),
631 "const unichar *");
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000632 return ArgType(ArgType::WCStrTy, "wchar_t *");
Nico Weber496cdc22012-01-31 01:43:25 +0000633 }
Hans Wennborg68f42b92014-09-04 21:39:46 +0000634 if (LM.getKind() == LengthModifier::AsWide)
635 return ArgType(ArgType::WCStrTy, "wchar_t *");
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000636 return ArgType::CStrTy;
Ted Kremenek348d1492010-07-20 20:04:15 +0000637 case ConversionSpecifier::SArg:
Nico Weber496cdc22012-01-31 01:43:25 +0000638 if (IsObjCLiteral)
Jordan Rose0e5badd2012-12-05 18:44:49 +0000639 return ArgType(Ctx.getPointerType(Ctx.UnsignedShortTy.withConst()),
640 "const unichar *");
Hans Wennborg1b231582014-09-04 21:39:52 +0000641 if (Ctx.getTargetInfo().getTriple().isOSMSVCRT() &&
642 LM.getKind() == LengthModifier::AsShort)
643 return ArgType::CStrTy;
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000644 return ArgType(ArgType::WCStrTy, "wchar_t *");
Ted Kremenek74a4ce72010-02-24 00:05:54 +0000645 case ConversionSpecifier::CArg:
Nico Weber496cdc22012-01-31 01:43:25 +0000646 if (IsObjCLiteral)
Jordan Rose0e5badd2012-12-05 18:44:49 +0000647 return ArgType(Ctx.UnsignedShortTy, "unichar");
Hans Wennborg1b231582014-09-04 21:39:52 +0000648 if (Ctx.getTargetInfo().getTriple().isOSMSVCRT() &&
649 LM.getKind() == LengthModifier::AsShort)
650 return Ctx.IntTy;
Hans Wennborg0d81e012013-05-10 10:08:40 +0000651 return ArgType(Ctx.WideCharTy, "wchar_t");
Ted Kremenek1ce32be2010-07-20 20:04:04 +0000652 case ConversionSpecifier::pArg:
Mehdi Amini06d367c2016-10-24 20:39:34 +0000653 case ConversionSpecifier::PArg:
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000654 return ArgType::CPointerTy;
Ted Kremenek9b1f3d42012-01-25 00:04:09 +0000655 case ConversionSpecifier::ObjCObjArg:
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000656 return ArgType::ObjCPointerTy;
Ted Kremenek74a4ce72010-02-24 00:05:54 +0000657 default:
658 break;
659 }
Ted Kremenek4a49d982010-02-26 19:18:41 +0000660
Ted Kremenek79db7b72010-01-29 22:59:32 +0000661 // FIXME: Handle other cases.
Hans Wennborgc3b3da02012-08-07 08:11:26 +0000662 return ArgType();
Ted Kremenek79db7b72010-01-29 22:59:32 +0000663}
664
Matt Arsenault0ff50d42018-12-01 22:16:27 +0000665
666ArgType PrintfSpecifier::getArgType(ASTContext &Ctx,
667 bool IsObjCLiteral) const {
668 const PrintfConversionSpecifier &CS = getConversionSpecifier();
669
670 if (!CS.consumesDataArgument())
671 return ArgType::Invalid();
672
673 ArgType ScalarTy = getScalarArgType(Ctx, IsObjCLiteral);
674 if (!ScalarTy.isValid() || VectorNumElts.isInvalid())
675 return ScalarTy;
676
677 return ScalarTy.makeVectorType(Ctx, VectorNumElts.getConstantAmount());
678}
679
Hans Wennborgd99d6882012-02-15 09:59:46 +0000680bool PrintfSpecifier::fixType(QualType QT, const LangOptions &LangOpt,
681 ASTContext &Ctx, bool IsObjCLiteral) {
Hans Wennborgebcd1c72012-07-30 17:11:32 +0000682 // %n is different from other conversion specifiers; don't try to fix it.
683 if (CS.getKind() == ConversionSpecifier::nArg)
684 return false;
685
Jordan Rose68f6d3b2012-05-30 21:53:13 +0000686 // Handle Objective-C objects first. Note that while the '%@' specifier will
687 // not warn for structure pointer or void pointer arguments (because that's
688 // how CoreFoundation objects are implemented), we only show a fixit for '%@'
689 // if we know it's an object (block, id, class, or __attribute__((NSObject))).
690 if (QT->isObjCRetainableType()) {
691 if (!IsObjCLiteral)
692 return false;
693
694 CS.setKind(ConversionSpecifier::ObjCObjArg);
695
696 // Disable irrelevant flags
697 HasThousandsGrouping = false;
698 HasPlusPrefix = false;
699 HasSpacePrefix = false;
700 HasAlternativeForm = false;
701 HasLeadingZeroes = false;
702 Precision.setHowSpecified(OptionalAmount::NotSpecified);
703 LM.setKind(LengthModifier::None);
704
705 return true;
706 }
707
708 // Handle strings next (char *, wchar_t *)
Tom Careb7042702010-06-09 04:11:11 +0000709 if (QT->isPointerType() && (QT->getPointeeType()->isAnyCharacterType())) {
Ted Kremenek563e3ed2010-07-20 20:03:58 +0000710 CS.setKind(ConversionSpecifier::sArg);
Tom Careb7042702010-06-09 04:11:11 +0000711
Tom Care00554632010-06-11 04:22:02 +0000712 // Disable irrelevant flags
713 HasAlternativeForm = 0;
714 HasLeadingZeroes = 0;
715
Tom Careb7042702010-06-09 04:11:11 +0000716 // Set the long length modifier for wide characters
717 if (QT->getPointeeType()->isWideCharType())
718 LM.setKind(LengthModifier::AsWideChar);
Hans Wennborg2027de32011-12-09 10:51:29 +0000719 else
720 LM.setKind(LengthModifier::None);
Tom Careb7042702010-06-09 04:11:11 +0000721
722 return true;
723 }
724
Jordan Rose614e72b2012-06-04 22:49:02 +0000725 // If it's an enum, get its underlying type.
726 if (const EnumType *ETy = QT->getAs<EnumType>())
727 QT = ETy->getDecl()->getIntegerType();
728
Tom Careb7042702010-06-09 04:11:11 +0000729 const BuiltinType *BT = QT->getAs<BuiltinType>();
Matt Arsenault0ff50d42018-12-01 22:16:27 +0000730 if (!BT) {
731 const VectorType *VT = QT->getAs<VectorType>();
732 if (VT) {
733 QT = VT->getElementType();
734 BT = QT->getAs<BuiltinType>();
735 VectorNumElts = OptionalAmount(VT->getNumElements());
736 }
737 }
738
739 // We can only work with builtin types.
John McCall59207972011-10-18 22:28:37 +0000740 if (!BT)
741 return false;
Tom Care00554632010-06-11 04:22:02 +0000742
Tom Careb7042702010-06-09 04:11:11 +0000743 // Set length modifier
744 switch (BT->getKind()) {
Eli Friedman7ec652a2011-04-27 22:06:20 +0000745 case BuiltinType::Bool:
746 case BuiltinType::WChar_U:
747 case BuiltinType::WChar_S:
Richard Smith3a8244d2018-05-01 05:02:45 +0000748 case BuiltinType::Char8: // FIXME: Treat like 'char'?
Eli Friedman7ec652a2011-04-27 22:06:20 +0000749 case BuiltinType::Char16:
750 case BuiltinType::Char32:
751 case BuiltinType::UInt128:
752 case BuiltinType::Int128:
Anton Korobeynikovf0c267e2011-10-14 23:23:15 +0000753 case BuiltinType::Half:
Sjoerd Meijercc623ad2017-09-08 15:15:00 +0000754 case BuiltinType::Float16:
Nemanja Ivanovicbb1ea2d2016-05-09 08:52:33 +0000755 case BuiltinType::Float128:
Leonard Chanf921d852018-06-04 16:07:52 +0000756 case BuiltinType::ShortAccum:
757 case BuiltinType::Accum:
758 case BuiltinType::LongAccum:
759 case BuiltinType::UShortAccum:
760 case BuiltinType::UAccum:
761 case BuiltinType::ULongAccum:
Leonard Chanab80f3c2018-06-14 14:53:51 +0000762 case BuiltinType::ShortFract:
763 case BuiltinType::Fract:
764 case BuiltinType::LongFract:
765 case BuiltinType::UShortFract:
766 case BuiltinType::UFract:
767 case BuiltinType::ULongFract:
768 case BuiltinType::SatShortAccum:
769 case BuiltinType::SatAccum:
770 case BuiltinType::SatLongAccum:
771 case BuiltinType::SatUShortAccum:
772 case BuiltinType::SatUAccum:
773 case BuiltinType::SatULongAccum:
774 case BuiltinType::SatShortFract:
775 case BuiltinType::SatFract:
776 case BuiltinType::SatLongFract:
777 case BuiltinType::SatUShortFract:
778 case BuiltinType::SatUFract:
779 case BuiltinType::SatULongFract:
John McCall59207972011-10-18 22:28:37 +0000780 // Various types which are non-trivial to correct.
Eli Friedman7ec652a2011-04-27 22:06:20 +0000781 return false;
782
Alexey Bader954ba212016-04-08 13:40:33 +0000783#define IMAGE_TYPE(ImgType, Id, SingletonId, Access, Suffix) \
784 case BuiltinType::Id:
Alexey Baderb62f1442016-04-13 08:33:41 +0000785#include "clang/Basic/OpenCLImageTypes.def"
Andrew Savonichev3fee3512018-11-08 11:25:41 +0000786#define EXT_OPAQUE_TYPE(ExtType, Id, Ext) \
787 case BuiltinType::Id:
788#include "clang/Basic/OpenCLExtensionTypes.def"
Richard Sandifordeb485fb2019-08-09 08:52:54 +0000789#define SVE_TYPE(Name, Id, SingletonId) \
790 case BuiltinType::Id:
791#include "clang/Basic/AArch64SVEACLETypes.def"
John McCall59207972011-10-18 22:28:37 +0000792#define SIGNED_TYPE(Id, SingletonId)
793#define UNSIGNED_TYPE(Id, SingletonId)
794#define FLOATING_TYPE(Id, SingletonId)
795#define BUILTIN_TYPE(Id, SingletonId) \
796 case BuiltinType::Id:
797#include "clang/AST/BuiltinTypes.def"
Eli Friedman7ec652a2011-04-27 22:06:20 +0000798 // Misc other stuff which doesn't make sense here.
799 return false;
800
801 case BuiltinType::UInt:
802 case BuiltinType::Int:
803 case BuiltinType::Float:
Matt Arsenault58fc8082019-01-29 20:49:54 +0000804 LM.setKind(VectorNumElts.isInvalid() ?
805 LengthModifier::None : LengthModifier::AsShortLong);
Tom Careb7042702010-06-09 04:11:11 +0000806 break;
Matt Arsenault58fc8082019-01-29 20:49:54 +0000807 case BuiltinType::Double:
808 LM.setKind(VectorNumElts.isInvalid() ?
809 LengthModifier::None : LengthModifier::AsLong);
810 break;
Ted Kremenek12a37de2010-10-21 04:00:58 +0000811 case BuiltinType::Char_U:
812 case BuiltinType::UChar:
813 case BuiltinType::Char_S:
814 case BuiltinType::SChar:
815 LM.setKind(LengthModifier::AsChar);
816 break;
817
818 case BuiltinType::Short:
819 case BuiltinType::UShort:
820 LM.setKind(LengthModifier::AsShort);
821 break;
822
Tom Careb7042702010-06-09 04:11:11 +0000823 case BuiltinType::Long:
824 case BuiltinType::ULong:
825 LM.setKind(LengthModifier::AsLong);
826 break;
827
828 case BuiltinType::LongLong:
829 case BuiltinType::ULongLong:
830 LM.setKind(LengthModifier::AsLongLong);
831 break;
832
833 case BuiltinType::LongDouble:
834 LM.setKind(LengthModifier::AsLongDouble);
835 break;
836 }
837
Hans Wennborgf99d04f2011-10-18 08:10:06 +0000838 // Handle size_t, ptrdiff_t, etc. that have dedicated length modifiers in C99.
Richard Smith2bf7fdb2013-01-02 11:42:31 +0000839 if (isa<TypedefType>(QT) && (LangOpt.C99 || LangOpt.CPlusPlus11))
Hans Wennborg08574d32012-07-27 19:17:46 +0000840 namedTypeToLengthModifier(QT, LM);
Hans Wennborgf99d04f2011-10-18 08:10:06 +0000841
Jordan Roseaa7a3b32013-01-17 18:47:16 +0000842 // If fixing the length modifier was enough, we might be done.
Matt Arsenault58fc8082019-01-29 20:49:54 +0000843 if (hasValidLengthModifier(Ctx.getTargetInfo(), LangOpt)) {
Jordan Roseaa7a3b32013-01-17 18:47:16 +0000844 // If we're going to offer a fix anyway, make sure the sign matches.
845 switch (CS.getKind()) {
846 case ConversionSpecifier::uArg:
847 case ConversionSpecifier::UArg:
848 if (QT->isSignedIntegerType())
849 CS.setKind(clang::analyze_format_string::ConversionSpecifier::dArg);
850 break;
851 case ConversionSpecifier::dArg:
852 case ConversionSpecifier::DArg:
853 case ConversionSpecifier::iArg:
Jordan Rose1eb34292013-01-17 22:34:10 +0000854 if (QT->isUnsignedIntegerType() && !HasPlusPrefix)
Jordan Roseaa7a3b32013-01-17 18:47:16 +0000855 CS.setKind(clang::analyze_format_string::ConversionSpecifier::uArg);
856 break;
857 default:
858 // Other specifiers do not have signed/unsigned variants.
859 break;
860 }
861
Jordan Rose92303592012-09-08 04:00:03 +0000862 const analyze_printf::ArgType &ATR = getArgType(Ctx, IsObjCLiteral);
863 if (ATR.isValid() && ATR.matchesType(Ctx, QT))
864 return true;
865 }
Hans Wennborgd99d6882012-02-15 09:59:46 +0000866
Tom Careb7042702010-06-09 04:11:11 +0000867 // Set conversion specifier and disable any flags which do not apply to it.
Ted Kremenek12a37de2010-10-21 04:00:58 +0000868 // Let typedefs to char fall through to int, as %c is silly for uint8_t.
Jordan Rose6aaa87e2012-12-05 18:44:37 +0000869 if (!isa<TypedefType>(QT) && QT->isCharType()) {
Ted Kremenekab0fe8a2010-07-20 20:03:49 +0000870 CS.setKind(ConversionSpecifier::cArg);
Ted Kremenek12a37de2010-10-21 04:00:58 +0000871 LM.setKind(LengthModifier::None);
Tom Careb7042702010-06-09 04:11:11 +0000872 Precision.setHowSpecified(OptionalAmount::NotSpecified);
873 HasAlternativeForm = 0;
874 HasLeadingZeroes = 0;
Tom Careb49ec692010-06-17 19:00:27 +0000875 HasPlusPrefix = 0;
Tom Careb7042702010-06-09 04:11:11 +0000876 }
877 // Test for Floating type first as LongDouble can pass isUnsignedIntegerType
Douglas Gregor49b4d732010-06-22 23:07:26 +0000878 else if (QT->isRealFloatingType()) {
Tom Careb7042702010-06-09 04:11:11 +0000879 CS.setKind(ConversionSpecifier::fArg);
880 }
Tom Careb7042702010-06-09 04:11:11 +0000881 else if (QT->isSignedIntegerType()) {
882 CS.setKind(ConversionSpecifier::dArg);
883 HasAlternativeForm = 0;
884 }
Douglas Gregorb4e3533ce2010-06-09 05:25:34 +0000885 else if (QT->isUnsignedIntegerType()) {
Hans Wennborgd99d6882012-02-15 09:59:46 +0000886 CS.setKind(ConversionSpecifier::uArg);
Tom Careb7042702010-06-09 04:11:11 +0000887 HasAlternativeForm = 0;
Tom Careb49ec692010-06-17 19:00:27 +0000888 HasPlusPrefix = 0;
Chad Rosier6fdf38b2011-08-17 23:08:45 +0000889 } else {
David Blaikie83d382b2011-09-23 05:06:16 +0000890 llvm_unreachable("Unexpected type");
Tom Careb7042702010-06-09 04:11:11 +0000891 }
892
893 return true;
894}
895
Chris Lattner0e62c1c2011-07-23 10:55:15 +0000896void PrintfSpecifier::toString(raw_ostream &os) const {
Tom Careb7042702010-06-09 04:11:11 +0000897 // Whilst some features have no defined order, we are using the order
NAKAMURA Takumi7c288862011-01-27 07:09:49 +0000898 // appearing in the C99 standard (ISO/IEC 9899:1999 (E) 7.19.6.1)
Tom Careb7042702010-06-09 04:11:11 +0000899 os << "%";
900
901 // Positional args
902 if (usesPositionalArg()) {
903 os << getPositionalArgIndex() << "$";
904 }
905
906 // Conversion flags
907 if (IsLeftJustified) os << "-";
908 if (HasPlusPrefix) os << "+";
909 if (HasSpacePrefix) os << " ";
910 if (HasAlternativeForm) os << "#";
911 if (HasLeadingZeroes) os << "0";
912
913 // Minimum field width
914 FieldWidth.toString(os);
915 // Precision
916 Precision.toString(os);
Matt Arsenault0ff50d42018-12-01 22:16:27 +0000917
918 // Vector modifier
919 if (!VectorNumElts.isInvalid())
920 os << 'v' << VectorNumElts.getConstantAmount();
921
Tom Careb7042702010-06-09 04:11:11 +0000922 // Length modifier
923 os << LM.toString();
924 // Conversion specifier
925 os << CS.toString();
926}
Tom Careb49ec692010-06-17 19:00:27 +0000927
Ted Kremenek02087932010-07-16 02:11:22 +0000928bool PrintfSpecifier::hasValidPlusPrefix() const {
Tom Careb49ec692010-06-17 19:00:27 +0000929 if (!HasPlusPrefix)
930 return true;
931
932 // The plus prefix only makes sense for signed conversions
933 switch (CS.getKind()) {
934 case ConversionSpecifier::dArg:
Jordan Rose510260c2012-09-13 02:11:03 +0000935 case ConversionSpecifier::DArg:
Tom Careb49ec692010-06-17 19:00:27 +0000936 case ConversionSpecifier::iArg:
937 case ConversionSpecifier::fArg:
938 case ConversionSpecifier::FArg:
939 case ConversionSpecifier::eArg:
940 case ConversionSpecifier::EArg:
941 case ConversionSpecifier::gArg:
942 case ConversionSpecifier::GArg:
943 case ConversionSpecifier::aArg:
944 case ConversionSpecifier::AArg:
Dimitry Andric6b5ed342015-02-19 22:32:33 +0000945 case ConversionSpecifier::FreeBSDrArg:
946 case ConversionSpecifier::FreeBSDyArg:
Tom Careb49ec692010-06-17 19:00:27 +0000947 return true;
948
949 default:
950 return false;
951 }
952}
953
Ted Kremenek02087932010-07-16 02:11:22 +0000954bool PrintfSpecifier::hasValidAlternativeForm() const {
Tom Careb49ec692010-06-17 19:00:27 +0000955 if (!HasAlternativeForm)
956 return true;
957
Anders Carlssona369f8d2010-11-21 18:34:21 +0000958 // Alternate form flag only valid with the oxXaAeEfFgG conversions
Tom Careb49ec692010-06-17 19:00:27 +0000959 switch (CS.getKind()) {
960 case ConversionSpecifier::oArg:
Jordan Rose510260c2012-09-13 02:11:03 +0000961 case ConversionSpecifier::OArg:
Tom Careb49ec692010-06-17 19:00:27 +0000962 case ConversionSpecifier::xArg:
Anders Carlssona369f8d2010-11-21 18:34:21 +0000963 case ConversionSpecifier::XArg:
Tom Careb49ec692010-06-17 19:00:27 +0000964 case ConversionSpecifier::aArg:
965 case ConversionSpecifier::AArg:
966 case ConversionSpecifier::eArg:
967 case ConversionSpecifier::EArg:
968 case ConversionSpecifier::fArg:
969 case ConversionSpecifier::FArg:
970 case ConversionSpecifier::gArg:
971 case ConversionSpecifier::GArg:
Dimitry Andric6b5ed342015-02-19 22:32:33 +0000972 case ConversionSpecifier::FreeBSDrArg:
973 case ConversionSpecifier::FreeBSDyArg:
Tom Careb49ec692010-06-17 19:00:27 +0000974 return true;
975
976 default:
977 return false;
978 }
979}
980
Ted Kremenek02087932010-07-16 02:11:22 +0000981bool PrintfSpecifier::hasValidLeadingZeros() const {
Tom Careb49ec692010-06-17 19:00:27 +0000982 if (!HasLeadingZeroes)
983 return true;
984
985 // Leading zeroes flag only valid with the diouxXaAeEfFgG conversions
986 switch (CS.getKind()) {
987 case ConversionSpecifier::dArg:
Jordan Rose510260c2012-09-13 02:11:03 +0000988 case ConversionSpecifier::DArg:
Tom Careb49ec692010-06-17 19:00:27 +0000989 case ConversionSpecifier::iArg:
990 case ConversionSpecifier::oArg:
Jordan Rose510260c2012-09-13 02:11:03 +0000991 case ConversionSpecifier::OArg:
Tom Careb49ec692010-06-17 19:00:27 +0000992 case ConversionSpecifier::uArg:
Jordan Rose510260c2012-09-13 02:11:03 +0000993 case ConversionSpecifier::UArg:
Tom Careb49ec692010-06-17 19:00:27 +0000994 case ConversionSpecifier::xArg:
995 case ConversionSpecifier::XArg:
996 case ConversionSpecifier::aArg:
997 case ConversionSpecifier::AArg:
998 case ConversionSpecifier::eArg:
999 case ConversionSpecifier::EArg:
1000 case ConversionSpecifier::fArg:
1001 case ConversionSpecifier::FArg:
1002 case ConversionSpecifier::gArg:
1003 case ConversionSpecifier::GArg:
Dimitry Andric6b5ed342015-02-19 22:32:33 +00001004 case ConversionSpecifier::FreeBSDrArg:
1005 case ConversionSpecifier::FreeBSDyArg:
Tom Careb49ec692010-06-17 19:00:27 +00001006 return true;
1007
1008 default:
1009 return false;
1010 }
1011}
1012
Ted Kremenek02087932010-07-16 02:11:22 +00001013bool PrintfSpecifier::hasValidSpacePrefix() const {
Tom Careb49ec692010-06-17 19:00:27 +00001014 if (!HasSpacePrefix)
1015 return true;
1016
1017 // The space prefix only makes sense for signed conversions
1018 switch (CS.getKind()) {
1019 case ConversionSpecifier::dArg:
Jordan Rose510260c2012-09-13 02:11:03 +00001020 case ConversionSpecifier::DArg:
Tom Careb49ec692010-06-17 19:00:27 +00001021 case ConversionSpecifier::iArg:
1022 case ConversionSpecifier::fArg:
1023 case ConversionSpecifier::FArg:
1024 case ConversionSpecifier::eArg:
1025 case ConversionSpecifier::EArg:
1026 case ConversionSpecifier::gArg:
1027 case ConversionSpecifier::GArg:
1028 case ConversionSpecifier::aArg:
1029 case ConversionSpecifier::AArg:
Dimitry Andric6b5ed342015-02-19 22:32:33 +00001030 case ConversionSpecifier::FreeBSDrArg:
1031 case ConversionSpecifier::FreeBSDyArg:
Tom Careb49ec692010-06-17 19:00:27 +00001032 return true;
1033
1034 default:
1035 return false;
1036 }
1037}
1038
Ted Kremenek02087932010-07-16 02:11:22 +00001039bool PrintfSpecifier::hasValidLeftJustified() const {
Tom Careb49ec692010-06-17 19:00:27 +00001040 if (!IsLeftJustified)
1041 return true;
1042
1043 // The left justified flag is valid for all conversions except n
1044 switch (CS.getKind()) {
Ted Kremenek516ef222010-07-20 20:04:10 +00001045 case ConversionSpecifier::nArg:
Tom Careb49ec692010-06-17 19:00:27 +00001046 return false;
1047
1048 default:
1049 return true;
1050 }
1051}
1052
Ted Kremenekbf4832c2011-01-08 05:28:46 +00001053bool PrintfSpecifier::hasValidThousandsGroupingPrefix() const {
1054 if (!HasThousandsGrouping)
1055 return true;
NAKAMURA Takumif9cbcc42011-01-27 07:10:08 +00001056
Ted Kremenekbf4832c2011-01-08 05:28:46 +00001057 switch (CS.getKind()) {
1058 case ConversionSpecifier::dArg:
Jordan Rose510260c2012-09-13 02:11:03 +00001059 case ConversionSpecifier::DArg:
Ted Kremenekbf4832c2011-01-08 05:28:46 +00001060 case ConversionSpecifier::iArg:
1061 case ConversionSpecifier::uArg:
Jordan Rose510260c2012-09-13 02:11:03 +00001062 case ConversionSpecifier::UArg:
Ted Kremenekbf4832c2011-01-08 05:28:46 +00001063 case ConversionSpecifier::fArg:
1064 case ConversionSpecifier::FArg:
1065 case ConversionSpecifier::gArg:
1066 case ConversionSpecifier::GArg:
1067 return true;
1068 default:
1069 return false;
1070 }
1071}
1072
Ted Kremenek02087932010-07-16 02:11:22 +00001073bool PrintfSpecifier::hasValidPrecision() const {
Tom Careb49ec692010-06-17 19:00:27 +00001074 if (Precision.getHowSpecified() == OptionalAmount::NotSpecified)
1075 return true;
1076
Mehdi Amini06d367c2016-10-24 20:39:34 +00001077 // Precision is only valid with the diouxXaAeEfFgGsP conversions
Tom Careb49ec692010-06-17 19:00:27 +00001078 switch (CS.getKind()) {
1079 case ConversionSpecifier::dArg:
Jordan Rose510260c2012-09-13 02:11:03 +00001080 case ConversionSpecifier::DArg:
Tom Careb49ec692010-06-17 19:00:27 +00001081 case ConversionSpecifier::iArg:
1082 case ConversionSpecifier::oArg:
Jordan Rose510260c2012-09-13 02:11:03 +00001083 case ConversionSpecifier::OArg:
Tom Careb49ec692010-06-17 19:00:27 +00001084 case ConversionSpecifier::uArg:
Jordan Rose510260c2012-09-13 02:11:03 +00001085 case ConversionSpecifier::UArg:
Tom Careb49ec692010-06-17 19:00:27 +00001086 case ConversionSpecifier::xArg:
1087 case ConversionSpecifier::XArg:
1088 case ConversionSpecifier::aArg:
1089 case ConversionSpecifier::AArg:
1090 case ConversionSpecifier::eArg:
1091 case ConversionSpecifier::EArg:
1092 case ConversionSpecifier::fArg:
1093 case ConversionSpecifier::FArg:
1094 case ConversionSpecifier::gArg:
1095 case ConversionSpecifier::GArg:
Ted Kremenek563e3ed2010-07-20 20:03:58 +00001096 case ConversionSpecifier::sArg:
Dimitry Andric6b5ed342015-02-19 22:32:33 +00001097 case ConversionSpecifier::FreeBSDrArg:
1098 case ConversionSpecifier::FreeBSDyArg:
Mehdi Amini06d367c2016-10-24 20:39:34 +00001099 case ConversionSpecifier::PArg:
Tom Careb49ec692010-06-17 19:00:27 +00001100 return true;
1101
1102 default:
1103 return false;
1104 }
1105}
Ted Kremenek02087932010-07-16 02:11:22 +00001106bool PrintfSpecifier::hasValidFieldWidth() const {
Tom Careb49ec692010-06-17 19:00:27 +00001107 if (FieldWidth.getHowSpecified() == OptionalAmount::NotSpecified)
1108 return true;
1109
1110 // The field width is valid for all conversions except n
1111 switch (CS.getKind()) {
Ted Kremenek516ef222010-07-20 20:04:10 +00001112 case ConversionSpecifier::nArg:
Tom Careb49ec692010-06-17 19:00:27 +00001113 return false;
1114
1115 default:
1116 return true;
1117 }
1118}