PrintfFormatString.cpp 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118
  1. //== PrintfFormatString.cpp - Analysis of printf format strings --*- C++ -*-==//
  2. //
  3. // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
  4. // See https://llvm.org/LICENSE.txt for license information.
  5. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  6. //
  7. //===----------------------------------------------------------------------===//
  8. //
  9. // Handling of format string in printf and friends. The structure of format
  10. // strings for fprintf() are described in C99 7.19.6.1.
  11. //
  12. //===----------------------------------------------------------------------===//
  13. #include "clang/AST/FormatString.h"
  14. #include "clang/AST/OSLog.h"
  15. #include "FormatStringParsing.h"
  16. #include "clang/Basic/TargetInfo.h"
  17. using clang::analyze_format_string::ArgType;
  18. using clang::analyze_format_string::FormatStringHandler;
  19. using clang::analyze_format_string::LengthModifier;
  20. using clang::analyze_format_string::OptionalAmount;
  21. using clang::analyze_format_string::ConversionSpecifier;
  22. using clang::analyze_printf::PrintfSpecifier;
  23. using namespace clang;
  24. typedef clang::analyze_format_string::SpecifierResult<PrintfSpecifier>
  25. PrintfSpecifierResult;
  26. //===----------------------------------------------------------------------===//
  27. // Methods for parsing format strings.
  28. //===----------------------------------------------------------------------===//
  29. using analyze_format_string::ParseNonPositionAmount;
  30. static bool ParsePrecision(FormatStringHandler &H, PrintfSpecifier &FS,
  31. const char *Start, const char *&Beg, const char *E,
  32. unsigned *argIndex) {
  33. if (argIndex) {
  34. FS.setPrecision(ParseNonPositionAmount(Beg, E, *argIndex));
  35. } else {
  36. const OptionalAmount Amt = ParsePositionAmount(H, Start, Beg, E,
  37. analyze_format_string::PrecisionPos);
  38. if (Amt.isInvalid())
  39. return true;
  40. FS.setPrecision(Amt);
  41. }
  42. return false;
  43. }
  44. static bool ParseObjCFlags(FormatStringHandler &H, PrintfSpecifier &FS,
  45. const char *FlagBeg, const char *E, bool Warn) {
  46. StringRef Flag(FlagBeg, E - FlagBeg);
  47. // Currently there is only one flag.
  48. if (Flag == "tt") {
  49. FS.setHasObjCTechnicalTerm(FlagBeg);
  50. return false;
  51. }
  52. // Handle either the case of no flag or an invalid flag.
  53. if (Warn) {
  54. if (Flag == "")
  55. H.HandleEmptyObjCModifierFlag(FlagBeg, E - FlagBeg);
  56. else
  57. H.HandleInvalidObjCModifierFlag(FlagBeg, E - FlagBeg);
  58. }
  59. return true;
  60. }
  61. static PrintfSpecifierResult ParsePrintfSpecifier(FormatStringHandler &H,
  62. const char *&Beg,
  63. const char *E,
  64. unsigned &argIndex,
  65. const LangOptions &LO,
  66. const TargetInfo &Target,
  67. bool Warn,
  68. bool isFreeBSDKPrintf) {
  69. using namespace clang::analyze_format_string;
  70. using namespace clang::analyze_printf;
  71. const char *I = Beg;
  72. const char *Start = nullptr;
  73. UpdateOnReturn <const char*> UpdateBeg(Beg, I);
  74. // Look for a '%' character that indicates the start of a format specifier.
  75. for ( ; I != E ; ++I) {
  76. char c = *I;
  77. if (c == '\0') {
  78. // Detect spurious null characters, which are likely errors.
  79. H.HandleNullChar(I);
  80. return true;
  81. }
  82. if (c == '%') {
  83. Start = I++; // Record the start of the format specifier.
  84. break;
  85. }
  86. }
  87. // No format specifier found?
  88. if (!Start)
  89. return false;
  90. if (I == E) {
  91. // No more characters left?
  92. if (Warn)
  93. H.HandleIncompleteSpecifier(Start, E - Start);
  94. return true;
  95. }
  96. PrintfSpecifier FS;
  97. if (ParseArgPosition(H, FS, Start, I, E))
  98. return true;
  99. if (I == E) {
  100. // No more characters left?
  101. if (Warn)
  102. H.HandleIncompleteSpecifier(Start, E - Start);
  103. return true;
  104. }
  105. if (*I == '{') {
  106. ++I;
  107. unsigned char PrivacyFlags = 0;
  108. StringRef MatchedStr;
  109. do {
  110. StringRef Str(I, E - I);
  111. std::string Match = "^[[:space:]]*"
  112. "(private|public|sensitive|mask\\.[^[:space:],}]*)"
  113. "[[:space:]]*(,|})";
  114. llvm::Regex R(Match);
  115. SmallVector<StringRef, 2> Matches;
  116. if (R.match(Str, &Matches)) {
  117. MatchedStr = Matches[1];
  118. I += Matches[0].size();
  119. // Set the privacy flag if the privacy annotation in the
  120. // comma-delimited segment is at least as strict as the privacy
  121. // annotations in previous comma-delimited segments.
  122. if (MatchedStr.startswith("mask")) {
  123. StringRef MaskType = MatchedStr.substr(sizeof("mask.") - 1);
  124. unsigned Size = MaskType.size();
  125. if (Warn && (Size == 0 || Size > 8))
  126. H.handleInvalidMaskType(MaskType);
  127. FS.setMaskType(MaskType);
  128. } else if (MatchedStr.equals("sensitive"))
  129. PrivacyFlags = clang::analyze_os_log::OSLogBufferItem::IsSensitive;
  130. else if (PrivacyFlags !=
  131. clang::analyze_os_log::OSLogBufferItem::IsSensitive &&
  132. MatchedStr.equals("private"))
  133. PrivacyFlags = clang::analyze_os_log::OSLogBufferItem::IsPrivate;
  134. else if (PrivacyFlags == 0 && MatchedStr.equals("public"))
  135. PrivacyFlags = clang::analyze_os_log::OSLogBufferItem::IsPublic;
  136. } else {
  137. size_t CommaOrBracePos =
  138. Str.find_if([](char c) { return c == ',' || c == '}'; });
  139. if (CommaOrBracePos == StringRef::npos) {
  140. // Neither a comma nor the closing brace was found.
  141. if (Warn)
  142. H.HandleIncompleteSpecifier(Start, E - Start);
  143. return true;
  144. }
  145. I += CommaOrBracePos + 1;
  146. }
  147. // Continue until the closing brace is found.
  148. } while (*(I - 1) == ',');
  149. // Set the privacy flag.
  150. switch (PrivacyFlags) {
  151. case 0:
  152. break;
  153. case clang::analyze_os_log::OSLogBufferItem::IsPrivate:
  154. FS.setIsPrivate(MatchedStr.data());
  155. break;
  156. case clang::analyze_os_log::OSLogBufferItem::IsPublic:
  157. FS.setIsPublic(MatchedStr.data());
  158. break;
  159. case clang::analyze_os_log::OSLogBufferItem::IsSensitive:
  160. FS.setIsSensitive(MatchedStr.data());
  161. break;
  162. default:
  163. llvm_unreachable("Unexpected privacy flag value");
  164. }
  165. }
  166. // Look for flags (if any).
  167. bool hasMore = true;
  168. for ( ; I != E; ++I) {
  169. switch (*I) {
  170. default: hasMore = false; break;
  171. case '\'':
  172. // FIXME: POSIX specific. Always accept?
  173. FS.setHasThousandsGrouping(I);
  174. break;
  175. case '-': FS.setIsLeftJustified(I); break;
  176. case '+': FS.setHasPlusPrefix(I); break;
  177. case ' ': FS.setHasSpacePrefix(I); break;
  178. case '#': FS.setHasAlternativeForm(I); break;
  179. case '0': FS.setHasLeadingZeros(I); break;
  180. }
  181. if (!hasMore)
  182. break;
  183. }
  184. if (I == E) {
  185. // No more characters left?
  186. if (Warn)
  187. H.HandleIncompleteSpecifier(Start, E - Start);
  188. return true;
  189. }
  190. // Look for the field width (if any).
  191. if (ParseFieldWidth(H, FS, Start, I, E,
  192. FS.usesPositionalArg() ? nullptr : &argIndex))
  193. return true;
  194. if (I == E) {
  195. // No more characters left?
  196. if (Warn)
  197. H.HandleIncompleteSpecifier(Start, E - Start);
  198. return true;
  199. }
  200. // Look for the precision (if any).
  201. if (*I == '.') {
  202. ++I;
  203. if (I == E) {
  204. if (Warn)
  205. H.HandleIncompleteSpecifier(Start, E - Start);
  206. return true;
  207. }
  208. if (ParsePrecision(H, FS, Start, I, E,
  209. FS.usesPositionalArg() ? nullptr : &argIndex))
  210. return true;
  211. if (I == E) {
  212. // No more characters left?
  213. if (Warn)
  214. H.HandleIncompleteSpecifier(Start, E - Start);
  215. return true;
  216. }
  217. }
  218. if (ParseVectorModifier(H, FS, I, E, LO))
  219. return true;
  220. // Look for the length modifier.
  221. if (ParseLengthModifier(FS, I, E, LO) && I == E) {
  222. // No more characters left?
  223. if (Warn)
  224. H.HandleIncompleteSpecifier(Start, E - Start);
  225. return true;
  226. }
  227. // Look for the Objective-C modifier flags, if any.
  228. // We parse these here, even if they don't apply to
  229. // the conversion specifier, and then emit an error
  230. // later if the conversion specifier isn't '@'. This
  231. // enables better recovery, and we don't know if
  232. // these flags are applicable until later.
  233. const char *ObjCModifierFlagsStart = nullptr,
  234. *ObjCModifierFlagsEnd = nullptr;
  235. if (*I == '[') {
  236. ObjCModifierFlagsStart = I;
  237. ++I;
  238. auto flagStart = I;
  239. for (;; ++I) {
  240. ObjCModifierFlagsEnd = I;
  241. if (I == E) {
  242. if (Warn)
  243. H.HandleIncompleteSpecifier(Start, E - Start);
  244. return true;
  245. }
  246. // Did we find the closing ']'?
  247. if (*I == ']') {
  248. if (ParseObjCFlags(H, FS, flagStart, I, Warn))
  249. return true;
  250. ++I;
  251. break;
  252. }
  253. // There are no separators defined yet for multiple
  254. // Objective-C modifier flags. When those are
  255. // defined, this is the place to check.
  256. }
  257. }
  258. if (*I == '\0') {
  259. // Detect spurious null characters, which are likely errors.
  260. H.HandleNullChar(I);
  261. return true;
  262. }
  263. // Finally, look for the conversion specifier.
  264. const char *conversionPosition = I++;
  265. ConversionSpecifier::Kind k = ConversionSpecifier::InvalidSpecifier;
  266. switch (*conversionPosition) {
  267. default:
  268. break;
  269. // C99: 7.19.6.1 (section 8).
  270. case '%': k = ConversionSpecifier::PercentArg; break;
  271. case 'A': k = ConversionSpecifier::AArg; break;
  272. case 'E': k = ConversionSpecifier::EArg; break;
  273. case 'F': k = ConversionSpecifier::FArg; break;
  274. case 'G': k = ConversionSpecifier::GArg; break;
  275. case 'X': k = ConversionSpecifier::XArg; break;
  276. case 'a': k = ConversionSpecifier::aArg; break;
  277. case 'c': k = ConversionSpecifier::cArg; break;
  278. case 'd': k = ConversionSpecifier::dArg; break;
  279. case 'e': k = ConversionSpecifier::eArg; break;
  280. case 'f': k = ConversionSpecifier::fArg; break;
  281. case 'g': k = ConversionSpecifier::gArg; break;
  282. case 'i': k = ConversionSpecifier::iArg; break;
  283. case 'n':
  284. // Not handled, but reserved in OpenCL.
  285. if (!LO.OpenCL)
  286. k = ConversionSpecifier::nArg;
  287. break;
  288. case 'o': k = ConversionSpecifier::oArg; break;
  289. case 'p': k = ConversionSpecifier::pArg; break;
  290. case 's': k = ConversionSpecifier::sArg; break;
  291. case 'u': k = ConversionSpecifier::uArg; break;
  292. case 'x': k = ConversionSpecifier::xArg; break;
  293. // POSIX specific.
  294. case 'C': k = ConversionSpecifier::CArg; break;
  295. case 'S': k = ConversionSpecifier::SArg; break;
  296. // Apple extension for os_log
  297. case 'P':
  298. k = ConversionSpecifier::PArg;
  299. break;
  300. // Objective-C.
  301. case '@': k = ConversionSpecifier::ObjCObjArg; break;
  302. // Glibc specific.
  303. case 'm': k = ConversionSpecifier::PrintErrno; break;
  304. // FreeBSD kernel specific.
  305. case 'b':
  306. if (isFreeBSDKPrintf)
  307. k = ConversionSpecifier::FreeBSDbArg; // int followed by char *
  308. break;
  309. case 'r':
  310. if (isFreeBSDKPrintf)
  311. k = ConversionSpecifier::FreeBSDrArg; // int
  312. break;
  313. case 'y':
  314. if (isFreeBSDKPrintf)
  315. k = ConversionSpecifier::FreeBSDyArg; // int
  316. break;
  317. // Apple-specific.
  318. case 'D':
  319. if (isFreeBSDKPrintf)
  320. k = ConversionSpecifier::FreeBSDDArg; // void * followed by char *
  321. else if (Target.getTriple().isOSDarwin())
  322. k = ConversionSpecifier::DArg;
  323. break;
  324. case 'O':
  325. if (Target.getTriple().isOSDarwin())
  326. k = ConversionSpecifier::OArg;
  327. break;
  328. case 'U':
  329. if (Target.getTriple().isOSDarwin())
  330. k = ConversionSpecifier::UArg;
  331. break;
  332. // MS specific.
  333. case 'Z':
  334. if (Target.getTriple().isOSMSVCRT())
  335. k = ConversionSpecifier::ZArg;
  336. break;
  337. }
  338. // Check to see if we used the Objective-C modifier flags with
  339. // a conversion specifier other than '@'.
  340. if (k != ConversionSpecifier::ObjCObjArg &&
  341. k != ConversionSpecifier::InvalidSpecifier &&
  342. ObjCModifierFlagsStart) {
  343. H.HandleObjCFlagsWithNonObjCConversion(ObjCModifierFlagsStart,
  344. ObjCModifierFlagsEnd + 1,
  345. conversionPosition);
  346. return true;
  347. }
  348. PrintfConversionSpecifier CS(conversionPosition, k);
  349. FS.setConversionSpecifier(CS);
  350. if (CS.consumesDataArgument() && !FS.usesPositionalArg())
  351. FS.setArgIndex(argIndex++);
  352. // FreeBSD kernel specific.
  353. if (k == ConversionSpecifier::FreeBSDbArg ||
  354. k == ConversionSpecifier::FreeBSDDArg)
  355. argIndex++;
  356. if (k == ConversionSpecifier::InvalidSpecifier) {
  357. unsigned Len = I - Start;
  358. if (ParseUTF8InvalidSpecifier(Start, E, Len)) {
  359. CS.setEndScanList(Start + Len);
  360. FS.setConversionSpecifier(CS);
  361. }
  362. // Assume the conversion takes one argument.
  363. return !H.HandleInvalidPrintfConversionSpecifier(FS, Start, Len);
  364. }
  365. return PrintfSpecifierResult(Start, FS);
  366. }
  367. bool clang::analyze_format_string::ParsePrintfString(FormatStringHandler &H,
  368. const char *I,
  369. const char *E,
  370. const LangOptions &LO,
  371. const TargetInfo &Target,
  372. bool isFreeBSDKPrintf) {
  373. unsigned argIndex = 0;
  374. // Keep looking for a format specifier until we have exhausted the string.
  375. while (I != E) {
  376. const PrintfSpecifierResult &FSR = ParsePrintfSpecifier(H, I, E, argIndex,
  377. LO, Target, true,
  378. isFreeBSDKPrintf);
  379. // Did a fail-stop error of any kind occur when parsing the specifier?
  380. // If so, don't do any more processing.
  381. if (FSR.shouldStop())
  382. return true;
  383. // Did we exhaust the string or encounter an error that
  384. // we can recover from?
  385. if (!FSR.hasValue())
  386. continue;
  387. // We have a format specifier. Pass it to the callback.
  388. if (!H.HandlePrintfSpecifier(FSR.getValue(), FSR.getStart(),
  389. I - FSR.getStart()))
  390. return true;
  391. }
  392. assert(I == E && "Format string not exhausted");
  393. return false;
  394. }
  395. bool clang::analyze_format_string::ParseFormatStringHasSArg(const char *I,
  396. const char *E,
  397. const LangOptions &LO,
  398. const TargetInfo &Target) {
  399. unsigned argIndex = 0;
  400. // Keep looking for a %s format specifier until we have exhausted the string.
  401. FormatStringHandler H;
  402. while (I != E) {
  403. const PrintfSpecifierResult &FSR = ParsePrintfSpecifier(H, I, E, argIndex,
  404. LO, Target, false,
  405. false);
  406. // Did a fail-stop error of any kind occur when parsing the specifier?
  407. // If so, don't do any more processing.
  408. if (FSR.shouldStop())
  409. return false;
  410. // Did we exhaust the string or encounter an error that
  411. // we can recover from?
  412. if (!FSR.hasValue())
  413. continue;
  414. const analyze_printf::PrintfSpecifier &FS = FSR.getValue();
  415. // Return true if this a %s format specifier.
  416. if (FS.getConversionSpecifier().getKind() == ConversionSpecifier::Kind::sArg)
  417. return true;
  418. }
  419. return false;
  420. }
  421. bool clang::analyze_format_string::parseFormatStringHasFormattingSpecifiers(
  422. const char *Begin, const char *End, const LangOptions &LO,
  423. const TargetInfo &Target) {
  424. unsigned ArgIndex = 0;
  425. // Keep looking for a formatting specifier until we have exhausted the string.
  426. FormatStringHandler H;
  427. while (Begin != End) {
  428. const PrintfSpecifierResult &FSR =
  429. ParsePrintfSpecifier(H, Begin, End, ArgIndex, LO, Target, false, false);
  430. if (FSR.shouldStop())
  431. break;
  432. if (FSR.hasValue())
  433. return true;
  434. }
  435. return false;
  436. }
  437. //===----------------------------------------------------------------------===//
  438. // Methods on PrintfSpecifier.
  439. //===----------------------------------------------------------------------===//
  440. ArgType PrintfSpecifier::getScalarArgType(ASTContext &Ctx,
  441. bool IsObjCLiteral) const {
  442. if (CS.getKind() == ConversionSpecifier::cArg)
  443. switch (LM.getKind()) {
  444. case LengthModifier::None:
  445. return Ctx.IntTy;
  446. case LengthModifier::AsLong:
  447. case LengthModifier::AsWide:
  448. return ArgType(ArgType::WIntTy, "wint_t");
  449. case LengthModifier::AsShort:
  450. if (Ctx.getTargetInfo().getTriple().isOSMSVCRT())
  451. return Ctx.IntTy;
  452. LLVM_FALLTHROUGH;
  453. default:
  454. return ArgType::Invalid();
  455. }
  456. if (CS.isIntArg())
  457. switch (LM.getKind()) {
  458. case LengthModifier::AsLongDouble:
  459. // GNU extension.
  460. return Ctx.LongLongTy;
  461. case LengthModifier::None:
  462. case LengthModifier::AsShortLong:
  463. return Ctx.IntTy;
  464. case LengthModifier::AsInt32:
  465. return ArgType(Ctx.IntTy, "__int32");
  466. case LengthModifier::AsChar:
  467. return ArgType::AnyCharTy;
  468. case LengthModifier::AsShort: return Ctx.ShortTy;
  469. case LengthModifier::AsLong: return Ctx.LongTy;
  470. case LengthModifier::AsLongLong:
  471. case LengthModifier::AsQuad:
  472. return Ctx.LongLongTy;
  473. case LengthModifier::AsInt64:
  474. return ArgType(Ctx.LongLongTy, "__int64");
  475. case LengthModifier::AsIntMax:
  476. return ArgType(Ctx.getIntMaxType(), "intmax_t");
  477. case LengthModifier::AsSizeT:
  478. return ArgType::makeSizeT(ArgType(Ctx.getSignedSizeType(), "ssize_t"));
  479. case LengthModifier::AsInt3264:
  480. return Ctx.getTargetInfo().getTriple().isArch64Bit()
  481. ? ArgType(Ctx.LongLongTy, "__int64")
  482. : ArgType(Ctx.IntTy, "__int32");
  483. case LengthModifier::AsPtrDiff:
  484. return ArgType::makePtrdiffT(
  485. ArgType(Ctx.getPointerDiffType(), "ptrdiff_t"));
  486. case LengthModifier::AsAllocate:
  487. case LengthModifier::AsMAllocate:
  488. case LengthModifier::AsWide:
  489. return ArgType::Invalid();
  490. }
  491. if (CS.isUIntArg())
  492. switch (LM.getKind()) {
  493. case LengthModifier::AsLongDouble:
  494. // GNU extension.
  495. return Ctx.UnsignedLongLongTy;
  496. case LengthModifier::None:
  497. case LengthModifier::AsShortLong:
  498. return Ctx.UnsignedIntTy;
  499. case LengthModifier::AsInt32:
  500. return ArgType(Ctx.UnsignedIntTy, "unsigned __int32");
  501. case LengthModifier::AsChar: return Ctx.UnsignedCharTy;
  502. case LengthModifier::AsShort: return Ctx.UnsignedShortTy;
  503. case LengthModifier::AsLong: return Ctx.UnsignedLongTy;
  504. case LengthModifier::AsLongLong:
  505. case LengthModifier::AsQuad:
  506. return Ctx.UnsignedLongLongTy;
  507. case LengthModifier::AsInt64:
  508. return ArgType(Ctx.UnsignedLongLongTy, "unsigned __int64");
  509. case LengthModifier::AsIntMax:
  510. return ArgType(Ctx.getUIntMaxType(), "uintmax_t");
  511. case LengthModifier::AsSizeT:
  512. return ArgType::makeSizeT(ArgType(Ctx.getSizeType(), "size_t"));
  513. case LengthModifier::AsInt3264:
  514. return Ctx.getTargetInfo().getTriple().isArch64Bit()
  515. ? ArgType(Ctx.UnsignedLongLongTy, "unsigned __int64")
  516. : ArgType(Ctx.UnsignedIntTy, "unsigned __int32");
  517. case LengthModifier::AsPtrDiff:
  518. return ArgType::makePtrdiffT(
  519. ArgType(Ctx.getUnsignedPointerDiffType(), "unsigned ptrdiff_t"));
  520. case LengthModifier::AsAllocate:
  521. case LengthModifier::AsMAllocate:
  522. case LengthModifier::AsWide:
  523. return ArgType::Invalid();
  524. }
  525. if (CS.isDoubleArg()) {
  526. if (!VectorNumElts.isInvalid()) {
  527. switch (LM.getKind()) {
  528. case LengthModifier::AsShort:
  529. return Ctx.HalfTy;
  530. case LengthModifier::AsShortLong:
  531. return Ctx.FloatTy;
  532. case LengthModifier::AsLong:
  533. default:
  534. return Ctx.DoubleTy;
  535. }
  536. }
  537. if (LM.getKind() == LengthModifier::AsLongDouble)
  538. return Ctx.LongDoubleTy;
  539. return Ctx.DoubleTy;
  540. }
  541. if (CS.getKind() == ConversionSpecifier::nArg) {
  542. switch (LM.getKind()) {
  543. case LengthModifier::None:
  544. return ArgType::PtrTo(Ctx.IntTy);
  545. case LengthModifier::AsChar:
  546. return ArgType::PtrTo(Ctx.SignedCharTy);
  547. case LengthModifier::AsShort:
  548. return ArgType::PtrTo(Ctx.ShortTy);
  549. case LengthModifier::AsLong:
  550. return ArgType::PtrTo(Ctx.LongTy);
  551. case LengthModifier::AsLongLong:
  552. case LengthModifier::AsQuad:
  553. return ArgType::PtrTo(Ctx.LongLongTy);
  554. case LengthModifier::AsIntMax:
  555. return ArgType::PtrTo(ArgType(Ctx.getIntMaxType(), "intmax_t"));
  556. case LengthModifier::AsSizeT:
  557. return ArgType::PtrTo(ArgType(Ctx.getSignedSizeType(), "ssize_t"));
  558. case LengthModifier::AsPtrDiff:
  559. return ArgType::PtrTo(ArgType(Ctx.getPointerDiffType(), "ptrdiff_t"));
  560. case LengthModifier::AsLongDouble:
  561. return ArgType(); // FIXME: Is this a known extension?
  562. case LengthModifier::AsAllocate:
  563. case LengthModifier::AsMAllocate:
  564. case LengthModifier::AsInt32:
  565. case LengthModifier::AsInt3264:
  566. case LengthModifier::AsInt64:
  567. case LengthModifier::AsWide:
  568. return ArgType::Invalid();
  569. case LengthModifier::AsShortLong:
  570. llvm_unreachable("only used for OpenCL which doesn not handle nArg");
  571. }
  572. }
  573. switch (CS.getKind()) {
  574. case ConversionSpecifier::sArg:
  575. if (LM.getKind() == LengthModifier::AsWideChar) {
  576. if (IsObjCLiteral)
  577. return ArgType(Ctx.getPointerType(Ctx.UnsignedShortTy.withConst()),
  578. "const unichar *");
  579. return ArgType(ArgType::WCStrTy, "wchar_t *");
  580. }
  581. if (LM.getKind() == LengthModifier::AsWide)
  582. return ArgType(ArgType::WCStrTy, "wchar_t *");
  583. return ArgType::CStrTy;
  584. case ConversionSpecifier::SArg:
  585. if (IsObjCLiteral)
  586. return ArgType(Ctx.getPointerType(Ctx.UnsignedShortTy.withConst()),
  587. "const unichar *");
  588. if (Ctx.getTargetInfo().getTriple().isOSMSVCRT() &&
  589. LM.getKind() == LengthModifier::AsShort)
  590. return ArgType::CStrTy;
  591. return ArgType(ArgType::WCStrTy, "wchar_t *");
  592. case ConversionSpecifier::CArg:
  593. if (IsObjCLiteral)
  594. return ArgType(Ctx.UnsignedShortTy, "unichar");
  595. if (Ctx.getTargetInfo().getTriple().isOSMSVCRT() &&
  596. LM.getKind() == LengthModifier::AsShort)
  597. return Ctx.IntTy;
  598. return ArgType(Ctx.WideCharTy, "wchar_t");
  599. case ConversionSpecifier::pArg:
  600. case ConversionSpecifier::PArg:
  601. return ArgType::CPointerTy;
  602. case ConversionSpecifier::ObjCObjArg:
  603. return ArgType::ObjCPointerTy;
  604. default:
  605. break;
  606. }
  607. // FIXME: Handle other cases.
  608. return ArgType();
  609. }
  610. ArgType PrintfSpecifier::getArgType(ASTContext &Ctx,
  611. bool IsObjCLiteral) const {
  612. const PrintfConversionSpecifier &CS = getConversionSpecifier();
  613. if (!CS.consumesDataArgument())
  614. return ArgType::Invalid();
  615. ArgType ScalarTy = getScalarArgType(Ctx, IsObjCLiteral);
  616. if (!ScalarTy.isValid() || VectorNumElts.isInvalid())
  617. return ScalarTy;
  618. return ScalarTy.makeVectorType(Ctx, VectorNumElts.getConstantAmount());
  619. }
  620. bool PrintfSpecifier::fixType(QualType QT, const LangOptions &LangOpt,
  621. ASTContext &Ctx, bool IsObjCLiteral) {
  622. // %n is different from other conversion specifiers; don't try to fix it.
  623. if (CS.getKind() == ConversionSpecifier::nArg)
  624. return false;
  625. // Handle Objective-C objects first. Note that while the '%@' specifier will
  626. // not warn for structure pointer or void pointer arguments (because that's
  627. // how CoreFoundation objects are implemented), we only show a fixit for '%@'
  628. // if we know it's an object (block, id, class, or __attribute__((NSObject))).
  629. if (QT->isObjCRetainableType()) {
  630. if (!IsObjCLiteral)
  631. return false;
  632. CS.setKind(ConversionSpecifier::ObjCObjArg);
  633. // Disable irrelevant flags
  634. HasThousandsGrouping = false;
  635. HasPlusPrefix = false;
  636. HasSpacePrefix = false;
  637. HasAlternativeForm = false;
  638. HasLeadingZeroes = false;
  639. Precision.setHowSpecified(OptionalAmount::NotSpecified);
  640. LM.setKind(LengthModifier::None);
  641. return true;
  642. }
  643. // Handle strings next (char *, wchar_t *)
  644. if (QT->isPointerType() && (QT->getPointeeType()->isAnyCharacterType())) {
  645. CS.setKind(ConversionSpecifier::sArg);
  646. // Disable irrelevant flags
  647. HasAlternativeForm = 0;
  648. HasLeadingZeroes = 0;
  649. // Set the long length modifier for wide characters
  650. if (QT->getPointeeType()->isWideCharType())
  651. LM.setKind(LengthModifier::AsWideChar);
  652. else
  653. LM.setKind(LengthModifier::None);
  654. return true;
  655. }
  656. // If it's an enum, get its underlying type.
  657. if (const EnumType *ETy = QT->getAs<EnumType>())
  658. QT = ETy->getDecl()->getIntegerType();
  659. const BuiltinType *BT = QT->getAs<BuiltinType>();
  660. if (!BT) {
  661. const VectorType *VT = QT->getAs<VectorType>();
  662. if (VT) {
  663. QT = VT->getElementType();
  664. BT = QT->getAs<BuiltinType>();
  665. VectorNumElts = OptionalAmount(VT->getNumElements());
  666. }
  667. }
  668. // We can only work with builtin types.
  669. if (!BT)
  670. return false;
  671. // Set length modifier
  672. switch (BT->getKind()) {
  673. case BuiltinType::Bool:
  674. case BuiltinType::WChar_U:
  675. case BuiltinType::WChar_S:
  676. case BuiltinType::Char8: // FIXME: Treat like 'char'?
  677. case BuiltinType::Char16:
  678. case BuiltinType::Char32:
  679. case BuiltinType::UInt128:
  680. case BuiltinType::Int128:
  681. case BuiltinType::Half:
  682. case BuiltinType::Float16:
  683. case BuiltinType::Float128:
  684. case BuiltinType::ShortAccum:
  685. case BuiltinType::Accum:
  686. case BuiltinType::LongAccum:
  687. case BuiltinType::UShortAccum:
  688. case BuiltinType::UAccum:
  689. case BuiltinType::ULongAccum:
  690. case BuiltinType::ShortFract:
  691. case BuiltinType::Fract:
  692. case BuiltinType::LongFract:
  693. case BuiltinType::UShortFract:
  694. case BuiltinType::UFract:
  695. case BuiltinType::ULongFract:
  696. case BuiltinType::SatShortAccum:
  697. case BuiltinType::SatAccum:
  698. case BuiltinType::SatLongAccum:
  699. case BuiltinType::SatUShortAccum:
  700. case BuiltinType::SatUAccum:
  701. case BuiltinType::SatULongAccum:
  702. case BuiltinType::SatShortFract:
  703. case BuiltinType::SatFract:
  704. case BuiltinType::SatLongFract:
  705. case BuiltinType::SatUShortFract:
  706. case BuiltinType::SatUFract:
  707. case BuiltinType::SatULongFract:
  708. // Various types which are non-trivial to correct.
  709. return false;
  710. #define IMAGE_TYPE(ImgType, Id, SingletonId, Access, Suffix) \
  711. case BuiltinType::Id:
  712. #include "clang/Basic/OpenCLImageTypes.def"
  713. #define EXT_OPAQUE_TYPE(ExtType, Id, Ext) \
  714. case BuiltinType::Id:
  715. #include "clang/Basic/OpenCLExtensionTypes.def"
  716. #define SVE_TYPE(Name, Id, SingletonId) \
  717. case BuiltinType::Id:
  718. #include "clang/Basic/AArch64SVEACLETypes.def"
  719. #define SIGNED_TYPE(Id, SingletonId)
  720. #define UNSIGNED_TYPE(Id, SingletonId)
  721. #define FLOATING_TYPE(Id, SingletonId)
  722. #define BUILTIN_TYPE(Id, SingletonId) \
  723. case BuiltinType::Id:
  724. #include "clang/AST/BuiltinTypes.def"
  725. // Misc other stuff which doesn't make sense here.
  726. return false;
  727. case BuiltinType::UInt:
  728. case BuiltinType::Int:
  729. case BuiltinType::Float:
  730. LM.setKind(VectorNumElts.isInvalid() ?
  731. LengthModifier::None : LengthModifier::AsShortLong);
  732. break;
  733. case BuiltinType::Double:
  734. LM.setKind(VectorNumElts.isInvalid() ?
  735. LengthModifier::None : LengthModifier::AsLong);
  736. break;
  737. case BuiltinType::Char_U:
  738. case BuiltinType::UChar:
  739. case BuiltinType::Char_S:
  740. case BuiltinType::SChar:
  741. LM.setKind(LengthModifier::AsChar);
  742. break;
  743. case BuiltinType::Short:
  744. case BuiltinType::UShort:
  745. LM.setKind(LengthModifier::AsShort);
  746. break;
  747. case BuiltinType::Long:
  748. case BuiltinType::ULong:
  749. LM.setKind(LengthModifier::AsLong);
  750. break;
  751. case BuiltinType::LongLong:
  752. case BuiltinType::ULongLong:
  753. LM.setKind(LengthModifier::AsLongLong);
  754. break;
  755. case BuiltinType::LongDouble:
  756. LM.setKind(LengthModifier::AsLongDouble);
  757. break;
  758. }
  759. // Handle size_t, ptrdiff_t, etc. that have dedicated length modifiers in C99.
  760. if (isa<TypedefType>(QT) && (LangOpt.C99 || LangOpt.CPlusPlus11))
  761. namedTypeToLengthModifier(QT, LM);
  762. // If fixing the length modifier was enough, we might be done.
  763. if (hasValidLengthModifier(Ctx.getTargetInfo(), LangOpt)) {
  764. // If we're going to offer a fix anyway, make sure the sign matches.
  765. switch (CS.getKind()) {
  766. case ConversionSpecifier::uArg:
  767. case ConversionSpecifier::UArg:
  768. if (QT->isSignedIntegerType())
  769. CS.setKind(clang::analyze_format_string::ConversionSpecifier::dArg);
  770. break;
  771. case ConversionSpecifier::dArg:
  772. case ConversionSpecifier::DArg:
  773. case ConversionSpecifier::iArg:
  774. if (QT->isUnsignedIntegerType() && !HasPlusPrefix)
  775. CS.setKind(clang::analyze_format_string::ConversionSpecifier::uArg);
  776. break;
  777. default:
  778. // Other specifiers do not have signed/unsigned variants.
  779. break;
  780. }
  781. const analyze_printf::ArgType &ATR = getArgType(Ctx, IsObjCLiteral);
  782. if (ATR.isValid() && ATR.matchesType(Ctx, QT))
  783. return true;
  784. }
  785. // Set conversion specifier and disable any flags which do not apply to it.
  786. // Let typedefs to char fall through to int, as %c is silly for uint8_t.
  787. if (!isa<TypedefType>(QT) && QT->isCharType()) {
  788. CS.setKind(ConversionSpecifier::cArg);
  789. LM.setKind(LengthModifier::None);
  790. Precision.setHowSpecified(OptionalAmount::NotSpecified);
  791. HasAlternativeForm = 0;
  792. HasLeadingZeroes = 0;
  793. HasPlusPrefix = 0;
  794. }
  795. // Test for Floating type first as LongDouble can pass isUnsignedIntegerType
  796. else if (QT->isRealFloatingType()) {
  797. CS.setKind(ConversionSpecifier::fArg);
  798. }
  799. else if (QT->isSignedIntegerType()) {
  800. CS.setKind(ConversionSpecifier::dArg);
  801. HasAlternativeForm = 0;
  802. }
  803. else if (QT->isUnsignedIntegerType()) {
  804. CS.setKind(ConversionSpecifier::uArg);
  805. HasAlternativeForm = 0;
  806. HasPlusPrefix = 0;
  807. } else {
  808. llvm_unreachable("Unexpected type");
  809. }
  810. return true;
  811. }
  812. void PrintfSpecifier::toString(raw_ostream &os) const {
  813. // Whilst some features have no defined order, we are using the order
  814. // appearing in the C99 standard (ISO/IEC 9899:1999 (E) 7.19.6.1)
  815. os << "%";
  816. // Positional args
  817. if (usesPositionalArg()) {
  818. os << getPositionalArgIndex() << "$";
  819. }
  820. // Conversion flags
  821. if (IsLeftJustified) os << "-";
  822. if (HasPlusPrefix) os << "+";
  823. if (HasSpacePrefix) os << " ";
  824. if (HasAlternativeForm) os << "#";
  825. if (HasLeadingZeroes) os << "0";
  826. // Minimum field width
  827. FieldWidth.toString(os);
  828. // Precision
  829. Precision.toString(os);
  830. // Vector modifier
  831. if (!VectorNumElts.isInvalid())
  832. os << 'v' << VectorNumElts.getConstantAmount();
  833. // Length modifier
  834. os << LM.toString();
  835. // Conversion specifier
  836. os << CS.toString();
  837. }
  838. bool PrintfSpecifier::hasValidPlusPrefix() const {
  839. if (!HasPlusPrefix)
  840. return true;
  841. // The plus prefix only makes sense for signed conversions
  842. switch (CS.getKind()) {
  843. case ConversionSpecifier::dArg:
  844. case ConversionSpecifier::DArg:
  845. case ConversionSpecifier::iArg:
  846. case ConversionSpecifier::fArg:
  847. case ConversionSpecifier::FArg:
  848. case ConversionSpecifier::eArg:
  849. case ConversionSpecifier::EArg:
  850. case ConversionSpecifier::gArg:
  851. case ConversionSpecifier::GArg:
  852. case ConversionSpecifier::aArg:
  853. case ConversionSpecifier::AArg:
  854. case ConversionSpecifier::FreeBSDrArg:
  855. case ConversionSpecifier::FreeBSDyArg:
  856. return true;
  857. default:
  858. return false;
  859. }
  860. }
  861. bool PrintfSpecifier::hasValidAlternativeForm() const {
  862. if (!HasAlternativeForm)
  863. return true;
  864. // Alternate form flag only valid with the oxXaAeEfFgG conversions
  865. switch (CS.getKind()) {
  866. case ConversionSpecifier::oArg:
  867. case ConversionSpecifier::OArg:
  868. case ConversionSpecifier::xArg:
  869. case ConversionSpecifier::XArg:
  870. case ConversionSpecifier::aArg:
  871. case ConversionSpecifier::AArg:
  872. case ConversionSpecifier::eArg:
  873. case ConversionSpecifier::EArg:
  874. case ConversionSpecifier::fArg:
  875. case ConversionSpecifier::FArg:
  876. case ConversionSpecifier::gArg:
  877. case ConversionSpecifier::GArg:
  878. case ConversionSpecifier::FreeBSDrArg:
  879. case ConversionSpecifier::FreeBSDyArg:
  880. return true;
  881. default:
  882. return false;
  883. }
  884. }
  885. bool PrintfSpecifier::hasValidLeadingZeros() const {
  886. if (!HasLeadingZeroes)
  887. return true;
  888. // Leading zeroes flag only valid with the diouxXaAeEfFgG conversions
  889. switch (CS.getKind()) {
  890. case ConversionSpecifier::dArg:
  891. case ConversionSpecifier::DArg:
  892. case ConversionSpecifier::iArg:
  893. case ConversionSpecifier::oArg:
  894. case ConversionSpecifier::OArg:
  895. case ConversionSpecifier::uArg:
  896. case ConversionSpecifier::UArg:
  897. case ConversionSpecifier::xArg:
  898. case ConversionSpecifier::XArg:
  899. case ConversionSpecifier::aArg:
  900. case ConversionSpecifier::AArg:
  901. case ConversionSpecifier::eArg:
  902. case ConversionSpecifier::EArg:
  903. case ConversionSpecifier::fArg:
  904. case ConversionSpecifier::FArg:
  905. case ConversionSpecifier::gArg:
  906. case ConversionSpecifier::GArg:
  907. case ConversionSpecifier::FreeBSDrArg:
  908. case ConversionSpecifier::FreeBSDyArg:
  909. return true;
  910. default:
  911. return false;
  912. }
  913. }
  914. bool PrintfSpecifier::hasValidSpacePrefix() const {
  915. if (!HasSpacePrefix)
  916. return true;
  917. // The space prefix only makes sense for signed conversions
  918. switch (CS.getKind()) {
  919. case ConversionSpecifier::dArg:
  920. case ConversionSpecifier::DArg:
  921. case ConversionSpecifier::iArg:
  922. case ConversionSpecifier::fArg:
  923. case ConversionSpecifier::FArg:
  924. case ConversionSpecifier::eArg:
  925. case ConversionSpecifier::EArg:
  926. case ConversionSpecifier::gArg:
  927. case ConversionSpecifier::GArg:
  928. case ConversionSpecifier::aArg:
  929. case ConversionSpecifier::AArg:
  930. case ConversionSpecifier::FreeBSDrArg:
  931. case ConversionSpecifier::FreeBSDyArg:
  932. return true;
  933. default:
  934. return false;
  935. }
  936. }
  937. bool PrintfSpecifier::hasValidLeftJustified() const {
  938. if (!IsLeftJustified)
  939. return true;
  940. // The left justified flag is valid for all conversions except n
  941. switch (CS.getKind()) {
  942. case ConversionSpecifier::nArg:
  943. return false;
  944. default:
  945. return true;
  946. }
  947. }
  948. bool PrintfSpecifier::hasValidThousandsGroupingPrefix() const {
  949. if (!HasThousandsGrouping)
  950. return true;
  951. switch (CS.getKind()) {
  952. case ConversionSpecifier::dArg:
  953. case ConversionSpecifier::DArg:
  954. case ConversionSpecifier::iArg:
  955. case ConversionSpecifier::uArg:
  956. case ConversionSpecifier::UArg:
  957. case ConversionSpecifier::fArg:
  958. case ConversionSpecifier::FArg:
  959. case ConversionSpecifier::gArg:
  960. case ConversionSpecifier::GArg:
  961. return true;
  962. default:
  963. return false;
  964. }
  965. }
  966. bool PrintfSpecifier::hasValidPrecision() const {
  967. if (Precision.getHowSpecified() == OptionalAmount::NotSpecified)
  968. return true;
  969. // Precision is only valid with the diouxXaAeEfFgGsP conversions
  970. switch (CS.getKind()) {
  971. case ConversionSpecifier::dArg:
  972. case ConversionSpecifier::DArg:
  973. case ConversionSpecifier::iArg:
  974. case ConversionSpecifier::oArg:
  975. case ConversionSpecifier::OArg:
  976. case ConversionSpecifier::uArg:
  977. case ConversionSpecifier::UArg:
  978. case ConversionSpecifier::xArg:
  979. case ConversionSpecifier::XArg:
  980. case ConversionSpecifier::aArg:
  981. case ConversionSpecifier::AArg:
  982. case ConversionSpecifier::eArg:
  983. case ConversionSpecifier::EArg:
  984. case ConversionSpecifier::fArg:
  985. case ConversionSpecifier::FArg:
  986. case ConversionSpecifier::gArg:
  987. case ConversionSpecifier::GArg:
  988. case ConversionSpecifier::sArg:
  989. case ConversionSpecifier::FreeBSDrArg:
  990. case ConversionSpecifier::FreeBSDyArg:
  991. case ConversionSpecifier::PArg:
  992. return true;
  993. default:
  994. return false;
  995. }
  996. }
  997. bool PrintfSpecifier::hasValidFieldWidth() const {
  998. if (FieldWidth.getHowSpecified() == OptionalAmount::NotSpecified)
  999. return true;
  1000. // The field width is valid for all conversions except n
  1001. switch (CS.getKind()) {
  1002. case ConversionSpecifier::nArg:
  1003. return false;
  1004. default:
  1005. return true;
  1006. }
  1007. }