// FormatString.cpp - Common stuff for handling printf/scanf formats -*- C++ -*-
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// Shared details for processing format strings of printf and scanf
// (and friends).
//
//===----------------------------------------------------------------------===//

#include "FormatStringParsing.h"
#include "clang/Basic/LangOptions.h"
#include "clang/Basic/TargetInfo.h"
#include "llvm/Support/ConvertUTF.h"

using clang::analyze_format_string::ArgType;
using clang::analyze_format_string::FormatStringHandler;
using clang::analyze_format_string::FormatSpecifier;
using clang::analyze_format_string::LengthModifier;
using clang::analyze_format_string::OptionalAmount;
using clang::analyze_format_string::PositionContext;
using clang::analyze_format_string::ConversionSpecifier;
using namespace clang;

// Key function to FormatStringHandler: the destructor is intentionally defined
// out of line in this file, with an empty body.
FormatStringHandler::~FormatStringHandler() {}

//===----------------------------------------------------------------------===//
// Functions for parsing format string components in both printf and
// scanf format strings.
34 //===----------------------------------------------------------------------===// 35 36 OptionalAmount 37 clang::analyze_format_string::ParseAmount(const char *&Beg, const char *E) { 38 const char *I = Beg; 39 UpdateOnReturn <const char*> UpdateBeg(Beg, I); 40 41 unsigned accumulator = 0; 42 bool hasDigits = false; 43 44 for ( ; I != E; ++I) { 45 char c = *I; 46 if (c >= '0' && c <= '9') { 47 hasDigits = true; 48 accumulator = (accumulator * 10) + (c - '0'); 49 continue; 50 } 51 52 if (hasDigits) 53 return OptionalAmount(OptionalAmount::Constant, accumulator, Beg, I - Beg, 54 false); 55 56 break; 57 } 58 59 return OptionalAmount(); 60 } 61 62 OptionalAmount 63 clang::analyze_format_string::ParseNonPositionAmount(const char *&Beg, 64 const char *E, 65 unsigned &argIndex) { 66 if (*Beg == '*') { 67 ++Beg; 68 return OptionalAmount(OptionalAmount::Arg, argIndex++, Beg, 0, false); 69 } 70 71 return ParseAmount(Beg, E); 72 } 73 74 OptionalAmount 75 clang::analyze_format_string::ParsePositionAmount(FormatStringHandler &H, 76 const char *Start, 77 const char *&Beg, 78 const char *E, 79 PositionContext p) { 80 if (*Beg == '*') { 81 const char *I = Beg + 1; 82 const OptionalAmount &Amt = ParseAmount(I, E); 83 84 if (Amt.getHowSpecified() == OptionalAmount::NotSpecified) { 85 H.HandleInvalidPosition(Beg, I - Beg, p); 86 return OptionalAmount(false); 87 } 88 89 if (I == E) { 90 // No more characters left? 91 H.HandleIncompleteSpecifier(Start, E - Start); 92 return OptionalAmount(false); 93 } 94 95 assert(Amt.getHowSpecified() == OptionalAmount::Constant); 96 97 if (*I == '$') { 98 // Handle positional arguments 99 100 // Special case: '*0$', since this is an easy mistake. 
101 if (Amt.getConstantAmount() == 0) { 102 H.HandleZeroPosition(Beg, I - Beg + 1); 103 return OptionalAmount(false); 104 } 105 106 const char *Tmp = Beg; 107 Beg = ++I; 108 109 return OptionalAmount(OptionalAmount::Arg, Amt.getConstantAmount() - 1, 110 Tmp, 0, true); 111 } 112 113 H.HandleInvalidPosition(Beg, I - Beg, p); 114 return OptionalAmount(false); 115 } 116 117 return ParseAmount(Beg, E); 118 } 119 120 121 bool 122 clang::analyze_format_string::ParseFieldWidth(FormatStringHandler &H, 123 FormatSpecifier &CS, 124 const char *Start, 125 const char *&Beg, const char *E, 126 unsigned *argIndex) { 127 // FIXME: Support negative field widths. 128 if (argIndex) { 129 CS.setFieldWidth(ParseNonPositionAmount(Beg, E, *argIndex)); 130 } 131 else { 132 const OptionalAmount Amt = 133 ParsePositionAmount(H, Start, Beg, E, 134 analyze_format_string::FieldWidthPos); 135 136 if (Amt.isInvalid()) 137 return true; 138 CS.setFieldWidth(Amt); 139 } 140 return false; 141 } 142 143 bool 144 clang::analyze_format_string::ParseArgPosition(FormatStringHandler &H, 145 FormatSpecifier &FS, 146 const char *Start, 147 const char *&Beg, 148 const char *E) { 149 const char *I = Beg; 150 151 const OptionalAmount &Amt = ParseAmount(I, E); 152 153 if (I == E) { 154 // No more characters left? 155 H.HandleIncompleteSpecifier(Start, E - Start); 156 return true; 157 } 158 159 if (Amt.getHowSpecified() == OptionalAmount::Constant && *(I++) == '$') { 160 // Warn that positional arguments are non-standard. 161 H.HandlePosition(Start, I - Start); 162 163 // Special case: '%0$', since this is an easy mistake. 164 if (Amt.getConstantAmount() == 0) { 165 H.HandleZeroPosition(Start, I - Start); 166 return true; 167 } 168 169 FS.setArgIndex(Amt.getConstantAmount() - 1); 170 FS.setUsesPositionalArg(); 171 // Update the caller's pointer if we decided to consume 172 // these characters. 
173 Beg = I; 174 return false; 175 } 176 177 return false; 178 } 179 180 bool 181 clang::analyze_format_string::ParseVectorModifier(FormatStringHandler &H, 182 FormatSpecifier &FS, 183 const char *&I, 184 const char *E, 185 const LangOptions &LO) { 186 if (!LO.OpenCL) 187 return false; 188 189 const char *Start = I; 190 if (*I == 'v') { 191 ++I; 192 193 if (I == E) { 194 H.HandleIncompleteSpecifier(Start, E - Start); 195 return true; 196 } 197 198 OptionalAmount NumElts = ParseAmount(I, E); 199 if (NumElts.getHowSpecified() != OptionalAmount::Constant) { 200 H.HandleIncompleteSpecifier(Start, E - Start); 201 return true; 202 } 203 204 FS.setVectorNumElts(NumElts); 205 } 206 207 return false; 208 } 209 210 bool 211 clang::analyze_format_string::ParseLengthModifier(FormatSpecifier &FS, 212 const char *&I, 213 const char *E, 214 const LangOptions &LO, 215 bool IsScanf) { 216 LengthModifier::Kind lmKind = LengthModifier::None; 217 const char *lmPosition = I; 218 switch (*I) { 219 default: 220 return false; 221 case 'h': 222 ++I; 223 if (I != E && *I == 'h') { 224 ++I; 225 lmKind = LengthModifier::AsChar; 226 } else if (I != E && *I == 'l' && LO.OpenCL) { 227 ++I; 228 lmKind = LengthModifier::AsShortLong; 229 } else { 230 lmKind = LengthModifier::AsShort; 231 } 232 break; 233 case 'l': 234 ++I; 235 if (I != E && *I == 'l') { 236 ++I; 237 lmKind = LengthModifier::AsLongLong; 238 } else { 239 lmKind = LengthModifier::AsLong; 240 } 241 break; 242 case 'j': lmKind = LengthModifier::AsIntMax; ++I; break; 243 case 'z': lmKind = LengthModifier::AsSizeT; ++I; break; 244 case 't': lmKind = LengthModifier::AsPtrDiff; ++I; break; 245 case 'L': lmKind = LengthModifier::AsLongDouble; ++I; break; 246 case 'q': lmKind = LengthModifier::AsQuad; ++I; break; 247 case 'a': 248 if (IsScanf && !LO.C99 && !LO.CPlusPlus11) { 249 // For scanf in C90, look at the next character to see if this should 250 // be parsed as the GNU extension 'a' length modifier. 
If not, this 251 // will be parsed as a conversion specifier. 252 ++I; 253 if (I != E && (*I == 's' || *I == 'S' || *I == '[')) { 254 lmKind = LengthModifier::AsAllocate; 255 break; 256 } 257 --I; 258 } 259 return false; 260 case 'm': 261 if (IsScanf) { 262 lmKind = LengthModifier::AsMAllocate; 263 ++I; 264 break; 265 } 266 return false; 267 // printf: AsInt64, AsInt32, AsInt3264 268 // scanf: AsInt64 269 case 'I': 270 if (I + 1 != E && I + 2 != E) { 271 if (I[1] == '6' && I[2] == '4') { 272 I += 3; 273 lmKind = LengthModifier::AsInt64; 274 break; 275 } 276 if (IsScanf) 277 return false; 278 279 if (I[1] == '3' && I[2] == '2') { 280 I += 3; 281 lmKind = LengthModifier::AsInt32; 282 break; 283 } 284 } 285 ++I; 286 lmKind = LengthModifier::AsInt3264; 287 break; 288 case 'w': 289 lmKind = LengthModifier::AsWide; ++I; break; 290 } 291 LengthModifier lm(lmPosition, lmKind); 292 FS.setLengthModifier(lm); 293 return true; 294 } 295 296 bool clang::analyze_format_string::ParseUTF8InvalidSpecifier( 297 const char *SpecifierBegin, const char *FmtStrEnd, unsigned &Len) { 298 if (SpecifierBegin + 1 >= FmtStrEnd) 299 return false; 300 301 const llvm::UTF8 *SB = 302 reinterpret_cast<const llvm::UTF8 *>(SpecifierBegin + 1); 303 const llvm::UTF8 *SE = reinterpret_cast<const llvm::UTF8 *>(FmtStrEnd); 304 const char FirstByte = *SB; 305 306 // If the invalid specifier is a multibyte UTF-8 string, return the 307 // total length accordingly so that the conversion specifier can be 308 // properly updated to reflect a complete UTF-8 specifier. 309 unsigned NumBytes = llvm::getNumBytesForUTF8(FirstByte); 310 if (NumBytes == 1) 311 return false; 312 if (SB + NumBytes > SE) 313 return false; 314 315 Len = NumBytes + 1; 316 return true; 317 } 318 319 //===----------------------------------------------------------------------===// 320 // Methods on ArgType. 
//===----------------------------------------------------------------------===//

/// Classify how well the argument type \p argTy satisfies this ArgType.
///
/// When Ptr is set, \p argTy must be a pointer to a non-const-qualified type;
/// the pointee is then matched against the kind K.  The result is one of the
/// MatchKind values returned below (Match, NoMatch, NoMatchPedantic,
/// NoMatchTypeConfusion).
clang::analyze_format_string::ArgType::MatchKind
ArgType::matchesType(ASTContext &C, QualType argTy) const {
  if (Ptr) {
    // It has to be a pointer.
    const PointerType *PT = argTy->getAs<PointerType>();
    if (!PT)
      return NoMatch;

    // We cannot write through a const qualified pointer.
    if (PT->getPointeeType().isConstQualified())
      return NoMatch;

    // From here on, match against the pointed-to type.
    argTy = PT->getPointeeType();
  }

  switch (K) {
    case InvalidTy:
      llvm_unreachable("ArgType must be valid");

    case UnknownTy:
      // Nothing is known about the expected type, so anything matches.
      return Match;

    case AnyCharTy: {
      if (const EnumType *ETy = argTy->getAs<EnumType>()) {
        // If the enum is incomplete we know nothing about the underlying type,
        // so it is not accepted as a character type.
        if (!ETy->getDecl()->isComplete())
          return NoMatch;
        argTy = ETy->getDecl()->getIntegerType();
      }

      // Any character builtin (and bool) is accepted.
      if (const BuiltinType *BT = argTy->getAs<BuiltinType>())
        switch (BT->getKind()) {
          default:
            break;
          case BuiltinType::Char_S:
          case BuiltinType::SChar:
          case BuiltinType::UChar:
          case BuiltinType::Char_U:
          case BuiltinType::Bool:
            return Match;
        }
      return NoMatch;
    }

    case SpecificTy: {
      if (const EnumType *ETy = argTy->getAs<EnumType>()) {
        // If the enum is incomplete we know nothing about the underlying type.
        // Assume that it's 'int'.
        if (!ETy->getDecl()->isComplete())
          argTy = C.IntTy;
        else
          argTy = ETy->getDecl()->getIntegerType();
      }
      // Compare canonical, unqualified types.
      argTy = C.getCanonicalType(argTy).getUnqualifiedType();

      if (T == argTy)
        return Match;
      // Check for "compatible types": the argument matches when the expected
      // type T is the same-width type of the opposite signedness.
      if (const BuiltinType *BT = argTy->getAs<BuiltinType>())
        switch (BT->getKind()) {
          default:
            break;
          case BuiltinType::Char_S:
          case BuiltinType::SChar:
          case BuiltinType::Char_U:
          case BuiltinType::UChar:
          case BuiltinType::Bool:
            // A character/bool argument where a short is expected gets its
            // own result kind rather than a plain NoMatch.
            if (T == C.UnsignedShortTy || T == C.ShortTy)
              return NoMatchTypeConfusion;
            return T == C.UnsignedCharTy || T == C.SignedCharTy ? Match
                                                                  : NoMatch;
          case BuiltinType::Short:
            return T == C.UnsignedShortTy ? Match : NoMatch;
          case BuiltinType::UShort:
            return T == C.ShortTy ? Match : NoMatch;
          case BuiltinType::Int:
            return T == C.UnsignedIntTy ? Match : NoMatch;
          case BuiltinType::UInt:
            return T == C.IntTy ? Match : NoMatch;
          case BuiltinType::Long:
            return T == C.UnsignedLongTy ? Match : NoMatch;
          case BuiltinType::ULong:
            return T == C.LongTy ? Match : NoMatch;
          case BuiltinType::LongLong:
            return T == C.UnsignedLongLongTy ? Match : NoMatch;
          case BuiltinType::ULongLong:
            return T == C.LongLongTy ? Match : NoMatch;
        }
      return NoMatch;
    }

    case CStrTy: {
      // Accept a pointer to any of the character builtin types.
      const PointerType *PT = argTy->getAs<PointerType>();
      if (!PT)
        return NoMatch;
      QualType pointeeTy = PT->getPointeeType();
      if (const BuiltinType *BT = pointeeTy->getAs<BuiltinType>())
        switch (BT->getKind()) {
          case BuiltinType::Char_U:
          case BuiltinType::UChar:
          case BuiltinType::Char_S:
          case BuiltinType::SChar:
            return Match;
          default:
            break;
        }

      return NoMatch;
    }

    case WCStrTy: {
      // Accept a pointer whose canonical, unqualified pointee is the wide
      // character type.
      const PointerType *PT = argTy->getAs<PointerType>();
      if (!PT)
        return NoMatch;
      QualType pointeeTy =
        C.getCanonicalType(PT->getPointeeType()).getUnqualifiedType();
      return pointeeTy == C.getWideCharType() ? Match : NoMatch;
    }

    case WIntTy: {
      QualType WInt = C.getCanonicalType(C.getWIntType()).getUnqualifiedType();

      if (C.getCanonicalType(argTy).getUnqualifiedType() == WInt)
        return Match;

      // Otherwise compare against the argument after integer promotion.
      QualType PromoArg = argTy->isPromotableIntegerType()
                              ? C.getPromotedIntegerType(argTy)
                              : argTy;
      PromoArg = C.getCanonicalType(PromoArg).getUnqualifiedType();

      // If the promoted argument is the corresponding signed type of the
      // wint_t type, then it should match.
      if (PromoArg->hasSignedIntegerRepresentation() &&
          C.getCorrespondingUnsignedType(PromoArg) == WInt)
        return Match;

      return WInt == PromoArg ? Match : NoMatch;
    }

    case CPointerTy:
      // 'void *' matches exactly; any other pointer-like type only yields the
      // pedantic mismatch kind.
      if (argTy->isVoidPointerType()) {
        return Match;
      } if (argTy->isPointerType() || argTy->isObjCObjectPointerType() ||
            argTy->isBlockPointerType() || argTy->isNullPtrType()) {
        return NoMatchPedantic;
      } else {
        return NoMatch;
      }

    case ObjCPointerTy: {
      if (argTy->getAs<ObjCObjectPointerType>() ||
          argTy->getAs<BlockPointerType>())
        return Match;

      // Handle implicit toll-free bridging.
      if (const PointerType *PT = argTy->getAs<PointerType>()) {
        // Things such as CFTypeRef are really just opaque pointers
        // to C structs representing CF types that can often be bridged
        // to Objective-C objects.  Since the compiler doesn't know which
        // structs can be toll-free bridged, we just accept them all.
        QualType pointee = PT->getPointeeType();
        if (pointee->getAsStructureType() || pointee->isVoidType())
          return Match;
      }
      return NoMatch;
    }
  }

  llvm_unreachable("Invalid ArgType Kind!");
}

/// Build the ArgType for an ext-vector of \p NumElts elements whose element
/// type is this ArgType's T, keeping the same Name.  Returns an invalid
/// ArgType when T is null.
ArgType ArgType::makeVectorType(ASTContext &C, unsigned NumElts) const {
  // Check for valid vector element types.
  if (T.isNull())
    return ArgType::Invalid();

  QualType Vec = C.getExtVectorType(T, NumElts);
  return ArgType(Vec, Name);
}

/// Return a concrete QualType that stands for this ArgType, chosen per kind
/// below and wrapped in a pointer when Ptr is set.  Must not be called on
/// Invalid or Unknown ArgTypes.
QualType ArgType::getRepresentativeType(ASTContext &C) const {
  QualType Res;
  switch (K) {
    case InvalidTy:
      llvm_unreachable("No representative type for Invalid ArgType");
    case UnknownTy:
      llvm_unreachable("No representative type for Unknown ArgType");
    case AnyCharTy:
      Res = C.CharTy;
      break;
    case SpecificTy:
      Res = T;
      break;
    case CStrTy:
      Res = C.getPointerType(C.CharTy);
      break;
    case WCStrTy:
      Res = C.getPointerType(C.getWideCharType());
      break;
    case ObjCPointerTy:
      Res = C.ObjCBuiltinIdTy;
      break;
    case CPointerTy:
      Res = C.VoidPtrTy;
      break;
    case WIntTy: {
      Res = C.getWIntType();
      break;
    }
  }

  if (Ptr)
    Res = C.getPointerType(Res);
  return Res;
}

/// Return the quoted spelling of the representative type.  When a distinct
/// Name alias is available the result has the form "'alias' (aka 'type')",
/// otherwise just "'type'".
std::string ArgType::getRepresentativeTypeName(ASTContext &C) const {
  std::string S = getRepresentativeType(C).getAsString(C.getPrintingPolicy());

  std::string Alias;
  if (Name) {
    // Use a specific name for this type, e.g. "size_t".
    Alias = Name;
    if (Ptr) {
      // If ArgType is actually a pointer to T, append an asterisk.
      // NOTE(review): this indexes the last character of Alias, so it assumes
      // Name is never an empty string -- confirm against the callers.
      Alias += (Alias[Alias.size()-1] == '*') ? "*" : " *";
    }
    // If Alias is the same as the underlying type, e.g. wchar_t, then drop it.
    if (S == Alias)
      Alias.clear();
  }

  if (!Alias.empty())
    return std::string("'") + Alias + "' (aka '" + S + "')";
  return std::string("'") + S + "'";
}


//===----------------------------------------------------------------------===//
// Methods on OptionalAmount.
564 //===----------------------------------------------------------------------===// 565 566 ArgType 567 analyze_format_string::OptionalAmount::getArgType(ASTContext &Ctx) const { 568 return Ctx.IntTy; 569 } 570 571 //===----------------------------------------------------------------------===// 572 // Methods on LengthModifier. 573 //===----------------------------------------------------------------------===// 574 575 const char * 576 analyze_format_string::LengthModifier::toString() const { 577 switch (kind) { 578 case AsChar: 579 return "hh"; 580 case AsShort: 581 return "h"; 582 case AsShortLong: 583 return "hl"; 584 case AsLong: // or AsWideChar 585 return "l"; 586 case AsLongLong: 587 return "ll"; 588 case AsQuad: 589 return "q"; 590 case AsIntMax: 591 return "j"; 592 case AsSizeT: 593 return "z"; 594 case AsPtrDiff: 595 return "t"; 596 case AsInt32: 597 return "I32"; 598 case AsInt3264: 599 return "I"; 600 case AsInt64: 601 return "I64"; 602 case AsLongDouble: 603 return "L"; 604 case AsAllocate: 605 return "a"; 606 case AsMAllocate: 607 return "m"; 608 case AsWide: 609 return "w"; 610 case None: 611 return ""; 612 } 613 return nullptr; 614 } 615 616 //===----------------------------------------------------------------------===// 617 // Methods on ConversionSpecifier. 
618 //===----------------------------------------------------------------------===// 619 620 const char *ConversionSpecifier::toString() const { 621 switch (kind) { 622 case dArg: return "d"; 623 case DArg: return "D"; 624 case iArg: return "i"; 625 case oArg: return "o"; 626 case OArg: return "O"; 627 case uArg: return "u"; 628 case UArg: return "U"; 629 case xArg: return "x"; 630 case XArg: return "X"; 631 case fArg: return "f"; 632 case FArg: return "F"; 633 case eArg: return "e"; 634 case EArg: return "E"; 635 case gArg: return "g"; 636 case GArg: return "G"; 637 case aArg: return "a"; 638 case AArg: return "A"; 639 case cArg: return "c"; 640 case sArg: return "s"; 641 case pArg: return "p"; 642 case PArg: 643 return "P"; 644 case nArg: return "n"; 645 case PercentArg: return "%"; 646 case ScanListArg: return "["; 647 case InvalidSpecifier: return nullptr; 648 649 // POSIX unicode extensions. 650 case CArg: return "C"; 651 case SArg: return "S"; 652 653 // Objective-C specific specifiers. 654 case ObjCObjArg: return "@"; 655 656 // FreeBSD kernel specific specifiers. 657 case FreeBSDbArg: return "b"; 658 case FreeBSDDArg: return "D"; 659 case FreeBSDrArg: return "r"; 660 case FreeBSDyArg: return "y"; 661 662 // GlibC specific specifiers. 663 case PrintErrno: return "m"; 664 665 // MS specific specifiers. 666 case ZArg: return "Z"; 667 } 668 return nullptr; 669 } 670 671 Optional<ConversionSpecifier> 672 ConversionSpecifier::getStandardSpecifier() const { 673 ConversionSpecifier::Kind NewKind; 674 675 switch (getKind()) { 676 default: 677 return None; 678 case DArg: 679 NewKind = dArg; 680 break; 681 case UArg: 682 NewKind = uArg; 683 break; 684 case OArg: 685 NewKind = oArg; 686 break; 687 } 688 689 ConversionSpecifier FixedCS(*this); 690 FixedCS.setKind(NewKind); 691 return FixedCS; 692 } 693 694 //===----------------------------------------------------------------------===// 695 // Methods on OptionalAmount. 
//===----------------------------------------------------------------------===//

/// Write this amount to \p os in format-string syntax: nothing for Invalid or
/// NotSpecified, '*' or '*N$' for an argument-supplied amount, and the number
/// itself for a constant.  A leading '.' is written first when UsesDotPrefix
/// is set.
void OptionalAmount::toString(raw_ostream &os) const {
  switch (hs) {
  case Invalid:
  case NotSpecified:
    return;
  case Arg:
    if (UsesDotPrefix)
        os << ".";
    if (usesPositionalArg())
      os << "*" << getPositionalArgIndex() << "$";
    else
      os << "*";
    break;
  case Constant:
    if (UsesDotPrefix)
        os << ".";
    os << amt;
    break;
  }
}

/// Return true if this specifier's length modifier (LM) may be combined with
/// its conversion specifier (CS) for the given target and language options.
///
/// The outer switch selects on the length modifier; each case then lists the
/// conversion specifiers it accepts, some of them only on particular targets.
bool FormatSpecifier::hasValidLengthModifier(const TargetInfo &Target,
                                             const LangOptions &LO) const {
  switch (LM.getKind()) {
    case LengthModifier::None:
      return true;

    // Handle most integer flags
    case LengthModifier::AsShort:
      // Length modifier only applies to FP vectors.
      if (LO.OpenCL && CS.isDoubleArg())
        return !VectorNumElts.isInvalid();

      // With the MSVC runtime, 'h' is additionally accepted on the character
      // and string conversions listed here.
      if (Target.getTriple().isOSMSVCRT()) {
        switch (CS.getKind()) {
          case ConversionSpecifier::cArg:
          case ConversionSpecifier::CArg:
          case ConversionSpecifier::sArg:
          case ConversionSpecifier::SArg:
          case ConversionSpecifier::ZArg:
            return true;
          default:
            break;
        }
      }
      // Otherwise 'h' follows the same rules as the other integer modifiers.
      LLVM_FALLTHROUGH;
    case LengthModifier::AsChar:
    case LengthModifier::AsLongLong:
    case LengthModifier::AsQuad:
    case LengthModifier::AsIntMax:
    case LengthModifier::AsSizeT:
    case LengthModifier::AsPtrDiff:
      switch (CS.getKind()) {
        case ConversionSpecifier::dArg:
        case ConversionSpecifier::DArg:
        case ConversionSpecifier::iArg:
        case ConversionSpecifier::oArg:
        case ConversionSpecifier::OArg:
        case ConversionSpecifier::uArg:
        case ConversionSpecifier::UArg:
        case ConversionSpecifier::xArg:
        case ConversionSpecifier::XArg:
        case ConversionSpecifier::nArg:
          return true;
        // The FreeBSD kernel specifiers are only valid on the targets tested
        // below.
        case ConversionSpecifier::FreeBSDbArg:
          return Target.getTriple().isOSFreeBSD() ||
                 Target.getTriple().isPS4() ||
                 Target.getTriple().isOSOpenBSD();
        case ConversionSpecifier::FreeBSDrArg:
        case ConversionSpecifier::FreeBSDyArg:
          return Target.getTriple().isOSFreeBSD() || Target.getTriple().isPS4();
        default:
          return false;
      }

    case LengthModifier::AsShortLong:
      // 'hl' requires OpenCL and a valid vector element count.
      return LO.OpenCL && !VectorNumElts.isInvalid();

    // Handle 'l' flag
    case LengthModifier::AsLong: // or AsWideChar
      if (CS.isDoubleArg()) {
        // Invalid for OpenCL FP scalars.
        if (LO.OpenCL && VectorNumElts.isInvalid())
          return false;
        return true;
      }

      switch (CS.getKind()) {
        case ConversionSpecifier::dArg:
        case ConversionSpecifier::DArg:
        case ConversionSpecifier::iArg:
        case ConversionSpecifier::oArg:
        case ConversionSpecifier::OArg:
        case ConversionSpecifier::uArg:
        case ConversionSpecifier::UArg:
        case ConversionSpecifier::xArg:
        case ConversionSpecifier::XArg:
        case ConversionSpecifier::nArg:
        case ConversionSpecifier::cArg:
        case ConversionSpecifier::sArg:
        case ConversionSpecifier::ScanListArg:
        case ConversionSpecifier::ZArg:
          return true;
        case ConversionSpecifier::FreeBSDbArg:
          return Target.getTriple().isOSFreeBSD() ||
                 Target.getTriple().isPS4() ||
                 Target.getTriple().isOSOpenBSD();
        case ConversionSpecifier::FreeBSDrArg:
        case ConversionSpecifier::FreeBSDyArg:
          return Target.getTriple().isOSFreeBSD() || Target.getTriple().isPS4();
        default:
          return false;
      }

    case LengthModifier::AsLongDouble:
      switch (CS.getKind()) {
        case ConversionSpecifier::aArg:
        case ConversionSpecifier::AArg:
        case ConversionSpecifier::fArg:
        case ConversionSpecifier::FArg:
        case ConversionSpecifier::eArg:
        case ConversionSpecifier::EArg:
        case ConversionSpecifier::gArg:
        case ConversionSpecifier::GArg:
          return true;
        // GNU libc extension.
        case ConversionSpecifier::dArg:
        case ConversionSpecifier::iArg:
        case ConversionSpecifier::oArg:
        case ConversionSpecifier::uArg:
        case ConversionSpecifier::xArg:
        case ConversionSpecifier::XArg:
          return !Target.getTriple().isOSDarwin() &&
                 !Target.getTriple().isOSWindows();
        default:
          return false;
      }

    case LengthModifier::AsAllocate:
      switch (CS.getKind()) {
        case ConversionSpecifier::sArg:
        case ConversionSpecifier::SArg:
        case ConversionSpecifier::ScanListArg:
          return true;
        default:
          return false;
      }

    case LengthModifier::AsMAllocate:
      switch (CS.getKind()) {
        case ConversionSpecifier::cArg:
        case ConversionSpecifier::CArg:
        case ConversionSpecifier::sArg:
        case ConversionSpecifier::SArg:
        case ConversionSpecifier::ScanListArg:
          return true;
        default:
          return false;
      }
    // The 'I', 'I32' and 'I64' modifiers are only valid with the MSVC runtime.
    case LengthModifier::AsInt32:
    case LengthModifier::AsInt3264:
    case LengthModifier::AsInt64:
      switch (CS.getKind()) {
        case ConversionSpecifier::dArg:
        case ConversionSpecifier::iArg:
        case ConversionSpecifier::oArg:
        case ConversionSpecifier::uArg:
        case ConversionSpecifier::xArg:
        case ConversionSpecifier::XArg:
          return Target.getTriple().isOSMSVCRT();
        default:
          return false;
      }
    // The 'w' modifier is likewise only valid with the MSVC runtime.
    case LengthModifier::AsWide:
      switch (CS.getKind()) {
        case ConversionSpecifier::cArg:
        case ConversionSpecifier::CArg:
        case ConversionSpecifier::sArg:
        case ConversionSpecifier::SArg:
        case ConversionSpecifier::ZArg:
          return Target.getTriple().isOSMSVCRT();
        default:
          return false;
      }
  }
  llvm_unreachable("Invalid LengthModifier Kind!");
}

/// Return true if the length modifier is one of those this function treats as
/// standard; the extension modifiers listed in the second group return false.
bool FormatSpecifier::hasStandardLengthModifier() const {
  switch (LM.getKind()) {
    case LengthModifier::None:
    case LengthModifier::AsChar:
    case LengthModifier::AsShort:
    case LengthModifier::AsLong:
    case LengthModifier::AsLongLong:
    case LengthModifier::AsIntMax:
    case LengthModifier::AsSizeT:
    case LengthModifier::AsPtrDiff:
    case LengthModifier::AsLongDouble:
      return true;
    case LengthModifier::AsAllocate:
    case LengthModifier::AsMAllocate:
    case LengthModifier::AsQuad:
    case LengthModifier::AsInt32:
    case LengthModifier::AsInt3264:
    case LengthModifier::AsInt64:
    case LengthModifier::AsWide:
    case LengthModifier::AsShortLong: // ??? (original author's open question)
      return false;
  }
  llvm_unreachable("Invalid LengthModifier Kind!");
}

/// Return true if the conversion specifier is one this function treats as
/// standard.  'C' and 'S' are accepted only when \p LangOpt has ObjC set.
bool FormatSpecifier::hasStandardConversionSpecifier(
    const LangOptions &LangOpt) const {
  switch (CS.getKind()) {
    case ConversionSpecifier::cArg:
    case ConversionSpecifier::dArg:
    case ConversionSpecifier::iArg:
    case ConversionSpecifier::oArg:
    case ConversionSpecifier::uArg:
    case ConversionSpecifier::xArg:
    case ConversionSpecifier::XArg:
    case ConversionSpecifier::fArg:
    case ConversionSpecifier::FArg:
    case ConversionSpecifier::eArg:
    case ConversionSpecifier::EArg:
    case ConversionSpecifier::gArg:
    case ConversionSpecifier::GArg:
    case ConversionSpecifier::aArg:
    case ConversionSpecifier::AArg:
    case ConversionSpecifier::sArg:
    case ConversionSpecifier::pArg:
    case ConversionSpecifier::nArg:
    case ConversionSpecifier::ObjCObjArg:
    case ConversionSpecifier::ScanListArg:
    case ConversionSpecifier::PercentArg:
    case ConversionSpecifier::PArg:
      return true;
    case ConversionSpecifier::CArg:
    case ConversionSpecifier::SArg:
      return LangOpt.ObjC;
    case ConversionSpecifier::InvalidSpecifier:
    case ConversionSpecifier::FreeBSDbArg:
    case ConversionSpecifier::FreeBSDDArg:
    case ConversionSpecifier::FreeBSDrArg:
    case ConversionSpecifier::FreeBSDyArg:
    case ConversionSpecifier::PrintErrno:
    case ConversionSpecifier::DArg:
    case ConversionSpecifier::OArg:
    case ConversionSpecifier::UArg:
    case ConversionSpecifier::ZArg:
      return false;
  }
  llvm_unreachable("Invalid ConversionSpecifier Kind!");
}

/// Return false only for the 'L' length modifier combined with one of the
/// integer conversions listed below (or the FreeBSD 'b' conversion); every
/// other combination returns true.
bool FormatSpecifier::hasStandardLengthConversionCombination() const {
  if (LM.getKind() == LengthModifier::AsLongDouble) {
    switch(CS.getKind()) {
        case ConversionSpecifier::dArg:
        case ConversionSpecifier::iArg:
        case ConversionSpecifier::oArg:
        case ConversionSpecifier::uArg:
        case ConversionSpecifier::xArg:
        case ConversionSpecifier::XArg:
        case ConversionSpecifier::FreeBSDbArg:
          return false;
        default:
          return true;
    }
  }
  return true;
}

/// For an integer or 'n' conversion that uses the 'L' or 'q' length modifier,
/// return a copy of the modifier rewritten to 'll'.  Otherwise return None.
Optional<LengthModifier> FormatSpecifier::getCorrectedLengthModifier() const {
  if (CS.isAnyIntArg() || CS.getKind() == ConversionSpecifier::nArg) {
    if (LM.getKind() == LengthModifier::AsLongDouble ||
        LM.getKind() == LengthModifier::AsQuad) {
      LengthModifier FixedLM(LM);
      FixedLM.setKind(LengthModifier::AsLongLong);
      return FixedLM;
    }
  }

  return None;
}

/// Map a typedef'd type to the length modifier associated with its name.
///
/// Walks the chain of typedefs starting at \p QT (which must be a
/// TypedefType).  On the first name that is one of size_t, ssize_t, intmax_t,
/// uintmax_t or ptrdiff_t, sets \p LM accordingly and returns true.  Returns
/// false, leaving \p LM untouched, once the underlying type is no longer a
/// typedef.
bool FormatSpecifier::namedTypeToLengthModifier(QualType QT,
                                                LengthModifier &LM) {
  assert(isa<TypedefType>(QT) && "Expected a TypedefType");
  const TypedefNameDecl *Typedef = cast<TypedefType>(QT)->getDecl();

  for (;;) {
    const IdentifierInfo *Identifier = Typedef->getIdentifier();
    if (Identifier->getName() == "size_t") {
      LM.setKind(LengthModifier::AsSizeT);
      return true;
    } else if (Identifier->getName() == "ssize_t") {
      // Not C99, but common in Unix.
      LM.setKind(LengthModifier::AsSizeT);
      return true;
    } else if (Identifier->getName() == "intmax_t") {
      LM.setKind(LengthModifier::AsIntMax);
      return true;
    } else if (Identifier->getName() == "uintmax_t") {
      LM.setKind(LengthModifier::AsIntMax);
      return true;
    } else if (Identifier->getName() == "ptrdiff_t") {
      LM.setKind(LengthModifier::AsPtrDiff);
      return true;
    }

    // Not a recognized name: look through one more level of typedef, if any.
    QualType T = Typedef->getUnderlyingType();
    if (!isa<TypedefType>(T))
      break;

    Typedef = cast<TypedefType>(T)->getDecl();
  }
  return false;
}