//===- FormatVariadic.cpp - Format string parsing and analysis ----*-C++-*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception //===----------------------------------------------------------------------===// #include "llvm/Support/FormatVariadic.h" #include #include using namespace llvm; static std::optional translateLocChar(char C) { switch (C) { case '-': return AlignStyle::Left; case '=': return AlignStyle::Center; case '+': return AlignStyle::Right; default: return std::nullopt; } LLVM_BUILTIN_UNREACHABLE; } static bool consumeFieldLayout(StringRef &Spec, AlignStyle &Where, unsigned &Align, char &Pad) { Where = AlignStyle::Right; Align = 0; Pad = ' '; if (Spec.empty()) return true; if (Spec.size() > 1) { // A maximum of 2 characters at the beginning can be used for something // other than the width. // If Spec[1] is a loc char, then Spec[0] is a pad char and Spec[2:...] // contains the width. // Otherwise, if Spec[0] is a loc char, then Spec[1:...] contains the width. // Otherwise, Spec[0:...] contains the width. if (auto Loc = translateLocChar(Spec[1])) { Pad = Spec[0]; Where = *Loc; Spec = Spec.drop_front(2); } else if (auto Loc = translateLocChar(Spec[0])) { Where = *Loc; Spec = Spec.drop_front(1); } } bool Failed = Spec.consumeInteger(0, Align); return !Failed; } static std::optional parseReplacementItem(StringRef Spec) { StringRef RepString = Spec.trim("{}"); // If the replacement sequence does not start with a non-negative integer, // this is an error. char Pad = ' '; unsigned Align = 0; AlignStyle Where = AlignStyle::Right; StringRef Options; unsigned Index = ~0U; RepString = RepString.ltrim(); // If index is not specified, keep it ~0U to indicate unresolved index. RepString.consumeInteger(0, Index); if (RepString.consume_front(",")) { if (!consumeFieldLayout(RepString, Where, Align, Pad)) { assert(false && "Invalid replacement field layout specification!"); return std::nullopt; } } RepString = RepString.ltrim(); if (RepString.consume_front(":")) { Options = RepString; RepString = StringRef(); } RepString = RepString.trim(); if (!RepString.empty()) { assert(0 && "Unexpected characters found in replacement string!"); return std::nullopt; } return ReplacementItem(Spec, Index, Align, Where, Pad, Options); } static std::pair, StringRef> splitLiteralAndReplacement(StringRef Fmt) { assert(!Fmt.empty()); // Everything up until the first brace is a literal. if (Fmt.front() != '{') { size_t BO = Fmt.find_first_of('{'); return {ReplacementItem{Fmt.substr(0, BO)}, Fmt.substr(BO)}; } StringRef Braces = Fmt.take_while([](char C) { return C == '{'; }); // If there is more than one brace, then some of them are escaped. Treat // these as replacements. if (Braces.size() > 1) { size_t NumEscapedBraces = Braces.size() / 2; StringRef Middle = Fmt.take_front(NumEscapedBraces); StringRef Right = Fmt.drop_front(NumEscapedBraces * 2); return {ReplacementItem(Middle), Right}; } // An unterminated open brace is undefined. Assert to indicate that this is // undefined and that we consider it an error. When asserts are disabled, // build a replacement item with an error message. size_t BC = Fmt.find_first_of('}'); if (BC == StringRef::npos) { assert(false && "Unterminated brace sequence. Escape with {{ for a literal brace."); return {ReplacementItem("Unterminated brace sequence. Escape with {{ for a " "literal brace."), StringRef()}; } // Even if there is a closing brace, if there is another open brace before // this closing brace, treat this portion as literal, and try again with the // next one. size_t BO2 = Fmt.find_first_of('{', 1); if (BO2 < BC) return {ReplacementItem(Fmt.substr(0, BO2)), Fmt.substr(BO2)}; StringRef Spec = Fmt.slice(1, BC); StringRef Right = Fmt.substr(BC + 1); return {parseReplacementItem(Spec), Right}; } #ifndef NDEBUG #define ENABLE_VALIDATION 1 #else #define ENABLE_VALIDATION 0 // Conveniently enable validation in release mode. #endif SmallVector formatv_object_base::parseFormatString(StringRef Fmt, size_t NumArgs, bool Validate) { SmallVector Replacements; unsigned NextAutomaticIndex = 0; #if ENABLE_VALIDATION const StringRef SavedFmtStr = Fmt; unsigned NumExpectedArgs = 0; bool HasExplicitIndex = false; #endif while (!Fmt.empty()) { std::optional I; std::tie(I, Fmt) = splitLiteralAndReplacement(Fmt); if (!I) continue; if (I->Type == ReplacementType::Format) { if (I->Index == ~0U) I->Index = NextAutomaticIndex++; #if ENABLE_VALIDATION else HasExplicitIndex = true; NumExpectedArgs = std::max(NumExpectedArgs, I->Index + 1); #endif } Replacements.emplace_back(*I); } #if ENABLE_VALIDATION if (!Validate) return Replacements; // Perform additional validation. Verify that the number of arguments matches // the number of replacement indices and that there are no holes in the // replacement indices. // When validation fails, return an array of replacement items that // will print an error message as the outout of this formatv() (used when // validation is enabled in release mode). auto getErrorReplacements = [SavedFmtStr](StringLiteral ErrorMsg) { return SmallVector{ ReplacementItem("Invalid formatv() call: "), ReplacementItem(ErrorMsg), ReplacementItem(" for format string: "), ReplacementItem(SavedFmtStr)}; }; if (NumExpectedArgs != NumArgs) { errs() << formatv("Expected {} Args, but got {} for format string '{}'\n", NumExpectedArgs, NumArgs, SavedFmtStr); assert(0 && "Invalid formatv() call"); return getErrorReplacements("Unexpected number of arguments"); } // Find the number of unique indices seen. All replacement indices // are < NumExpectedArgs. SmallVector Indices(NumExpectedArgs); unsigned Count = 0; for (const ReplacementItem &I : Replacements) { if (I.Type != ReplacementType::Format || Indices[I.Index]) continue; Indices[I.Index] = true; ++Count; } if (Count != NumExpectedArgs) { errs() << formatv( "Replacement field indices cannot have holes for format string '{}'\n", SavedFmtStr); assert(0 && "Invalid format string"); return getErrorReplacements("Replacement indices have holes"); } // Fail validation if we see both automatic index and explicit index. if (NextAutomaticIndex != 0 && HasExplicitIndex) { errs() << formatv( "Cannot mix automatic and explicit indices for format string '{}'\n", SavedFmtStr); assert(0 && "Invalid format string"); return getErrorReplacements("Cannot mix automatic and explicit indices"); } #endif // ENABLE_VALIDATION return Replacements; } void support::detail::format_adapter::anchor() {}