xref: /freebsd-src/contrib/kyua/utils/format/formatter.cpp (revision b0d29bc47dba79f6f38e67eabadfb4b32ffd9390)
1*b0d29bc4SBrooks Davis // Copyright 2010 The Kyua Authors.
2*b0d29bc4SBrooks Davis // All rights reserved.
3*b0d29bc4SBrooks Davis //
4*b0d29bc4SBrooks Davis // Redistribution and use in source and binary forms, with or without
5*b0d29bc4SBrooks Davis // modification, are permitted provided that the following conditions are
6*b0d29bc4SBrooks Davis // met:
7*b0d29bc4SBrooks Davis //
8*b0d29bc4SBrooks Davis // * Redistributions of source code must retain the above copyright
9*b0d29bc4SBrooks Davis //   notice, this list of conditions and the following disclaimer.
10*b0d29bc4SBrooks Davis // * Redistributions in binary form must reproduce the above copyright
11*b0d29bc4SBrooks Davis //   notice, this list of conditions and the following disclaimer in the
12*b0d29bc4SBrooks Davis //   documentation and/or other materials provided with the distribution.
13*b0d29bc4SBrooks Davis // * Neither the name of Google Inc. nor the names of its contributors
14*b0d29bc4SBrooks Davis //   may be used to endorse or promote products derived from this software
15*b0d29bc4SBrooks Davis //   without specific prior written permission.
16*b0d29bc4SBrooks Davis //
17*b0d29bc4SBrooks Davis // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18*b0d29bc4SBrooks Davis // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19*b0d29bc4SBrooks Davis // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20*b0d29bc4SBrooks Davis // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21*b0d29bc4SBrooks Davis // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22*b0d29bc4SBrooks Davis // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23*b0d29bc4SBrooks Davis // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24*b0d29bc4SBrooks Davis // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25*b0d29bc4SBrooks Davis // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26*b0d29bc4SBrooks Davis // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27*b0d29bc4SBrooks Davis // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28*b0d29bc4SBrooks Davis 
29*b0d29bc4SBrooks Davis #include "utils/format/formatter.hpp"
30*b0d29bc4SBrooks Davis 
31*b0d29bc4SBrooks Davis #include <memory>
32*b0d29bc4SBrooks Davis #include <string>
33*b0d29bc4SBrooks Davis #include <utility>
34*b0d29bc4SBrooks Davis 
35*b0d29bc4SBrooks Davis #include "utils/format/exceptions.hpp"
36*b0d29bc4SBrooks Davis #include "utils/sanity.hpp"
37*b0d29bc4SBrooks Davis #include "utils/text/exceptions.hpp"
38*b0d29bc4SBrooks Davis #include "utils/text/operations.ipp"
39*b0d29bc4SBrooks Davis 
40*b0d29bc4SBrooks Davis namespace format = utils::format;
41*b0d29bc4SBrooks Davis namespace text = utils::text;
42*b0d29bc4SBrooks Davis 
43*b0d29bc4SBrooks Davis 
44*b0d29bc4SBrooks Davis namespace {
45*b0d29bc4SBrooks Davis 
46*b0d29bc4SBrooks Davis 
47*b0d29bc4SBrooks Davis /// Finds the next placeholder in a string.
48*b0d29bc4SBrooks Davis ///
49*b0d29bc4SBrooks Davis /// \param format The original format string provided by the user; needed for
50*b0d29bc4SBrooks Davis ///     error reporting purposes only.
51*b0d29bc4SBrooks Davis /// \param expansion The string containing the placeholder to look for.  Any
52*b0d29bc4SBrooks Davis ///     '%%' in the string will be skipped, and they must be stripped later by
53*b0d29bc4SBrooks Davis ///     strip_double_percent().
54*b0d29bc4SBrooks Davis /// \param begin The position from which to start looking for the next
55*b0d29bc4SBrooks Davis ///     placeholder.
56*b0d29bc4SBrooks Davis ///
57*b0d29bc4SBrooks Davis /// \return The position in the string in which the placeholder is located and
58*b0d29bc4SBrooks Davis /// the placeholder itself.  If there are no placeholders left, this returns
59*b0d29bc4SBrooks Davis /// the length of the string and an empty string.
60*b0d29bc4SBrooks Davis ///
61*b0d29bc4SBrooks Davis /// \throw bad_format_error If the input string contains a trailing formatting
62*b0d29bc4SBrooks Davis ///     character.  We cannot detect any other kind of invalid formatter because
63*b0d29bc4SBrooks Davis ///     we do not implement a full parser for them.
64*b0d29bc4SBrooks Davis static std::pair< std::string::size_type, std::string >
find_next_placeholder(const std::string & format,const std::string & expansion,std::string::size_type begin)65*b0d29bc4SBrooks Davis find_next_placeholder(const std::string& format,
66*b0d29bc4SBrooks Davis                       const std::string& expansion,
67*b0d29bc4SBrooks Davis                       std::string::size_type begin)
68*b0d29bc4SBrooks Davis {
69*b0d29bc4SBrooks Davis     begin = expansion.find('%', begin);
70*b0d29bc4SBrooks Davis     while (begin != std::string::npos && expansion[begin + 1] == '%')
71*b0d29bc4SBrooks Davis         begin = expansion.find('%', begin + 2);
72*b0d29bc4SBrooks Davis     if (begin == std::string::npos)
73*b0d29bc4SBrooks Davis         return std::make_pair(expansion.length(), "");
74*b0d29bc4SBrooks Davis     if (begin == expansion.length() - 1)
75*b0d29bc4SBrooks Davis         throw format::bad_format_error(format, "Trailing %");
76*b0d29bc4SBrooks Davis 
77*b0d29bc4SBrooks Davis     std::string::size_type end = begin + 1;
78*b0d29bc4SBrooks Davis     while (end < expansion.length() && expansion[end] != 's')
79*b0d29bc4SBrooks Davis         end++;
80*b0d29bc4SBrooks Davis     const std::string placeholder = expansion.substr(begin, end - begin + 1);
81*b0d29bc4SBrooks Davis     if (end == expansion.length() ||
82*b0d29bc4SBrooks Davis         placeholder.find('%', 1) != std::string::npos)
83*b0d29bc4SBrooks Davis         throw format::bad_format_error(format, "Unterminated placeholder '" +
84*b0d29bc4SBrooks Davis                                        placeholder + "'");
85*b0d29bc4SBrooks Davis     return std::make_pair(begin, placeholder);
86*b0d29bc4SBrooks Davis }
87*b0d29bc4SBrooks Davis 
88*b0d29bc4SBrooks Davis 
89*b0d29bc4SBrooks Davis /// Converts a string to an integer.
90*b0d29bc4SBrooks Davis ///
91*b0d29bc4SBrooks Davis /// \param format The format string; for error reporting purposes only.
92*b0d29bc4SBrooks Davis /// \param str The string to conver.
93*b0d29bc4SBrooks Davis /// \param what The name of the field this integer belongs to; for error
94*b0d29bc4SBrooks Davis ///     reporting purposes only.
95*b0d29bc4SBrooks Davis ///
96*b0d29bc4SBrooks Davis /// \return An integer representing the input string.
97*b0d29bc4SBrooks Davis inline int
to_int(const std::string & format,const std::string & str,const char * what)98*b0d29bc4SBrooks Davis to_int(const std::string& format, const std::string& str, const char* what)
99*b0d29bc4SBrooks Davis {
100*b0d29bc4SBrooks Davis     try {
101*b0d29bc4SBrooks Davis         return text::to_type< int >(str);
102*b0d29bc4SBrooks Davis     } catch (const text::value_error& e) {
103*b0d29bc4SBrooks Davis         throw format::bad_format_error(format, "Invalid " + std::string(what) +
104*b0d29bc4SBrooks Davis                                        "specifier");
105*b0d29bc4SBrooks Davis     }
106*b0d29bc4SBrooks Davis }
107*b0d29bc4SBrooks Davis 
108*b0d29bc4SBrooks Davis 
109*b0d29bc4SBrooks Davis /// Constructs an std::ostringstream based on a formatting placeholder.
110*b0d29bc4SBrooks Davis ///
111*b0d29bc4SBrooks Davis /// \param format The format placeholder; may be empty.
112*b0d29bc4SBrooks Davis ///
113*b0d29bc4SBrooks Davis /// \return A new std::ostringstream that is prepared to format a single
114*b0d29bc4SBrooks Davis /// object in the manner specified by the format placeholder.
115*b0d29bc4SBrooks Davis ///
116*b0d29bc4SBrooks Davis /// \throw bad_format_error If the format string is bad.  We do minimal
117*b0d29bc4SBrooks Davis ///     validation on this string though.
118*b0d29bc4SBrooks Davis static std::ostringstream*
new_ostringstream(const std::string & format)119*b0d29bc4SBrooks Davis new_ostringstream(const std::string& format)
120*b0d29bc4SBrooks Davis {
121*b0d29bc4SBrooks Davis     std::auto_ptr< std::ostringstream > output(new std::ostringstream());
122*b0d29bc4SBrooks Davis 
123*b0d29bc4SBrooks Davis     if (format.length() <= 2) {
124*b0d29bc4SBrooks Davis         // If the format is empty, we create a new stream so that we don't have
125*b0d29bc4SBrooks Davis         // to check for NULLs later on.  We rarely should hit this condition
126*b0d29bc4SBrooks Davis         // (and when we do it's a bug in the caller), so this is not a big deal.
127*b0d29bc4SBrooks Davis         //
128*b0d29bc4SBrooks Davis         // Otherwise, if the format is a regular '%s', then we don't have to do
129*b0d29bc4SBrooks Davis         // any processing for additional formatters.  So this is just a "fast
130*b0d29bc4SBrooks Davis         // path".
131*b0d29bc4SBrooks Davis     } else {
132*b0d29bc4SBrooks Davis         std::string partial = format.substr(1, format.length() - 2);
133*b0d29bc4SBrooks Davis         if (partial[0] == '0') {
134*b0d29bc4SBrooks Davis             output->fill('0');
135*b0d29bc4SBrooks Davis             partial.erase(0, 1);
136*b0d29bc4SBrooks Davis         }
137*b0d29bc4SBrooks Davis         if (!partial.empty()) {
138*b0d29bc4SBrooks Davis             const std::string::size_type dot = partial.find('.');
139*b0d29bc4SBrooks Davis             if (dot != 0)
140*b0d29bc4SBrooks Davis                 output->width(to_int(format, partial.substr(0, dot), "width"));
141*b0d29bc4SBrooks Davis             if (dot != std::string::npos) {
142*b0d29bc4SBrooks Davis                 output->setf(std::ios::fixed, std::ios::floatfield);
143*b0d29bc4SBrooks Davis                 output->precision(to_int(format, partial.substr(dot + 1),
144*b0d29bc4SBrooks Davis                                          "precision"));
145*b0d29bc4SBrooks Davis             }
146*b0d29bc4SBrooks Davis         }
147*b0d29bc4SBrooks Davis     }
148*b0d29bc4SBrooks Davis 
149*b0d29bc4SBrooks Davis     return output.release();
150*b0d29bc4SBrooks Davis }
151*b0d29bc4SBrooks Davis 
152*b0d29bc4SBrooks Davis 
/// Collapses every '%%' into a single '%' within a range of a string.
///
/// \param in The string to rewrite; it is not modified.
/// \param begin The offset of the first character of the range.
/// \param end The offset one past the last character of the range.
///
/// \return A copy of the input in which the range has been rewritten, paired
/// with the number of characters that were dropped from it.
static std::pair< std::string, int >
strip_double_percent(const std::string& in, const std::string::size_type begin,
                     std::string::size_type end)
{
    const std::string range = in.substr(begin, end - begin);

    std::string collapsed;
    collapsed.reserve(range.length());
    int dropped = 0;
    for (std::string::size_type i = 0; i < range.length(); ++i) {
        collapsed += range[i];
        // When a '%' is directly followed by another one, keep just the one
        // already copied and jump over its twin so it cannot pair up again.
        const bool escaped = range[i] == '%' && i + 1 < range.length() &&
            range[i + 1] == '%';
        if (escaped) {
            ++i;
            ++dropped;
        }
    }

    const std::string head = in.substr(0, begin);
    const std::string tail = in.substr(end);
    return std::make_pair(head + collapsed + tail, dropped);
}
176*b0d29bc4SBrooks Davis 
177*b0d29bc4SBrooks Davis 
178*b0d29bc4SBrooks Davis }  // anonymous namespace
179*b0d29bc4SBrooks Davis 
180*b0d29bc4SBrooks Davis 
181*b0d29bc4SBrooks Davis /// Performs internal initialization of the formatter.
182*b0d29bc4SBrooks Davis ///
183*b0d29bc4SBrooks Davis /// This is separate from the constructor just because it is shared by different
184*b0d29bc4SBrooks Davis /// overloaded constructors.
185*b0d29bc4SBrooks Davis void
init(void)186*b0d29bc4SBrooks Davis format::formatter::init(void)
187*b0d29bc4SBrooks Davis {
188*b0d29bc4SBrooks Davis     const std::pair< std::string::size_type, std::string > placeholder =
189*b0d29bc4SBrooks Davis         find_next_placeholder(_format, _expansion, _last_pos);
190*b0d29bc4SBrooks Davis     const std::pair< std::string, int > no_percents =
191*b0d29bc4SBrooks Davis         strip_double_percent(_expansion, _last_pos, placeholder.first);
192*b0d29bc4SBrooks Davis 
193*b0d29bc4SBrooks Davis     _oss = new_ostringstream(placeholder.second);
194*b0d29bc4SBrooks Davis 
195*b0d29bc4SBrooks Davis     _expansion = no_percents.first;
196*b0d29bc4SBrooks Davis     _placeholder_pos = placeholder.first - no_percents.second;
197*b0d29bc4SBrooks Davis     _placeholder = placeholder.second;
198*b0d29bc4SBrooks Davis }
199*b0d29bc4SBrooks Davis 
200*b0d29bc4SBrooks Davis 
201*b0d29bc4SBrooks Davis /// Constructs a new formatter object (internal).
202*b0d29bc4SBrooks Davis ///
203*b0d29bc4SBrooks Davis /// \param format The format string.
204*b0d29bc4SBrooks Davis /// \param expansion The format string with any replacements performed so far.
205*b0d29bc4SBrooks Davis /// \param last_pos The position from which to start looking for formatting
206*b0d29bc4SBrooks Davis ///     placeholders.  This must be maintained in case one of the replacements
207*b0d29bc4SBrooks Davis ///     introduced a new placeholder, which must be ignored.  Think, for
208*b0d29bc4SBrooks Davis ///     example, replacing a "%s" string with "foo %s".
formatter(const std::string & format,const std::string & expansion,const std::string::size_type last_pos)209*b0d29bc4SBrooks Davis format::formatter::formatter(const std::string& format,
210*b0d29bc4SBrooks Davis                              const std::string& expansion,
211*b0d29bc4SBrooks Davis                              const std::string::size_type last_pos) :
212*b0d29bc4SBrooks Davis     _format(format),
213*b0d29bc4SBrooks Davis     _expansion(expansion),
214*b0d29bc4SBrooks Davis     _last_pos(last_pos),
215*b0d29bc4SBrooks Davis     _oss(NULL)
216*b0d29bc4SBrooks Davis {
217*b0d29bc4SBrooks Davis     init();
218*b0d29bc4SBrooks Davis }
219*b0d29bc4SBrooks Davis 
220*b0d29bc4SBrooks Davis 
221*b0d29bc4SBrooks Davis /// Constructs a new formatter object.
222*b0d29bc4SBrooks Davis ///
223*b0d29bc4SBrooks Davis /// \param format The format string.  The formatters in the string are not
224*b0d29bc4SBrooks Davis ///     validated during construction, but will cause errors when used later if
225*b0d29bc4SBrooks Davis ///     they are invalid.
formatter(const std::string & format)226*b0d29bc4SBrooks Davis format::formatter::formatter(const std::string& format) :
227*b0d29bc4SBrooks Davis     _format(format),
228*b0d29bc4SBrooks Davis     _expansion(format),
229*b0d29bc4SBrooks Davis     _last_pos(0),
230*b0d29bc4SBrooks Davis     _oss(NULL)
231*b0d29bc4SBrooks Davis {
232*b0d29bc4SBrooks Davis     init();
233*b0d29bc4SBrooks Davis }
234*b0d29bc4SBrooks Davis 
235*b0d29bc4SBrooks Davis 
~formatter(void)236*b0d29bc4SBrooks Davis format::formatter::~formatter(void)
237*b0d29bc4SBrooks Davis {
238*b0d29bc4SBrooks Davis     delete _oss;
239*b0d29bc4SBrooks Davis }
240*b0d29bc4SBrooks Davis 
241*b0d29bc4SBrooks Davis 
242*b0d29bc4SBrooks Davis /// Returns the formatted string.
243*b0d29bc4SBrooks Davis ///
244*b0d29bc4SBrooks Davis /// \return A string representation of the formatted string.
245*b0d29bc4SBrooks Davis const std::string&
str(void) const246*b0d29bc4SBrooks Davis format::formatter::str(void) const
247*b0d29bc4SBrooks Davis {
248*b0d29bc4SBrooks Davis     return _expansion;
249*b0d29bc4SBrooks Davis }
250*b0d29bc4SBrooks Davis 
251*b0d29bc4SBrooks Davis 
252*b0d29bc4SBrooks Davis /// Automatic conversion of formatter objects to strings.
253*b0d29bc4SBrooks Davis ///
254*b0d29bc4SBrooks Davis /// This is provided to allow painless injection of formatter objects into
255*b0d29bc4SBrooks Davis /// streams, without having to manually call the str() method.
operator const std::string&(void) const256*b0d29bc4SBrooks Davis format::formatter::operator const std::string&(void) const
257*b0d29bc4SBrooks Davis {
258*b0d29bc4SBrooks Davis     return _expansion;
259*b0d29bc4SBrooks Davis }
260*b0d29bc4SBrooks Davis 
261*b0d29bc4SBrooks Davis 
262*b0d29bc4SBrooks Davis /// Specialization of operator% for booleans.
263*b0d29bc4SBrooks Davis ///
264*b0d29bc4SBrooks Davis /// \param value The boolean to inject into the format string.
265*b0d29bc4SBrooks Davis ///
266*b0d29bc4SBrooks Davis /// \return A new formatter that has one less format placeholder.
267*b0d29bc4SBrooks Davis format::formatter
operator %(const bool & value) const268*b0d29bc4SBrooks Davis format::formatter::operator%(const bool& value) const
269*b0d29bc4SBrooks Davis {
270*b0d29bc4SBrooks Davis     (*_oss) << (value ? "true" : "false");
271*b0d29bc4SBrooks Davis     return replace(_oss->str());
272*b0d29bc4SBrooks Davis }
273*b0d29bc4SBrooks Davis 
274*b0d29bc4SBrooks Davis 
275*b0d29bc4SBrooks Davis /// Replaces the first formatting placeholder with a value.
276*b0d29bc4SBrooks Davis ///
277*b0d29bc4SBrooks Davis /// \param arg The replacement string.
278*b0d29bc4SBrooks Davis ///
279*b0d29bc4SBrooks Davis /// \return A new formatter in which the first formatting placeholder has been
280*b0d29bc4SBrooks Davis ///     replaced by arg and is ready to replace the next item.
281*b0d29bc4SBrooks Davis ///
282*b0d29bc4SBrooks Davis /// \throw utils::format::extra_args_error If there are no more formatting
283*b0d29bc4SBrooks Davis ///     placeholders in the input string, or if the placeholder is invalid.
284*b0d29bc4SBrooks Davis format::formatter
replace(const std::string & arg) const285*b0d29bc4SBrooks Davis format::formatter::replace(const std::string& arg) const
286*b0d29bc4SBrooks Davis {
287*b0d29bc4SBrooks Davis     if (_placeholder_pos == _expansion.length())
288*b0d29bc4SBrooks Davis         throw format::extra_args_error(_format, arg);
289*b0d29bc4SBrooks Davis 
290*b0d29bc4SBrooks Davis     const std::string expansion = _expansion.substr(0, _placeholder_pos)
291*b0d29bc4SBrooks Davis         + arg + _expansion.substr(_placeholder_pos + _placeholder.length());
292*b0d29bc4SBrooks Davis     return formatter(_format, expansion, _placeholder_pos + arg.length());
293*b0d29bc4SBrooks Davis }
294