forked from cataclysmbnteam/Cataclysm-BN
-
Notifications
You must be signed in to change notification settings - Fork 0
/
string_formatter.h
464 lines (444 loc) · 22 KB
/
string_formatter.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
#pragma once
#ifndef CATA_SRC_STRING_FORMATTER_H
#define CATA_SRC_STRING_FORMATTER_H
#include <cstddef>
#include <optional>
#include <string>
#include <string_view>
#include <type_traits>
#include <typeinfo>
#include <utility>
class translation;
template<typename T>
class string_id;
namespace cata
{
class string_formatter;
// wrapper to allow calling string_formatter::throw_error before the definition of string_formatter
[[noreturn]]
void throw_error( const string_formatter &, const std::string & );
// wrapper to access string_formatter::temp_buffer before the definition of string_formatter
std::string_view string_formatter_set_temp_buffer( const string_formatter &, std::string_view );
// Handle currently active exception from string_formatter and return it as string
std::string handle_string_format_error();
/**
* @defgroup string_formatter_convert Convert functions for @ref string_formatter
*
* The `convert` functions here are used to convert the input value of
* @ref string_formatter::parse into the requested type, as defined by the format specifiers.
*
* @tparam T the input type, as given by the call to `string_format`.
* @tparam RT the requested type. The `convert` functions return such a value or they throw
* an exception via @ref throw_error.
*
* Each function has the same parameters:
* The first parameter defines the requested type. The value of the pointer is ignored, callers
* should use a (properly cast) `nullptr`. It is required to "simulate" overloading the
* return value. E.g. `long convert(long*, int)` and `short convert(short*, int)` both convert
* an input value of type `int`, but the first converts to `long` and the second converts to
* `short`. Without the first parameter their signatures would be identical.
* The second parameter is used to call @ref throw_error / @ref string_formatter_set_temp_buffer.
* The third parameter is the input value that is to be converted.
* The fourth parameter is a dummy value, it is always ignored, callers should use `0` here.
* It is used so the fallback with the variadic arguments is *only* chosen when no other
* overload matches.
*/
/**@{*/
// Arithmetic types with `bool` excluded: printf has no notion of bool, so neither do we.
// References and cv-qualifiers are stripped (via decay) before the check.
template<typename T>
using is_numeric = std::bool_constant <
                   std::is_arithmetic_v<std::decay_t<T>> &&
                   !std::is_same_v<std::decay_t<T>, bool> >;
// Integer types only: numeric (see above), but neither floating point nor bool.
template<typename T>
using is_integer = std::bool_constant <
                   is_numeric<T>::value &&
                   !std::is_floating_point_v<std::decay_t<T>> >;
// Test for plain `char` (after decay). `signed char` and `unsigned char` are distinct
// types and therefore do not match.
template<typename T>
using is_char = std::bool_constant<std::is_same_v<std::decay_t<T>, char>>;
// Test for std::string (after stripping references and cv-qualifiers).
template<typename T>
using is_string = std::bool_constant<std::is_same_v<std::decay_t<T>, std::string>>;
// Test for std::string_view (after stripping references and cv-qualifiers).
template<typename T>
using is_string_view = std::bool_constant<std::is_same_v<std::decay_t<T>, std::string_view>>;
// Test for C-strings: `const char *` or `char *` after decay, which also covers
// character arrays such as string literals.
template<typename T>
using is_cstring = std::bool_constant <
                   std::is_same_v<std::decay_t<T>, const char *> ||
                   std::is_same_v<std::decay_t<T>, char *> >;
// Test for the class `translation` (after stripping references and cv-qualifiers).
template<typename T>
using is_translation = std::bool_constant<std::is_same_v<std::decay_t<T>, translation>>;
// Test for string_id<T>, built on a generic check whether a type is an instantiation
// of a given single-parameter class template. The primary template is the "no" answer.
template<typename Candidate, template<typename> class Template>
struct is_instance_of : std::false_type {
};
// Chosen when the candidate is exactly `Template<Arg>` for some `Arg`.
template<typename Arg, template<typename> class Template>
struct is_instance_of<Template<Arg>, Template> : std::true_type {
};
// True when the decayed type is some instantiation of the `string_id` template.
template<typename T>
using is_string_id = std::bool_constant<is_instance_of<std::decay_t<T>, string_id>::value>;
template<typename RT, typename T>
inline typename std::enable_if < is_integer<RT>::value &&is_integer<T>::value,
RT >::type convert( RT *, const string_formatter &, T &&value, int )
{
return value;
}
template<typename RT, typename T>
inline typename std::enable_if < is_integer<RT>::value
&&std::is_enum<typename std::decay<T>::type>::value,
RT >::type convert( RT *, const string_formatter &, T &&value, int )
{
return static_cast<RT>( value );
}
template<typename RT, typename T>
inline typename std::enable_if < std::is_floating_point<RT>::value &&is_numeric<T>::value
&&!is_integer<T>::value, RT >::type convert( RT *, const string_formatter &, T &&value, int )
{
return value;
}
// Any pointer argument requested as `void *` (for "%p"): constness of the pointee is
// cast away, then the pointer converts implicitly to `void *`.
template<typename RT, typename T>
inline std::enable_if_t <
( std::is_same_v<RT, void *> && std::is_pointer_v<std::decay_t<T>> ), void * >
convert( RT * /*requested_type*/, const string_formatter & /*sf*/, T &&value, int /*dummy*/ )
{
    using pointee_type = std::remove_pointer_t<std::decay_t<T>>;
    using mutable_pointer = std::remove_const_t<pointee_type> *;
    return const_cast<mutable_pointer>( value );
}
template<typename RT, typename T>
inline typename std::enable_if < std::is_same<RT, std::string_view>::value &&is_string<T>::value,
std::string_view >::type convert( RT *, const string_formatter &, T &&value, int )
{
return value;
}
template<typename RT, typename T>
inline typename std::enable_if < std::is_same<RT, std::string_view >::value
&&is_string_view<T>::value, std::string_view >::type
convert( RT *, const string_formatter &, T &&value, int )
{
return value;
}
// C-string argument (`const char *` / `char *`, including decayed character arrays)
// requested as a string view.
// A null pointer is rendered as the text "(null)" (what common printf implementations
// print for it) instead of being handed to the `std::string_view` constructor, whose
// behavior is undefined for a null pointer.
template<typename RT, typename T>
inline typename std::enable_if < std::is_same<RT, std::string_view>::value &&is_cstring<T>::value,
       std::string_view >::type convert( RT *, const string_formatter &, T &&value, int )
{
    // Decay explicitly first, so character arrays are handled exactly like pointers.
    const char *const text = value;
    if( text == nullptr ) {
        return std::string_view( "(null)" );
    }
    return std::string_view( text );
}
template<typename RT, typename T>
inline typename std::enable_if < std::is_same<RT, std::string_view>::value
&&is_translation<T>::value,
std::string_view >::type convert( RT *, const string_formatter &sf, T &&value, int )
{
return string_formatter_set_temp_buffer( sf, value.translated() );
}
template<typename RT, typename T>
inline typename std::enable_if < std::is_same<RT, std::string_view>::value &&is_string_id<T>::value,
std::string_view >::type convert( RT *, const string_formatter &sf, T &&value, int )
{
return string_formatter_set_temp_buffer( sf, value.str() );
}
template<typename RT, typename T>
inline typename std::enable_if < std::is_same<RT, std::string_view>::value &&is_numeric<T>::value
&&!is_char<T>::value, std::string_view >::type convert( RT *, const string_formatter &sf, T &&value,
int )
{
return string_formatter_set_temp_buffer( sf, std::to_string( value ) );
}
template<typename RT, typename T>
inline typename std::enable_if < std::is_same<RT, std::string_view>::value &&is_numeric<T>::value
&&is_char<T>::value, std::string_view >::type convert( RT *, const string_formatter &sf, T &&value,
int )
{
return string_formatter_set_temp_buffer( sf, std::string( 1, value ) );
}
// Fallback for every conversion not covered by the overloads above; the '...' parameter
// gives it the lowest overload priority.
// Two layers of checking happen here:
// - compile time: the static_assert rejects argument types that can never be printed,
//   so `string_format` with an unknown type fails to compile;
// - run time: a printable type that does not fit the requested type (e.g. a string for
//   a numeric conversion) raises an error via `throw_error`.
template<typename RT, typename T>
// NOLINTNEXTLINE(cert-dcl50-cpp)
inline RT convert( RT *, const string_formatter &sf, T &&, ... )
{
    using input_type = std::decay_t<T>;
    static_assert( std::is_pointer_v<input_type> ||
                   is_numeric<T>::value ||
                   is_string<T>::value ||
                   is_string_view<T>::value ||
                   is_char<T>::value ||
                   std::is_enum_v<input_type> ||
                   is_cstring<T>::value ||
                   is_translation<T>::value ||
                   is_string_id<T>::value,
                   "Unsupported argument type" );
    const std::string source_name = typeid( T ).name();
    const std::string target_name = typeid( RT ).name();
    throw_error( sf, "Tried to convert argument of type " + source_name + " to " +
                 target_name + ", which is not possible" );
}
/**@}*/
/**
 * Type-safe and undefined-behavior free wrapper over `sprintf`.
 * See @ref string_format for usage.
 * Basically it extracts the format specifiers and calls `sprintf` for each one separately
 * and with proper conversion of the input type.
 * For example `printf("%d", 7LL)` would yield undefined behavior as "%d" requires an `int`
 * as argument. This class detects the format specifier, converts every integer input to
 * `long long` and formats it with the "ll" length modifier.
 * Mismatches for which no `convert` overload exists, such as `printf("%d", "foo")` or an
 * integer passed to "%f", do not yield UB either: this class throws an exception instead.
 */
// Note: argument index is always 0-based *in this code*, but `printf` has 1-based arguments.
class string_formatter
{
    private:
        /// Complete format string, including all format specifiers (the string passed
        /// to @ref printf).
        const std::string_view format;
        /// Used during parsing to denote the *next* character in @ref format to be
        /// parsed.
        size_t current_index_in_format = 0;
        /// The formatted output string, filled during parsing of @ref format,
        /// so it's only valid after the parsing has completed.
        std::string output;
        /// The currently parsed format specifier. This is extracted from @ref format
        /// during parsing and given to @ref sprintf (along with the actual argument).
        /// It is filled and reset during parsing for each format specifier in @ref format.
        std::string current_format;
        /// The *index* (not number) of the next argument to be formatted via @ref current_format.
        int current_argument_index = 0;

        /// Return the next character from @ref format and increment @ref current_index_in_format.
        /// Returns a null-character when the end of the @ref format has been reached (and does not
        /// change @ref current_index_in_format).
        char consume_next_input();
        /// Returns (like @ref consume_next_input) the next character from @ref format, but
        /// does *not* change @ref current_index_in_format.
        char get_current_input() const;
        /// If the next character to read from @ref format is the given character, consume it
        /// (like @ref consume_next_input) and return `true`. Otherwise don't do anything at all
        /// and return `false`.
        bool consume_next_input_if( char c );
        /// Return whether @ref get_current_input has a decimal digit ('0'...'9').
        bool has_digit() const;
        /// Consume decimal digits, interpret them as integer and return it.
        /// A starting '0' is allowed. Leaves @ref format at the first non-digit
        /// character (or the end). Returns 0 if the first character is not a digit.
        int parse_integer();
        /// Read and consume format flag characters and append them to @ref current_format.
        /// Leaves @ref format at the first character that is not a flag (or the end).
        void read_flags();
        /// Read and forward to @ref current_format any width specifier from @ref format.
        /// Returns nothing if the width is not specified or if it is specified as fixed number,
        /// otherwise returns the index of the printf-argument to be used for the width.
        std::optional<int> read_width();
        /// See @ref read_width. This does the same, but for the precision specifier.
        std::optional<int> read_precision();
        /// Read and return the index of the printf-argument that is to be formatted. Returns
        /// nothing if @ref format does not refer to a specific index (caller should use
        /// @ref current_argument_index).
        std::optional<int> read_argument_index();
        // Helper for common logic in @ref read_width and @ref read_precision.
        std::optional<int> read_number_or_argument_index();

        /// Throws an exception containing the given message and the @ref format.
        [[noreturn]]
        void throw_error( const std::string &msg ) const;
        /// Free-function wrapper around the member @ref throw_error, usable by the `convert`
        /// functions that are defined before this class.
        friend void throw_error( const string_formatter &sf, const std::string &msg ) {
            sf.throw_error( msg );
        }

        /// Scratch storage for text that has to outlive a `convert` call. It is `mutable`
        /// because the `convert` functions only receive a const reference to the formatter.
        mutable std::string temp_buffer;
        /// Stores the given text in @ref temp_buffer and returns a view of the stored copy.
        /// This is used for printing non-strings through "%s". It *only* works because this
        /// prints each format specifier separately, so the content of @ref temp_buffer is
        /// only used once.
        friend std::string_view string_formatter_set_temp_buffer( const string_formatter &sf,
                std::string_view text ) {
            sf.temp_buffer = text;
            return std::string_view( sf.temp_buffer );
        }

        /**
         * Extracts a printf argument from the argument list and converts it to the requested type.
         * @tparam RT The type that the argument should be converted to.
         * @tparam current_index The index of the first of the supplied arguments.
         * @throws If there is no argument with the given index, or if the argument can not be
         * converted to the requested type (via @ref convert).
         */
        /**@{*/
        // End of recursion: no arguments are left, so the requested index does not exist.
        template<typename RT, unsigned int current_index>
        RT get_nth_arg_as( const unsigned int requested ) const {
            throw_error( "Requested argument " + std::to_string( requested ) +
                         " but input has only " + std::to_string( current_index )
                       );
        }
        // Recursive step: `head` is the argument with index `current_index`. It is either
        // converted, or skipped to continue the search in the remaining arguments.
        template<typename RT, unsigned int current_index, typename T, typename ...Args>
        RT get_nth_arg_as( const unsigned int requested, T &&head, Args &&... args ) const {
            if( requested > current_index ) {
                return get_nth_arg_as < RT, current_index + 1 > ( requested, std::forward<Args>( args )... );
            } else {
                return convert( static_cast<RT *>( nullptr ), *this, std::forward<T>( head ), 0 );
            }
        }
        /**@}*/

        /// Defined out of line. NOTE(review): presumably inserts the "ll" length modifier into
        /// @ref current_format (see the comment in @ref read_conversion) - confirm there.
        void add_long_long_length_modifier();
        /// Defined out of line. NOTE(review): presumably drops the ' ' / '+' flags from
        /// @ref current_format for the 'o' / 'x' / 'X' conversions - confirm there.
        void discard_oct_hex_sign_flag();

        /// Reads the optional length modifier and the conversion character from @ref format,
        /// fetches the argument with index @p format_arg_index converted to the type that
        /// matches the conversion, and hands it to the fitting @ref do_formating overload.
        /// @throws If the conversion character is not supported, or via @ref get_nth_arg_as.
        template<typename ...Args>
        void read_conversion( const int format_arg_index, Args &&... args ) {
            // Removes the prefix "ll", "l", "h" and "hh", "z", and "t".
            // We later add "ll" again and that
            // would interfere with the existing prefix. We convert *all* input to (un)signed
            // long long int and use the "ll" modifier all the time. This will print the
            // expected value all the time, even when the original modifier did not match.
            if( consume_next_input_if( 'l' ) ) {
                consume_next_input_if( 'l' );
            } else if( consume_next_input_if( 'h' ) ) {
                consume_next_input_if( 'h' );
            } else if( consume_next_input_if( 'z' ) ) {
                // done with it
            } else if( consume_next_input_if( 't' ) ) {
                // done with it
            }
            const char c = consume_next_input();
            current_format.push_back( c );
            switch( c ) {
                case 'c':
                    return do_formating( get_nth_arg_as<int, 0>( format_arg_index, std::forward<Args>( args )... ) );
                case 'd':
                case 'i':
                    add_long_long_length_modifier();
                    return do_formating( get_nth_arg_as<signed long long int, 0>( format_arg_index,
                                         std::forward<Args>( args )... ) );
                case 'o':
                case 'x':
                case 'X':
                    // Workaround for fmtlib prepending number with ' '/'+'
                    // when formatting with ' '/'+' flags and 'o'/'x'/'X' specifiers
                    discard_oct_hex_sign_flag();
                    // The remaining handling is shared with 'u'.
                    [[fallthrough]];
                case 'u':
                    add_long_long_length_modifier();
                    return do_formating( get_nth_arg_as<unsigned long long int, 0>( format_arg_index,
                                         std::forward<Args>( args )... ) );
                case 'a':
                case 'A':
                case 'g':
                case 'G':
                case 'f':
                case 'F':
                case 'e':
                case 'E':
                    return do_formating( get_nth_arg_as<double, 0>( format_arg_index, std::forward<Args>( args )... ) );
                case 'p':
                    return do_formating( get_nth_arg_as<void *, 0>( format_arg_index,
                                         std::forward<Args>( args )... ) );
                case 's':
                    return do_formating( get_nth_arg_as<std::string_view, 0>( format_arg_index,
                                         std::forward<Args>( args )... ) );
                default:
                    throw_error( "Unsupported format conversion: " + std::string( 1, c ) );
            }
        }

        /// Overloads for each argument type that @ref read_conversion can request; defined
        /// out of line. NOTE(review): presumably each formats @p value according to
        /// @ref current_format and appends the result to @ref output - confirm there.
        /**@{*/
        void do_formating( int value );
        void do_formating( signed long long int value );
        void do_formating( unsigned long long int value );
        void do_formating( double value );
        void do_formating( void *value );
        void do_formating( std::string_view value );
        /**@}*/

    public:
        /// @param format The format string as required by `sprintf`. Only a view is stored,
        /// so the viewed characters must stay valid for as long as this object is used.
        string_formatter( std::string_view format ) : format( format ) { }
        /// Does the actual `sprintf`. It uses @ref format and puts the formatted
        /// string into @ref output.
        /// Note: use @ref get_output to get the formatted string after a successful
        /// call to this function.
        /// @throws Exceptions when the arguments do not match the format specifiers,
        /// see @ref get_nth_arg_as, or when the format is invalid for whatever reason.
        /// Note: @ref string_format is a wrapper that handles those exceptions.
        template<typename ...Args>
        void parse( Args &&... args ) {
            output.reserve( format.size() );
            output.resize( 0 );
            current_index_in_format = 0;
            current_argument_index = 0;
            while( const char c = consume_next_input() ) {
                // Everything that is not part of a format specifier is copied verbatim.
                if( c != '%' ) {
                    output.push_back( c );
                    continue;
                }
                // "%%" is an escaped percent sign.
                if( consume_next_input_if( '%' ) ) {
                    output.push_back( '%' );
                    continue;
                }
                current_format = "%";
                const std::optional<int> format_arg_index = read_argument_index();
                read_flags();
                // Width / precision taken from an argument are written into the specifier
                // as a fixed number.
                if( const std::optional<int> width_argument_index = read_width() ) {
                    const int w = get_nth_arg_as<int, 0>( *width_argument_index, std::forward<Args>( args )... );
                    current_format += std::to_string( w );
                }
                if( const std::optional<int> precision_argument_index = read_precision() ) {
                    const int p = get_nth_arg_as<int, 0>( *precision_argument_index, std::forward<Args>( args )... );
                    current_format += std::to_string( p );
                }
                // Without an explicit argument index the arguments are used in order.
                const int arg = format_arg_index ? *format_arg_index : current_argument_index++;
                read_conversion( arg, std::forward<Args>( args )... );
            }
        }
        /// Returns a copy of the formatted string, see @ref parse.
        std::string get_output() const {
            return output;
        }
};
} // namespace cata
/**
* Simple wrapper over @ref string_formatter::parse. It catches any exceptions and returns
* some error string. Otherwise it just returns the formatted string.
*
* These functions perform string formatting according to the rules of the `printf` function,
* see `man 3 printf` or any other documentation.
*
* In short: the \p format parameter is a string with optional placeholders, which will be
* replaced with formatted data from the further arguments. The further arguments must have
* a type that matches the type expected by the placeholder.
* The placeholders look like this:
* - `%s` expects an argument of type `const char*`, `std::string`, `std::string_view` or
* numeric (which is converted to a string via `std::to_string`), which is inserted as is.
* - `%d` expects an argument of an integer type (int, short, ...), which is formatted as
* decimal number.
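* - `%f` expects a floating point argument (`float`, `double`, ...), which is formatted as
* decimal number. Integer arguments are not converted to floating point; passing one is
* reported as a format error.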
*
* There are more placeholders and options to them (see documentation of `printf`).
* Note that this wrapper (via @ref string_formatter) automatically converts the arguments
* to match the given format specifier (if possible) - see @ref string_formatter_convert.
*/
/**@{*/
template<typename ...Args>
inline std::string string_format( std::string_view format, Args &&...args )
{
try {
cata::string_formatter formatter( std::move( format ) );
formatter.parse( std::forward<Args>( args )... );
return formatter.get_output();
} catch( ... ) {
return cata::handle_string_format_error();
}
}
// Overload for a `translation` used as format: its translated text becomes the format
// string of the regular string_format call.
template<typename T, typename ...Args>
inline std::enable_if_t<cata::is_translation<T>::value, std::string>
string_format( T &&format, Args &&...args )
{
    return string_format( format.translated(), std::forward<Args>( args )... );
}
/**@}*/
/** Print string to stdout. */
void cata_print_stdout( const std::string &s );
/** Print string to stderr. */
void cata_print_stderr( const std::string &s );
/** Same as @ref string_format, but prints its result to stdout. */
/**@{*/
// Formats via string_format and hands the result to cata_print_stdout.
template<typename ...Args>
inline void cata_printf( std::string_view format, Args &&...args )
{
    cata_print_stdout( string_format( format, std::forward<Args>( args )... ) );
}
/**@}*/
#endif // CATA_SRC_STRING_FORMATTER_H