1 // -*- C++ -*-
2 //===----------------------------------------------------------------------===//
3 //
4 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
5 // See https://llvm.org/LICENSE.txt for license information.
6 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //
8 //===----------------------------------------------------------------------===//
9
10 #ifndef _LIBCPP___FORMAT_FORMATTER_INTEGRAL_H
11 #define _LIBCPP___FORMAT_FORMATTER_INTEGRAL_H
12
13 #include <__charconv/to_chars_integral.h>
14 #include <__charconv/to_chars_result.h>
15 #include <__charconv/traits.h>
16 #include <__concepts/arithmetic.h>
17 #include <__concepts/same_as.h>
18 #include <__config>
19 #include <__format/concepts.h>
20 #include <__format/format_error.h>
21 #include <__format/formatter_output.h>
22 #include <__format/parser_std_format_spec.h>
23 #include <__iterator/concepts.h>
24 #include <__iterator/iterator_traits.h>
25 #include <__memory/pointer_traits.h>
26 #include <__system_error/errc.h>
27 #include <__type_traits/make_unsigned.h>
28 #include <__utility/unreachable.h>
29 #include <array>
30 #include <limits>
31 #include <string>
32 #include <string_view>
33
34 #ifndef _LIBCPP_HAS_NO_LOCALIZATION
35 # include <__locale>
36 #endif
37
38 #if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER)
39 # pragma GCC system_header
40 #endif
41
42 _LIBCPP_PUSH_MACROS
43 #include <__undef_macros>
44
45 _LIBCPP_BEGIN_NAMESPACE_STD
46
47 #if _LIBCPP_STD_VER >= 20
48
49 namespace __formatter {
50
51 //
52 // Generic
53 //
54
55 template <contiguous_iterator _Iterator>
56 requires same_as<char, iter_value_t<_Iterator>>
__insert_sign(_Iterator __buf,bool __negative,__format_spec::__sign __sign)57 _LIBCPP_HIDE_FROM_ABI inline _Iterator __insert_sign(_Iterator __buf, bool __negative, __format_spec::__sign __sign) {
58 if (__negative)
59 *__buf++ = '-';
60 else
61 switch (__sign) {
62 case __format_spec::__sign::__default:
63 case __format_spec::__sign::__minus:
64 // No sign added.
65 break;
66 case __format_spec::__sign::__plus:
67 *__buf++ = '+';
68 break;
69 case __format_spec::__sign::__space:
70 *__buf++ = ' ';
71 break;
72 }
73
74 return __buf;
75 }
76
77 /**
78 * Determines the required grouping based on the size of the input.
79 *
80 * The grouping's last element will be repeated. For simplicity this repeating
81 * is unwrapped based on the length of the input. (When the input is short some
82 * groups are not processed.)
83 *
84 * @returns The size of the groups to write. This means the number of
85 * separator characters written is size() - 1.
86 *
87 * @note Since zero-sized groups cause issues they are silently ignored.
88 *
89 * @note The grouping field of the locale is always a @c std::string,
90 * regardless whether the @c std::numpunct's type is @c char or @c wchar_t.
91 */
__determine_grouping(ptrdiff_t __size,const string & __grouping)92 _LIBCPP_HIDE_FROM_ABI inline string __determine_grouping(ptrdiff_t __size, const string& __grouping) {
93 _LIBCPP_ASSERT_INTERNAL(!__grouping.empty() && __size > __grouping[0],
94 "The slow grouping formatting is used while there will be no separators written");
95 string __r;
96 auto __end = __grouping.end() - 1;
97 auto __ptr = __grouping.begin();
98
99 while (true) {
100 __size -= *__ptr;
101 if (__size > 0)
102 __r.push_back(*__ptr);
103 else {
104 // __size <= 0 so the value pushed will be <= *__ptr.
105 __r.push_back(*__ptr + __size);
106 return __r;
107 }
108
109 // Proceed to the next group.
110 if (__ptr != __end) {
111 do {
112 ++__ptr;
113 // Skip grouping with a width of 0.
114 } while (*__ptr == 0 && __ptr != __end);
115 }
116 }
117
118 __libcpp_unreachable();
119 }
120
121 //
122 // Char
123 //
124
125 template <__fmt_char_type _CharT>
126 _LIBCPP_HIDE_FROM_ABI auto
127 __format_char(integral auto __value,
128 output_iterator<const _CharT&> auto __out_it,
129 __format_spec::__parsed_specifications<_CharT> __specs) -> decltype(__out_it) {
130 using _Tp = decltype(__value);
131 if constexpr (!same_as<_CharT, _Tp>) {
132 // cmp_less and cmp_greater can't be used for character types.
133 if constexpr (signed_integral<_CharT> == signed_integral<_Tp>) {
134 if (__value < numeric_limits<_CharT>::min() || __value > numeric_limits<_CharT>::max())
135 std::__throw_format_error("Integral value outside the range of the char type");
136 } else if constexpr (signed_integral<_CharT>) {
137 // _CharT is signed _Tp is unsigned
138 if (__value > static_cast<make_unsigned_t<_CharT>>(numeric_limits<_CharT>::max()))
139 std::__throw_format_error("Integral value outside the range of the char type");
140 } else {
141 // _CharT is unsigned _Tp is signed
142 if (__value < 0 || static_cast<make_unsigned_t<_Tp>>(__value) > numeric_limits<_CharT>::max())
143 std::__throw_format_error("Integral value outside the range of the char type");
144 }
145 }
146
147 const auto __c = static_cast<_CharT>(__value);
148 return __formatter::__write(std::addressof(__c), std::addressof(__c) + 1, std::move(__out_it), __specs);
149 }
150
151 //
152 // Integer
153 //
154
155 /** Wrapper around @ref to_chars, returning the output iterator. */
156 template <contiguous_iterator _Iterator, integral _Tp>
157 requires same_as<char, iter_value_t<_Iterator>>
__to_buffer(_Iterator __first,_Iterator __last,_Tp __value,int __base)158 _LIBCPP_HIDE_FROM_ABI _Iterator __to_buffer(_Iterator __first, _Iterator __last, _Tp __value, int __base) {
159 // TODO FMT Evaluate code overhead due to not calling the internal function
160 // directly. (Should be zero overhead.)
161 to_chars_result __r = std::to_chars(std::to_address(__first), std::to_address(__last), __value, __base);
162 _LIBCPP_ASSERT_INTERNAL(__r.ec == errc(0), "Internal buffer too small");
163 auto __diff = __r.ptr - std::to_address(__first);
164 return __first + __diff;
165 }
166
167 /**
168 * Helper to determine the buffer size to output a integer in Base @em x.
169 *
170 * There are several overloads for the supported bases. The function uses the
171 * base as template argument so it can be used in a constant expression.
172 */
173 template <unsigned_integral _Tp, size_t _Base>
__buffer_size()174 consteval size_t __buffer_size() noexcept
175 requires(_Base == 2)
176 {
177 return numeric_limits<_Tp>::digits // The number of binary digits.
178 + 2 // Reserve space for the '0[Bb]' prefix.
179 + 1; // Reserve space for the sign.
180 }
181
182 template <unsigned_integral _Tp, size_t _Base>
__buffer_size()183 consteval size_t __buffer_size() noexcept
184 requires(_Base == 8)
185 {
186 return numeric_limits<_Tp>::digits // The number of binary digits.
187 / 3 // Adjust to octal.
188 + 1 // Turn floor to ceil.
189 + 1 // Reserve space for the '0' prefix.
190 + 1; // Reserve space for the sign.
191 }
192
193 template <unsigned_integral _Tp, size_t _Base>
__buffer_size()194 consteval size_t __buffer_size() noexcept
195 requires(_Base == 10)
196 {
197 return numeric_limits<_Tp>::digits10 // The floored value.
198 + 1 // Turn floor to ceil.
199 + 1; // Reserve space for the sign.
200 }
201
202 template <unsigned_integral _Tp, size_t _Base>
__buffer_size()203 consteval size_t __buffer_size() noexcept
204 requires(_Base == 16)
205 {
206 return numeric_limits<_Tp>::digits // The number of binary digits.
207 / 4 // Adjust to hexadecimal.
208 + 2 // Reserve space for the '0[Xx]' prefix.
209 + 1; // Reserve space for the sign.
210 }
211
212 template <class _OutIt, contiguous_iterator _Iterator, class _CharT>
213 requires same_as<char, iter_value_t<_Iterator>>
__write_using_decimal_separators(_OutIt __out_it,_Iterator __begin,_Iterator __first,_Iterator __last,string && __grouping,_CharT __sep,__format_spec::__parsed_specifications<_CharT> __specs)214 _LIBCPP_HIDE_FROM_ABI _OutIt __write_using_decimal_separators(
215 _OutIt __out_it,
216 _Iterator __begin,
217 _Iterator __first,
218 _Iterator __last,
219 string&& __grouping,
220 _CharT __sep,
221 __format_spec::__parsed_specifications<_CharT> __specs) {
222 int __size = (__first - __begin) + // [sign][prefix]
223 (__last - __first) + // data
224 (__grouping.size() - 1); // number of separator characters
225
226 __padding_size_result __padding = {0, 0};
227 if (__specs.__alignment_ == __format_spec::__alignment::__zero_padding) {
228 // Write [sign][prefix].
229 __out_it = __formatter::__copy(__begin, __first, std::move(__out_it));
230
231 if (__specs.__width_ > __size) {
232 // Write zero padding.
233 __padding.__before_ = __specs.__width_ - __size;
234 __out_it = __formatter::__fill(std::move(__out_it), __specs.__width_ - __size, _CharT('0'));
235 }
236 } else {
237 if (__specs.__width_ > __size) {
238 // Determine padding and write padding.
239 __padding = __formatter::__padding_size(__size, __specs.__width_, __specs.__alignment_);
240
241 __out_it = __formatter::__fill(std::move(__out_it), __padding.__before_, __specs.__fill_);
242 }
243 // Write [sign][prefix].
244 __out_it = __formatter::__copy(__begin, __first, std::move(__out_it));
245 }
246
247 auto __r = __grouping.rbegin();
248 auto __e = __grouping.rend() - 1;
249 _LIBCPP_ASSERT_INTERNAL(
250 __r != __e, "The slow grouping formatting is used while there will be no separators written.");
251 // The output is divided in small groups of numbers to write:
252 // - A group before the first separator.
253 // - A separator and a group, repeated for the number of separators.
254 // - A group after the last separator.
255 // This loop achieves that process by testing the termination condition
256 // midway in the loop.
257 //
258 // TODO FMT This loop evaluates the loop invariant `__parser.__type !=
259 // _Flags::_Type::__hexadecimal_upper_case` for every iteration. (This test
260 // happens in the __write call.) Benchmark whether making two loops and
261 // hoisting the invariant is worth the effort.
262 while (true) {
263 if (__specs.__std_.__type_ == __format_spec::__type::__hexadecimal_upper_case) {
264 __last = __first + *__r;
265 __out_it = __formatter::__transform(__first, __last, std::move(__out_it), __hex_to_upper);
266 __first = __last;
267 } else {
268 __out_it = __formatter::__copy(__first, *__r, std::move(__out_it));
269 __first += *__r;
270 }
271
272 if (__r == __e)
273 break;
274
275 ++__r;
276 *__out_it++ = __sep;
277 }
278
279 return __formatter::__fill(std::move(__out_it), __padding.__after_, __specs.__fill_);
280 }
281
282 template <unsigned_integral _Tp, contiguous_iterator _Iterator, class _CharT, class _FormatContext>
283 requires same_as<char, iter_value_t<_Iterator>>
__format_integer(_Tp __value,_FormatContext & __ctx,__format_spec::__parsed_specifications<_CharT> __specs,bool __negative,_Iterator __begin,_Iterator __end,const char * __prefix,int __base)284 _LIBCPP_HIDE_FROM_ABI typename _FormatContext::iterator __format_integer(
285 _Tp __value,
286 _FormatContext& __ctx,
287 __format_spec::__parsed_specifications<_CharT> __specs,
288 bool __negative,
289 _Iterator __begin,
290 _Iterator __end,
291 const char* __prefix,
292 int __base) {
293 _Iterator __first = __formatter::__insert_sign(__begin, __negative, __specs.__std_.__sign_);
294 if (__specs.__std_.__alternate_form_ && __prefix)
295 while (*__prefix)
296 *__first++ = *__prefix++;
297
298 _Iterator __last = __formatter::__to_buffer(__first, __end, __value, __base);
299
300 # ifndef _LIBCPP_HAS_NO_LOCALIZATION
301 if (__specs.__std_.__locale_specific_form_) {
302 const auto& __np = std::use_facet<numpunct<_CharT>>(__ctx.locale());
303 string __grouping = __np.grouping();
304 ptrdiff_t __size = __last - __first;
305 // Writing the grouped form has more overhead than the normal output
306 // routines. If there will be no separators written the locale-specific
307 // form is identical to the normal routine. Test whether to grouped form
308 // is required.
309 if (!__grouping.empty() && __size > __grouping[0])
310 return __formatter::__write_using_decimal_separators(
311 __ctx.out(),
312 __begin,
313 __first,
314 __last,
315 __formatter::__determine_grouping(__size, __grouping),
316 __np.thousands_sep(),
317 __specs);
318 }
319 # endif
320 auto __out_it = __ctx.out();
321 if (__specs.__alignment_ != __format_spec::__alignment::__zero_padding)
322 __first = __begin;
323 else {
324 // __buf contains [sign][prefix]data
325 // ^ location of __first
326 // The zero padding is done like:
327 // - Write [sign][prefix]
328 // - Write data right aligned with '0' as fill character.
329 __out_it = __formatter::__copy(__begin, __first, std::move(__out_it));
330 __specs.__alignment_ = __format_spec::__alignment::__right;
331 __specs.__fill_.__data[0] = _CharT('0');
332 int32_t __size = __first - __begin;
333
334 __specs.__width_ -= std::min(__size, __specs.__width_);
335 }
336
337 if (__specs.__std_.__type_ != __format_spec::__type::__hexadecimal_upper_case) [[likely]]
338 return __formatter::__write(__first, __last, __ctx.out(), __specs);
339
340 return __formatter::__write_transformed(__first, __last, __ctx.out(), __specs, __formatter::__hex_to_upper);
341 }
342
343 template <unsigned_integral _Tp, class _CharT, class _FormatContext>
344 _LIBCPP_HIDE_FROM_ABI typename _FormatContext::iterator
345 __format_integer(_Tp __value,
346 _FormatContext& __ctx,
347 __format_spec::__parsed_specifications<_CharT> __specs,
348 bool __negative = false) {
349 switch (__specs.__std_.__type_) {
350 case __format_spec::__type::__binary_lower_case: {
351 array<char, __formatter::__buffer_size<decltype(__value), 2>()> __array;
352 return __formatter::__format_integer(__value, __ctx, __specs, __negative, __array.begin(), __array.end(), "0b", 2);
353 }
354 case __format_spec::__type::__binary_upper_case: {
355 array<char, __formatter::__buffer_size<decltype(__value), 2>()> __array;
356 return __formatter::__format_integer(__value, __ctx, __specs, __negative, __array.begin(), __array.end(), "0B", 2);
357 }
358 case __format_spec::__type::__octal: {
359 // Octal is special; if __value == 0 there's no prefix.
360 array<char, __formatter::__buffer_size<decltype(__value), 8>()> __array;
361 return __formatter::__format_integer(
362 __value, __ctx, __specs, __negative, __array.begin(), __array.end(), __value != 0 ? "0" : nullptr, 8);
363 }
364 case __format_spec::__type::__default:
365 case __format_spec::__type::__decimal: {
366 array<char, __formatter::__buffer_size<decltype(__value), 10>()> __array;
367 return __formatter::__format_integer(
368 __value, __ctx, __specs, __negative, __array.begin(), __array.end(), nullptr, 10);
369 }
370 case __format_spec::__type::__hexadecimal_lower_case: {
371 array<char, __formatter::__buffer_size<decltype(__value), 16>()> __array;
372 return __formatter::__format_integer(__value, __ctx, __specs, __negative, __array.begin(), __array.end(), "0x", 16);
373 }
374 case __format_spec::__type::__hexadecimal_upper_case: {
375 array<char, __formatter::__buffer_size<decltype(__value), 16>()> __array;
376 return __formatter::__format_integer(__value, __ctx, __specs, __negative, __array.begin(), __array.end(), "0X", 16);
377 }
378 default:
379 _LIBCPP_ASSERT_INTERNAL(false, "The parse function should have validated the type");
380 __libcpp_unreachable();
381 }
382 }
383
384 template <signed_integral _Tp, class _CharT, class _FormatContext>
385 _LIBCPP_HIDE_FROM_ABI typename _FormatContext::iterator
__format_integer(_Tp __value,_FormatContext & __ctx,__format_spec::__parsed_specifications<_CharT> __specs)386 __format_integer(_Tp __value, _FormatContext& __ctx, __format_spec::__parsed_specifications<_CharT> __specs) {
387 // Depending on the std-format-spec string the sign and the value
388 // might not be outputted together:
389 // - alternate form may insert a prefix string.
390 // - zero-padding may insert additional '0' characters.
391 // Therefore the value is processed as a positive unsigned value.
392 // The function @ref __insert_sign will a '-' when the value was negative.
393 auto __r = std::__to_unsigned_like(__value);
394 bool __negative = __value < 0;
395 if (__negative)
396 __r = std::__complement(__r);
397
398 return __formatter::__format_integer(__r, __ctx, __specs, __negative);
399 }
400
401 //
402 // Formatter arithmetic (bool)
403 //
404
405 template <class _CharT>
406 struct _LIBCPP_TEMPLATE_VIS __bool_strings;
407
408 template <>
409 struct _LIBCPP_TEMPLATE_VIS __bool_strings<char> {
410 static constexpr string_view __true{"true"};
411 static constexpr string_view __false{"false"};
412 };
413
414 # ifndef _LIBCPP_HAS_NO_WIDE_CHARACTERS
415 template <>
416 struct _LIBCPP_TEMPLATE_VIS __bool_strings<wchar_t> {
417 static constexpr wstring_view __true{L"true"};
418 static constexpr wstring_view __false{L"false"};
419 };
420 # endif
421
422 template <class _CharT, class _FormatContext>
423 _LIBCPP_HIDE_FROM_ABI typename _FormatContext::iterator
424 __format_bool(bool __value, _FormatContext& __ctx, __format_spec::__parsed_specifications<_CharT> __specs) {
425 # ifndef _LIBCPP_HAS_NO_LOCALIZATION
426 if (__specs.__std_.__locale_specific_form_) {
427 const auto& __np = std::use_facet<numpunct<_CharT>>(__ctx.locale());
428 basic_string<_CharT> __str = __value ? __np.truename() : __np.falsename();
429 return __formatter::__write_string_no_precision(basic_string_view<_CharT>{__str}, __ctx.out(), __specs);
430 }
431 # endif
432 basic_string_view<_CharT> __str =
433 __value ? __formatter::__bool_strings<_CharT>::__true : __formatter::__bool_strings<_CharT>::__false;
434 return __formatter::__write(__str.begin(), __str.end(), __ctx.out(), __specs);
435 }
436
437 } // namespace __formatter
438
439 #endif //_LIBCPP_STD_VER >= 20
440
441 _LIBCPP_END_NAMESPACE_STD
442
443 _LIBCPP_POP_MACROS
444
445 #endif // _LIBCPP___FORMAT_FORMATTER_INTEGRAL_H
446